diff --git a/lib/lxml/ElementInclude.py b/lib/lxml/ElementInclude.py
new file mode 100644
index 00000000..f7806709
--- /dev/null
+++ b/lib/lxml/ElementInclude.py
@@ -0,0 +1,223 @@
+#
+# ElementTree
+# $Id: ElementInclude.py 1862 2004-06-18 07:31:02Z Fredrik $
+#
+# limited xinclude support for element trees
+#
+# history:
+# 2003-08-15 fl   created
+# 2003-11-14 fl   fixed default loader
+#
+# Copyright (c) 2003-2004 by Fredrik Lundh.  All rights reserved.
+#
+# fredrik@pythonware.com
+# http://www.pythonware.com
+#
+# --------------------------------------------------------------------
+# The ElementTree toolkit is
+#
+# Copyright (c) 1999-2004 by Fredrik Lundh
+#
+# By obtaining, using, and/or copying this software and/or its
+# associated documentation, you agree that you have read, understood,
+# and will comply with the following terms and conditions:
+#
+# Permission to use, copy, modify, and distribute this software and
+# its associated documentation for any purpose and without fee is
+# hereby granted, provided that the above copyright notice appears in
+# all copies, and that both that copyright notice and this permission
+# notice appear in supporting documentation, and that the name of
+# Secret Labs AB or the author not be used in advertising or publicity
+# pertaining to distribution of the software without specific, written
+# prior permission.
+#
+# SECRET LABS AB AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH REGARD
+# TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANT-
+# ABILITY AND FITNESS.  IN NO EVENT SHALL SECRET LABS AB OR THE AUTHOR
+# BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY
+# DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,
+# WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
+# ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE
+# OF THIS SOFTWARE.
+# --------------------------------------------------------------------
+
+"""
+Limited XInclude support for the ElementTree package.
+
+While lxml.etree has full support for XInclude (see
+`etree.ElementTree.xinclude()`), this module provides a simpler, pure
+Python, ElementTree compatible implementation that supports a simple
+form of custom URL resolvers.
+"""
+
+from lxml import etree
+import copy
+try:
+    from urlparse import urljoin
+    from urllib2 import urlopen
+except ImportError:
+    # Python 3
+    from urllib.parse import urljoin
+    from urllib.request import urlopen
+
+try:
+    set
+except NameError:
+    # Python 2.3
+    from sets import Set as set
+
+XINCLUDE = "{http://www.w3.org/2001/XInclude}"
+
+XINCLUDE_INCLUDE = XINCLUDE + "include"
+XINCLUDE_FALLBACK = XINCLUDE + "fallback"
+
+##
+# Fatal include error.
+
+class FatalIncludeError(etree.LxmlSyntaxError):  # raised by _include() for malformed or unloadable directives
+    pass
+
+##
+# ET compatible default loader.
+# This loader reads an included resource from disk.
+#
+# @param href Resource reference.
+# @param parse Parse mode.  Either "xml" or "text".
+# @param encoding Optional text encoding.
+# @return The expanded resource.  If the parse mode is "xml", this
+#    is the root element of the parsed document.  If the parse mode
+#    is "text", this is a Unicode string.  If the loader fails, it can
+#    return None or raise an IOError exception.
+# @throws IOError If the loader fails to load the resource.
+
+def default_loader(href, parse, encoding=None):
+    """Load `href` from disk: root element for parse == "xml", else decoded text."""
+    source = open(href, 'rb')  # binary mode; text is decoded explicitly below
+    try:  # try/finally rather than "with": the module still caters for old Pythons
+        if parse == "xml":
+            return etree.parse(source).getroot()
+        # every other parse mode is read as text; utf-8 is the fallback encoding
+        return source.read().decode(encoding or 'utf-8')
+    finally:
+        # runs on errors too, so a failed parse/decode no longer leaks the handle
+        source.close()
+
+##
+# Default loader used by lxml.etree - handles custom resolvers properly
+# 
+
+def _lxml_default_loader(href, parse, encoding=None, parser=None):
+    """Load `href` as a parsed root element ("xml") or as decoded text."""
+    if parse == "xml":
+        # the href goes to etree.parse() unopened, together with the parser
+        return etree.parse(href, parser).getroot()
+    if "://" in href:
+        f = urlopen(href)  # anything containing "://" is fetched as a URL
+    else:
+        f = open(href, 'rb')
+    try:
+        data = f.read()
+    finally:
+        f.close()  # release the handle even when read() raises
+    return data.decode(encoding or 'utf-8')  # utf-8 unless an encoding was given
+
+##
+# Wrapper for ET compatibility - drops the parser
+
+def _wrap_et_loader(loader):
+    def load(href, parse, encoding=None, parser=None):  # accepts the extra 'parser' keyword
+        return loader(href, parse, encoding)  # ...but does not forward it to the wrapped loader
+    return load
+
+
+##
+# Expand XInclude directives.
+#
+# @param elem Root element.
+# @param loader Optional resource loader.  If omitted, the internal
+#     lxml loader is used.  If given, it should be a callable
+#     that implements the same interface as <b>default_loader</b>.
+# @throws FatalIncludeError If the function fails to include a given
+#     resource, or if the tree contains malformed XInclude elements.
+# @throws IOError If the function fails to load a given resource.
+# @returns the node or its replacement if it was an XInclude node
+
+def include(elem, loader=None, base_url=None):
+    if base_url is None:
+        if hasattr(elem, 'getroot'):  # duck-typing: a tree object was passed in
+            tree = elem
+            elem = elem.getroot()
+        else:
+            tree = elem.getroottree()
+        if hasattr(tree, 'docinfo'):
+            base_url = tree.docinfo.URL  # default base: the URL recorded for the document
+    elif hasattr(elem, 'getroot'):
+        elem = elem.getroot()  # explicit base_url given: only unwrap the tree
+    _include(elem, loader, base_url=base_url)  # NOTE(review): the result (a replaced root) is discarded
+
+def _include(elem, loader=None, _parent_hrefs=None, base_url=None):
+    """Expand the XInclude directives below `elem`; return elem or its replacement."""
+    if loader is not None:
+        load_include = _wrap_et_loader(loader)
+    else:
+        load_include = _lxml_default_loader
+
+    if _parent_hrefs is None:
+        _parent_hrefs = set()  # hrefs of the documents currently being expanded
+
+    parser = elem.getroottree().parser
+
+    # snapshot all elements in the XInclude namespace: the loop edits the tree
+    include_elements = list(elem.iter(XINCLUDE + '*'))
+    for e in include_elements:
+        if e.tag == XINCLUDE_INCLUDE:
+            # process xinclude directive
+            href = urljoin(base_url, e.get("href"))
+            parse = e.get("parse", "xml")
+            parent = e.getparent()
+            if parse == "xml":
+                if href in _parent_hrefs:
+                    raise FatalIncludeError(
+                        "recursive include of %r detected" % href
+                        )
+                # recurse with a *copy* plus href, so siblings may include it again
+                node = load_include(href, parse, parser=parser)
+                if node is None:
+                    raise FatalIncludeError(
+                        "cannot load %r as %r" % (href, parse)
+                        )
+                node = _include(node, loader, _parent_hrefs | set([href]), base_url=href)
+                if e.tail:
+                    node.tail = (node.tail or "") + e.tail
+                if parent is None:
+                    return node # replaced the root node!
+                parent.replace(e, node)
+            elif parse == "text":
+                text = load_include(href, parse, encoding=e.get("encoding"))
+                if text is None:
+                    raise FatalIncludeError(
+                        "cannot load %r as %r" % (href, parse)
+                        )
+                predecessor = e.getprevious()
+                if predecessor is not None:
+                    predecessor.tail = (predecessor.tail or "") + text + (e.tail or "")
+                elif parent is None:
+                    return text # replaced the root node!
+                else:
+                    parent.text = (parent.text or "") + text + (e.tail or "")
+                parent.remove(e)  # e.tail was copied above in both branches
+            else:
+                raise FatalIncludeError(
+                    "unknown parse type in xi:include tag (%r)" % parse
+                )
+        elif e.tag == XINCLUDE_FALLBACK:
+            parent = e.getparent()
+            if parent is not None and parent.tag != XINCLUDE_INCLUDE:
+                raise FatalIncludeError(
+                    "xi:fallback tag must be child of xi:include (%r)" % e.tag
+                    )
+        else:
+            raise FatalIncludeError(
+                "Invalid element found in XInclude namespace (%r)" % e.tag
+                )
+    return elem
diff --git a/lib/lxml/__init__.py b/lib/lxml/__init__.py
new file mode 100644
index 00000000..07cbe3a2
--- /dev/null
+++ b/lib/lxml/__init__.py
@@ -0,0 +1,20 @@
+# this is a package
+
+def get_include():
+    """
+    Return the list of header include paths (for lxml itself, libxml2
+    and libxslt) that are needed to compile C code against lxml when
+    it was built with statically linked libraries.
+    """
+    import os
+    package_dir = __path__[0]
+    headers_dir = os.path.join(package_dir, 'includes')
+
+    # every directory directly inside 'includes' is an include path, too
+    candidates = [os.path.join(headers_dir, entry)
+                  for entry in os.listdir(headers_dir)]
+    subdirs = [candidate for candidate in candidates
+               if os.path.isdir(candidate)]
+
+    return [headers_dir, package_dir] + subdirs
+
diff --git a/lib/lxml/_elementpath.py b/lib/lxml/_elementpath.py
new file mode 100644
index 00000000..bc9176e8
--- /dev/null
+++ b/lib/lxml/_elementpath.py
@@ -0,0 +1,306 @@
+#
+# ElementTree
+# $Id: ElementPath.py 3375 2008-02-13 08:05:08Z fredrik $
+#
+# limited xpath support for element trees
+#
+# history:
+# 2003-05-23 fl   created
+# 2003-05-28 fl   added support for // etc
+# 2003-08-27 fl   fixed parsing of periods in element names
+# 2007-09-10 fl   new selection engine
+# 2007-09-12 fl   fixed parent selector
+# 2007-09-13 fl   added iterfind; changed findall to return a list
+# 2007-11-30 fl   added namespaces support
+# 2009-10-30 fl   added child element value filter
+#
+# Copyright (c) 2003-2009 by Fredrik Lundh.  All rights reserved.
+#
+# fredrik@pythonware.com
+# http://www.pythonware.com
+#
+# --------------------------------------------------------------------
+# The ElementTree toolkit is
+#
+# Copyright (c) 1999-2009 by Fredrik Lundh
+#
+# By obtaining, using, and/or copying this software and/or its
+# associated documentation, you agree that you have read, understood,
+# and will comply with the following terms and conditions:
+#
+# Permission to use, copy, modify, and distribute this software and
+# its associated documentation for any purpose and without fee is
+# hereby granted, provided that the above copyright notice appears in
+# all copies, and that both that copyright notice and this permission
+# notice appear in supporting documentation, and that the name of
+# Secret Labs AB or the author not be used in advertising or publicity
+# pertaining to distribution of the software without specific, written
+# prior permission.
+#
+# SECRET LABS AB AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH REGARD
+# TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANT-
+# ABILITY AND FITNESS.  IN NO EVENT SHALL SECRET LABS AB OR THE AUTHOR
+# BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY
+# DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,
+# WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
+# ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE
+# OF THIS SOFTWARE.
+# --------------------------------------------------------------------
+
+##
+# Implementation module for XPath support.  There's usually no reason
+# to import this module directly; the <b>ElementTree</b> does this for
+# you, if needed.
+##
+
+import re
+
+xpath_tokenizer_re = re.compile(
+    "("  # group 1: operators and quoted strings
+    "'[^']*'|\"[^\"]*\"|"  # single- or double-quoted string literal
+    "::|"
+    "//?|"  # "/" or "//"
+    "\.\.|"
+    "\(\)|"
+    "[/.*:\[\]\(\)@=])|"  # single-character operators; closes group 1
+    "((?:\{[^}]+\})?[^/\[\]\(\)@=\s]+)|"  # group 2: a name, optionally prefixed with {uri}
+    "\s+"  # whitespace matches but fills neither group
+    )
+
+def xpath_tokenizer(pattern, namespaces=None):
+    for token in xpath_tokenizer_re.findall(pattern):  # each token is an (operator, name) pair
+        tag = token[1]
+        if tag and tag[0] != "{" and ":" in tag:  # "prefix:name" that is not yet in {uri}name form
+            try:
+                prefix, uri = tag.split(":", 1)  # NOTE: 'uri' actually holds the local name
+                if not namespaces:
+                    raise KeyError  # no prefix map at all: report like an unknown prefix
+                yield token[0], "{%s}%s" % (namespaces[prefix], uri)
+            except KeyError:
+                raise SyntaxError("prefix %r not found in prefix map" % prefix)
+        else:
+            yield token  # operators and unprefixed names pass through unchanged
+
+
+def prepare_child(next, token):
+    name = token[1]  # the name half of the (operator, name) token
+    def select(result):
+        for parent in result:
+            for child in parent.iterchildren(name):
+                yield child
+    return select
+
+def prepare_star(next, token):
+    def select(result):
+        for parent in result:
+            for child in parent.iterchildren('*'):  # wildcard step
+                yield child
+    return select
+
+def prepare_self(next, token):
+    def select(result):
+        return result  # "." step: hand the incoming nodes through unchanged
+    return select
+
+def prepare_descendant(next, token):
+    step = next()  # "//" consumes the following token as its target
+    if step[0] == "*":
+        wanted = "*"
+    elif step[0]:
+        raise SyntaxError("invalid descendant")
+    else:
+        wanted = step[1]  # no operator part, so this is a plain name
+    def select(result):
+        for ancestor in result:
+            for descendant in ancestor.iterdescendants(wanted):
+                yield descendant
+    return select
+
+def prepare_parent(next, token):
+    def select(result):
+        for child in result:
+            owner = child.getparent()
+            if owner is not None:  # nodes without a parent select nothing
+                yield owner
+    return select
+
+def prepare_predicate(next, token):
+    # FIXME: replace with real parser!!! refs:
+    # http://effbot.org/zone/simple-iterator-parser.htm
+    # http://javascript.crockford.com/tdop/tdop.html
+    signature = []  # one entry per token: the operator, "'" for a string, "-" for a name
+    predicate = []  # the matching token values (names / string contents)
+    while 1:
+        token = next()
+        if token[0] == "]":
+            break  # end of the [...] predicate
+        if token[0] and token[0][:1] in "'\"":
+            token = "'", token[0][1:-1]  # normalise quoted strings: strip the quotes
+        signature.append(token[0] or "-")
+        predicate.append(token[1])
+    signature = "".join(signature)
+    # use signature to determine predicate type
+    if signature == "@-":
+        # [@attribute] predicate
+        key = predicate[1]
+        def select(result):
+            for elem in result:
+                if elem.get(key) is not None:
+                    yield elem
+        return select
+    if signature == "@-='":
+        # [@attribute='value']
+        key = predicate[1]
+        value = predicate[-1]
+        def select(result):
+            for elem in result:
+                if elem.get(key) == value:
+                    yield elem
+        return select
+    if signature == "-" and not re.match("-?\d+$", predicate[0]):  # a name, not an integer index
+        # [tag]
+        tag = predicate[0]
+        def select(result):
+            for elem in result:
+                for _ in elem.iterchildren(tag):
+                    yield elem
+                    break  # one matching child is enough; yield elem only once
+        return select
+    if signature == "-='" and not re.match("-?\d+$", predicate[0]):
+        # [tag='value']
+        tag = predicate[0]
+        value = predicate[-1]
+        def select(result):
+            for elem in result:
+                for e in elem.iterchildren(tag):
+                    if "".join(e.itertext()) == value:  # compares the child's complete text content
+                        yield elem
+                        break
+        return select
+    if signature == "-" or signature == "-()" or signature == "-()-":
+        # [index] or [last()] or [last()-index]
+        if signature == "-":
+            # [index]
+            index = int(predicate[0]) - 1  # path indices are 1-based, list indices 0-based
+            if index < 0:
+                if index == -1:
+                    raise SyntaxError(
+                        "indices in path predicates are 1-based, not 0-based")
+                else:
+                    raise SyntaxError("path index >= 1 expected")
+        else:
+            if predicate[0] != "last":
+                raise SyntaxError("unsupported function")
+            if signature == "-()-":
+                try:
+                    index = int(predicate[2]) - 1  # predicate[2] is the "-N" token, so this is negative
+                except ValueError:
+                    raise SyntaxError("unsupported expression")
+            else:
+                index = -1  # [last()]: the final same-tag sibling
+        def select(result):
+            for elem in result:
+                parent = elem.getparent()
+                if parent is None:
+                    continue  # no parent, hence no sibling position to test
+                try:
+                    # FIXME: what if the selector is "*" ?
+                    elems = list(parent.iterchildren(elem.tag))  # position counts same-tag siblings only
+                    if elems[index] is elem:
+                        yield elem
+                except IndexError:
+                    pass  # index beyond the number of siblings: no match
+        return select
+    raise SyntaxError("invalid predicate")
+
+ops = {  # maps the operator part of a token to the function that builds its selector
+    "": prepare_child,  # empty operator: the token is a plain name
+    "*": prepare_star,
+    ".": prepare_self,
+    "..": prepare_parent,
+    "//": prepare_descendant,
+    "[": prepare_predicate,
+    }
+
+_cache = {}  # compiled selector lists, filled by _build_path_iterator()
+
+# --------------------------------------------------------------------
+
+def _build_path_iterator(path, namespaces):
+    """Compile `path` into a list of selector functions, cached per path + prefix map."""
+    if path[-1:] == "/":
+        path = path + "*" # implicit all (FIXME: keep this?)
+    cache_key = (path, namespaces and tuple(sorted(namespaces.items())) or None)
+    try:
+        return _cache[cache_key]
+    except KeyError:
+        pass
+    if len(_cache) > 100:
+        _cache.clear()  # crude size bound: drop everything and start over
+    if path[:1] == "/":
+        raise SyntaxError("cannot use absolute path on element")
+    stream = iter(xpath_tokenizer(path, namespaces))
+    try:
+        _next = stream.next
+    except AttributeError:
+        # Python 3
+        _next = stream.__next__
+    try:
+        token = _next()
+    except StopIteration:
+        raise SyntaxError("empty path expression")
+    selector = []
+    while 1:
+        try:
+            selector.append(ops[token[0]](_next, token))
+        except StopIteration:
+            raise SyntaxError("invalid path")  # a step ran out of tokens
+        try:
+            token = _next()
+            if token[0] == "/":
+                token = _next()  # skip the "/" separator between steps
+        except StopIteration:
+            break
+    _cache[cache_key] = selector  # same key as the lookup above, or the cache never hits
+    return selector
+
+##
+# Iterate over the matching nodes
+
+def iterfind(elem, path, namespaces=None):
+    """Return an iterator over the elements that `path` selects from `elem`."""
+    matches = iter((elem,))  # seed: the context element itself
+    for step in _build_path_iterator(path, namespaces):
+        matches = step(matches)  # every step wraps the previous iterator
+    return matches
+
+##
+# Find first matching object.
+
+def find(elem, path, namespaces=None):
+    """Return the first element matching `path`, or None if there is none."""
+    matches = iterfind(elem, path, namespaces)
+    # old-style iterators expose .next(); Python 3 only has the next() builtin
+    advance = getattr(matches, 'next', None)
+    try:
+        if advance is None:
+            return next(matches)
+        return advance()
+    except StopIteration:
+        return None
+
+##
+# Find all matching objects.
+
+def findall(elem, path, namespaces=None):
+    return list(iterfind(elem, path, namespaces))  # exhaust the iterator into a list
+
+##
+# Find text for first matching object.
+
+def findtext(elem, path, default=None, namespaces=None):
+    """Return the text of the first match ('' if it has none), else `default`."""
+    match = find(elem, path, namespaces)
+    if match is not None:
+        return match.text or ''  # a match without text gives '', not `default`
+    return default
diff --git a/lib/lxml/apihelpers.pxi b/lib/lxml/apihelpers.pxi
new file mode 100644
index 00000000..c41e3044
--- /dev/null
+++ b/lib/lxml/apihelpers.pxi
@@ -0,0 +1,1645 @@
+# Private/public helper functions for API functions
+
+from lxml.includes cimport uri
+
+cdef object OrderedDict = None
+try:
+    from collections import OrderedDict
+except ImportError:
+    pass
+
+cdef void displayNode(xmlNode* c_node, indent):
+    # debugging aid: print the address of c_node and, recursively, of its children
+    cdef xmlNode* c_child
+    try:
+        print indent * u' ', <long>c_node  # one space of indentation per tree level
+        c_child = c_node.children
+        while c_child is not NULL:
+            displayNode(c_child, indent + 1)
+            c_child = c_child.next  # walk the sibling chain
+    finally:
+        return  # swallow any exceptions
+
+cdef inline int _assertValidNode(_Element element) except -1:  # fails if the proxy has no C node
+    assert element._c_node is not NULL, u"invalid Element proxy at %s" % id(element)
+
+cdef inline int _assertValidDoc(_Document doc) except -1:  # fails if the proxy has no C document
+    assert doc._c_doc is not NULL, u"invalid Document proxy at %s" % id(doc)
+
+cdef _Document _documentOrRaise(object input):
+    u"""Call this to get the document of a _Document, _ElementTree or _Element
+    object, or to raise an exception if it can't be determined: TypeError for
+    any other input type, ValueError if the input has no document.
+    Should be used in all API functions for consistency.
+    """
+    cdef _Document doc
+    if isinstance(input, _ElementTree):
+        if (<_ElementTree>input)._context_node is not None:
+            doc = (<_ElementTree>input)._context_node._doc
+        else:
+            doc = None  # tree without a context node: reported as ValueError below
+    elif isinstance(input, _Element):
+        doc = (<_Element>input)._doc
+    elif isinstance(input, _Document):
+        doc = <_Document>input
+    else:
+        raise TypeError, u"Invalid input object: %s" % \
+            python._fqtypename(input).decode('utf8')
+    if doc is None:
+        raise ValueError, u"Input object has no document: %s" % \
+            python._fqtypename(input).decode('utf8')
+    _assertValidDoc(doc)  # additionally requires a non-NULL C document
+    return doc
+
+cdef _Element _rootNodeOrRaise(object input):
+    u"""Call this to get the root node of a _Document, _ElementTree or
+     _Element object, or to raise an exception if it can't be determined.
+
+    Should be used in all API functions for consistency.
+     """
+    cdef _Element node
+    if isinstance(input, _ElementTree):
+        node = (<_ElementTree>input)._context_node  # may be None; checked below
+    elif isinstance(input, _Element):
+        node = <_Element>input  # an element is returned as-is
+    elif isinstance(input, _Document):
+        node = (<_Document>input).getroot()
+    else:
+        raise TypeError, u"Invalid input object: %s" % \
+            python._fqtypename(input).decode('utf8')
+    if (node is None or not node._c_node or  # missing node or missing C node ...
+            node._c_node.type != tree.XML_ELEMENT_NODE):  # ... or not an element node
+        raise ValueError, u"Input object has no element: %s" % \
+            python._fqtypename(input).decode('utf8')
+    _assertValidNode(node)
+    return node
+
+cdef _Element _makeElement(tag, xmlDoc* c_doc, _Document doc,
+                           _BaseParser parser, text, tail, attrib, nsmap,
+                           dict extra_attrs):
+    u"""Create a new element and initialize text content, namespaces and
+    attributes.
+
+    This helper function will reuse as much of the existing document as
+    possible:
+
+    If 'parser' is None, the parser will be inherited from 'doc' or the
+    default parser will be used.
+
+    If 'doc' is None, 'c_doc' is used to create a new _Document and the new
+    element is made its root node.
+
+    If 'c_doc' is also NULL, a new xmlDoc will be created.
+    """
+    cdef xmlNode* c_node
+    if doc is not None:
+        c_doc = doc._c_doc  # an existing document overrides the c_doc argument
+    ns_utf, name_utf = _getNsTag(tag)
+    if parser is not None and parser._for_html:
+        _htmlTagValidOrRaise(name_utf)  # HTML parsers get HTML tag validation and an HTML doc
+        if c_doc is NULL:
+            c_doc = _newHTMLDoc()
+    else:
+        _tagValidOrRaise(name_utf)
+        if c_doc is NULL:
+            c_doc = _newXMLDoc()
+    c_node = _createElement(c_doc, name_utf)
+    if c_node is NULL:
+        if doc is None and c_doc is not NULL:
+            tree.xmlFreeDoc(c_doc)  # no _Document owns c_doc yet, so free it here
+        raise MemoryError()
+    try:
+        if doc is None:
+            tree.xmlDocSetRootElement(c_doc, c_node)
+            doc = _documentFactory(c_doc, parser)  # from here on 'doc' is no longer None
+        if text is not None:
+            _setNodeText(c_node, text)
+        if tail is not None:
+            _setTailText(c_node, tail)
+        # add namespaces to node if necessary
+        _initNodeNamespaces(c_node, doc, ns_utf, nsmap)
+        _initNodeAttributes(c_node, doc, attrib, extra_attrs)
+        return _elementFactory(doc, c_node)
+    except:
+        # free allocated c_node/c_doc unless Python does it for us
+        if c_node.doc is not c_doc:
+            # node not yet in document => will not be freed by document
+            if tail is not None:
+                _removeText(c_node.next) # tail
+            tree.xmlFreeNode(c_node)
+        if doc is None:
+            # c_doc will not be freed by doc
+            tree.xmlFreeDoc(c_doc)
+        raise  # cleanup only; the original exception propagates
+
+cdef int _initNewElement(_Element element, bint is_html, name_utf, ns_utf,
+                         _BaseParser parser, attrib, nsmap, dict extra_attrs) except -1:
+    u"""Initialise a new Element object.
+
+    This is used when users instantiate a Python Element subclass
+    directly, without it being mapped to an existing XML node.
+    """
+    cdef xmlDoc* c_doc
+    cdef xmlNode* c_node
+    cdef _Document doc
+    if is_html:
+        _htmlTagValidOrRaise(name_utf)  # validate before anything is allocated
+        c_doc = _newHTMLDoc()
+    else:
+        _tagValidOrRaise(name_utf)
+        c_doc = _newXMLDoc()
+    c_node = _createElement(c_doc, name_utf)
+    if c_node is NULL:
+        if c_doc is not NULL:
+            tree.xmlFreeDoc(c_doc)  # nothing wraps the fresh document yet, so free it here
+        raise MemoryError()
+    tree.xmlDocSetRootElement(c_doc, c_node)  # the new node becomes the document root
+    doc = _documentFactory(c_doc, parser)
+    # add namespaces to node if necessary
+    _initNodeNamespaces(c_node, doc, ns_utf, nsmap)
+    _initNodeAttributes(c_node, doc, attrib, extra_attrs)
+    _registerProxy(element, doc, c_node)  # attach the existing Python object to the new C node
+    element._init()
+    return 0
+
+cdef _Element _makeSubElement(_Element parent, tag, text, tail,
+                              attrib, nsmap, dict extra_attrs):
+    u"""Create a new child element and initialize text content, namespaces and
+    attributes.
+    """
+    cdef xmlNode* c_node
+    cdef xmlDoc* c_doc
+    if parent is None or parent._doc is None:
+        return None  # no usable parent: give up silently instead of raising
+    _assertValidNode(parent)
+    ns_utf, name_utf = _getNsTag(tag)
+    c_doc = parent._doc._c_doc  # the child is created in the parent's document
+
+    if parent._doc._parser is not None and parent._doc._parser._for_html:
+        _htmlTagValidOrRaise(name_utf)
+    else:
+        _tagValidOrRaise(name_utf)
+
+    c_node = _createElement(c_doc, name_utf)
+    if c_node is NULL:
+        raise MemoryError()
+    tree.xmlAddChild(parent._c_node, c_node)  # linked in before it is initialised
+
+    try:
+        if text is not None:
+            _setNodeText(c_node, text)
+        if tail is not None:
+            _setTailText(c_node, tail)
+
+        # add namespaces to node if necessary
+        _initNodeNamespaces(c_node, parent._doc, ns_utf, nsmap)
+        _initNodeAttributes(c_node, parent._doc, attrib, extra_attrs)
+        return _elementFactory(parent._doc, c_node)
+    except:
+        # make sure we clean up in case of an error
+        _removeNode(parent._doc, c_node)
+        raise  # re-raise after taking the half-built child out again
+
+cdef int _initNodeNamespaces(xmlNode* c_node, _Document doc,
+                             object node_ns_utf, object nsmap) except -1:
+    u"""Lookup current namespace prefixes, then set namespace structure for
+    node and register new ns-prefix mappings.
+
+    This only works for a newly created node!
+    """
+    cdef xmlNs* c_ns
+    cdef list nsdefs
+    if not nsmap:
+        if node_ns_utf is not None:  # no prefix map: only the node's own namespace matters
+            _uriValidOrRaise(node_ns_utf)
+            doc._setNodeNs(c_node, _xcstr(node_ns_utf))
+        return 0
+
+    nsdefs = list(nsmap.items())
+    if None in nsmap and len(nsdefs) > 1:
+        # Move the default namespace to the end.  This makes sure libxml2
+        # prefers a prefix if the ns is defined redundantly on the same
+        # element.  That way, users can work around a problem themselves
+        # where default namespace attributes on non-default namespaced
+        # elements serialise without prefix (i.e. into the non-default
+        # namespace).
+        item = (None, nsmap[None])
+        nsdefs.remove(item)
+        nsdefs.append(item)
+
+    for prefix, href in nsdefs:
+        href_utf = _utf8(href)
+        _uriValidOrRaise(href_utf)
+        c_href = _xcstr(href_utf)
+        if prefix is not None:
+            prefix_utf = _utf8(prefix)
+            _prefixValidOrRaise(prefix_utf)
+            c_prefix = _xcstr(prefix_utf)
+        else:
+            c_prefix = <const_xmlChar*>NULL  # a None prefix is passed on as NULL
+        # add namespace with prefix if it is not already known
+        c_ns = tree.xmlSearchNs(doc._c_doc, c_node, c_prefix)
+        if c_ns is NULL or \
+                c_ns.href is NULL or \
+                tree.xmlStrcmp(c_ns.href, c_href) != 0:
+            c_ns = tree.xmlNewNs(c_node, c_href, c_prefix)  # unknown prefix, or bound to another URI
+        if href_utf == node_ns_utf:
+            tree.xmlSetNs(c_node, c_ns)  # this mapping carries the node's own namespace
+            node_ns_utf = None  # mark as handled, which skips the fallback below
+
+    if node_ns_utf is not None:
+        doc._setNodeNs(c_node, _xcstr(node_ns_utf))  # the node's namespace was not in nsmap
+    return 0
+
+cdef _initNodeAttributes(xmlNode* c_node, _Document doc, attrib, dict extra):
+    u"""Initialise the attributes of an element node from 'extra' and 'attrib'.
+    """
+    cdef bint is_html
+    cdef xmlNs* c_ns
+    if attrib is not None and not hasattr(attrib, u'items'):  # must look like a mapping
+        raise TypeError, u"Invalid attribute dictionary: %s" % \
+            python._fqtypename(attrib).decode('utf8')
+    if not attrib and not extra:
+        return  # nothing to do
+    is_html = doc._parser._for_html  # NOTE(review): assumes doc._parser is set here; confirm
+    seen = set()  # (ns, name) pairs added so far; later duplicates are skipped
+    if extra:
+        for name, value in sorted(extra.items()):  # 'extra' goes first, so it wins over 'attrib'
+            _addAttributeToNode(c_node, doc, is_html, name, value, seen)
+    if attrib:
+        # attrib will usually be a plain unordered dict
+        if type(attrib) is dict:
+            attrib = sorted(attrib.items())
+        elif isinstance(attrib, _Attrib) or (
+                OrderedDict is not None and isinstance(attrib, OrderedDict)):
+            attrib = attrib.items()  # these mappings keep their own item order
+        else:
+            # assume it's an unordered mapping of some kind
+            attrib = sorted(attrib.items())
+        for name, value in attrib:
+            _addAttributeToNode(c_node, doc, is_html, name, value, seen)
+
+cdef int _addAttributeToNode(xmlNode* c_node, _Document doc, bint is_html,
+                             name, value, set seen_tags) except -1:
+    ns_utf, name_utf = tag = _getNsTag(name)  # 'tag' is the (ns, name) pair used for de-duplication
+    if tag in seen_tags:
+        return 0  # already set by an earlier call: the first value wins
+    seen_tags.add(tag)
+    if not is_html:
+        _attributeValidOrRaise(name_utf)  # name validation is skipped for HTML
+    value_utf = _utf8(value)
+    if ns_utf is None:
+        tree.xmlNewProp(c_node, _xcstr(name_utf), _xcstr(value_utf))
+    else:
+        _uriValidOrRaise(ns_utf)
+        c_ns = doc._findOrBuildNodeNs(c_node, _xcstr(ns_utf), NULL, 1)
+        tree.xmlNewNsProp(c_node, c_ns,
+                          _xcstr(name_utf), _xcstr(value_utf))
+    return 0
+
+ctypedef struct _ns_node_ref:  # pairs a namespace declaration with the node that carries it
+    xmlNs* ns
+    xmlNode* node
+
+cdef int _removeUnusedNamespaceDeclarations(xmlNode* c_element) except -1:
+    u"""Remove any namespace declarations from a subtree that are not used by
+    any of its elements (or attributes).
+    """
+    cdef _ns_node_ref* c_ns_list
+    cdef _ns_node_ref* c_nsref_ptr
+    cdef xmlNs* c_nsdef
+    cdef xmlNode* c_node
+    cdef size_t c_ns_list_size
+    cdef size_t c_ns_list_len
+    cdef size_t i
+
+    c_ns_list = NULL  # growable array of candidate (declaration, owner node) pairs
+    c_ns_list_size = 0  # allocated capacity
+    c_ns_list_len  = 0  # entries currently in use
+
+    if c_element.parent is not NULL and \
+            c_element.parent.type == tree.XML_DOCUMENT_NODE:
+        # include the document node
+        c_nsdef = c_element.parent.nsDef
+        while c_nsdef is not NULL:
+            if c_ns_list_len >= c_ns_list_size:
+                if c_ns_list is NULL:
+                    c_ns_list_size = 20  # initial capacity
+                else:
+                    c_ns_list_size *= 2  # double when full
+                c_nsref_ptr = <_ns_node_ref*> stdlib.realloc(
+                    c_ns_list, c_ns_list_size * sizeof(_ns_node_ref))
+                if c_nsref_ptr is NULL:
+                    if c_ns_list is not NULL:
+                        stdlib.free(c_ns_list)  # free the old buffer before raising
+                    raise MemoryError()
+                c_ns_list = c_nsref_ptr
+
+            c_ns_list[c_ns_list_len].ns   = c_nsdef
+            c_ns_list[c_ns_list_len].node = c_element.parent
+            c_ns_list_len += 1
+            c_nsdef = c_nsdef.next
+
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_element, c_element, 1)
+    # collect all new namespace declarations into the ns list
+    c_nsdef = c_element.nsDef
+    while c_nsdef is not NULL:
+        if c_ns_list_len >= c_ns_list_size:
+            if c_ns_list is NULL:
+                c_ns_list_size = 20
+            else:
+                c_ns_list_size *= 2
+            c_nsref_ptr = <_ns_node_ref*> stdlib.realloc(
+                c_ns_list, c_ns_list_size * sizeof(_ns_node_ref))
+            if c_nsref_ptr is NULL:
+                if c_ns_list is not NULL:
+                    stdlib.free(c_ns_list)
+                raise MemoryError()
+            c_ns_list = c_nsref_ptr
+
+        c_ns_list[c_ns_list_len].ns   = c_nsdef
+        c_ns_list[c_ns_list_len].node = c_element
+        c_ns_list_len += 1
+        c_nsdef = c_nsdef.next
+
+    # remove all namespace declarations from the list that are referenced
+    if c_element.type == tree.XML_ELEMENT_NODE:
+        c_node = c_element
+        while c_node is not NULL:
+            if c_node.ns is not NULL:
+                for i in range(c_ns_list_len):
+                    if c_node.ns is c_ns_list[i].ns:
+                        c_ns_list_len -= 1  # unordered removal: the last entry fills the gap
+                        c_ns_list[i].ns   = c_ns_list[c_ns_list_len].ns
+                        c_ns_list[i].node = c_ns_list[c_ns_list_len].node
+                        c_ns_list[c_ns_list_len].ns   = NULL
+                        c_ns_list[c_ns_list_len].node = NULL
+                        break
+            if c_node is c_element:
+                # continue with attributes
+                c_node = <xmlNode*>c_element.properties
+            else:
+                c_node = c_node.next  # next attribute of the same element
+    tree.END_FOR_EACH_ELEMENT_FROM(c_element)
+
+    if c_ns_list is NULL:
+        return 0  # no declaration was ever collected
+
+    # free all namespace declarations that remained in the list
+    for i in range(c_ns_list_len):
+        c_node = c_ns_list[i].node
+        c_nsdef = c_node.nsDef
+        if c_nsdef is c_ns_list[i].ns:
+            c_node.nsDef = c_node.nsDef.next  # unlink the head of the owner's nsDef list
+        else:
+            while c_nsdef.next is not c_ns_list[i].ns:
+                c_nsdef = c_nsdef.next  # find the predecessor of the entry to drop
+            c_nsdef.next = c_nsdef.next.next
+        tree.xmlFreeNs(c_ns_list[i].ns)
+    
+    if c_ns_list is not NULL:
+        stdlib.free(c_ns_list)
+    return 0
+
+cdef xmlNs* _searchNsByHref(xmlNode* c_node, const_xmlChar* c_href, bint is_attribute):
+    u"""Search a namespace declaration that covers a node (element or
+    attribute).
+
+    For attributes, try to find a prefixed namespace declaration
+    instead of the default namespaces.  This helps in supporting
+    round-trips for attributes on elements with a different namespace.
+
+    Returns NULL if c_href or c_node is NULL, if c_node is an entity
+    reference node, or if the search finds no usable declaration.
+    """
+    cdef xmlNs* c_ns
+    cdef xmlNs* c_default_ns = NULL
+    cdef xmlNode* c_element
+    if c_href is NULL or c_node is NULL or c_node.type == tree.XML_ENTITY_REF_NODE:
+        return NULL
+    if tree.xmlStrcmp(c_href, tree.XML_XML_NAMESPACE) == 0:
+        # no special cases here, let libxml2 handle this
+        return tree.xmlSearchNsByHref(c_node.doc, c_node, c_href)
+    if c_node.type == tree.XML_ATTRIBUTE_NODE:
+        # attribute nodes always get the attribute treatment, regardless
+        # of the flag that was passed in
+        is_attribute = 1
+    # walk up to the closest element node; all prefix lookups below start
+    # from that element
+    while c_node is not NULL and c_node.type != tree.XML_ELEMENT_NODE:
+        c_node = c_node.parent
+    c_element = c_node
+    # inspect the start element first, then each of its ancestors
+    while c_node is not NULL:
+        if c_node.type == tree.XML_ELEMENT_NODE:
+            # 1) the declarations defined on this node
+            c_ns = c_node.nsDef
+            while c_ns is not NULL:
+                if c_ns.href is not NULL and tree.xmlStrcmp(c_href, c_ns.href) == 0:
+                    if c_ns.prefix is NULL and is_attribute:
+                        # for attributes, continue searching a named
+                        # prefix, but keep the first default namespace
+                        # declaration that we found
+                        if c_default_ns is NULL:
+                            c_default_ns = c_ns
+                    elif tree.xmlSearchNs(
+                        c_element.doc, c_element, c_ns.prefix) is c_ns:
+                        # start node is in namespace scope => found!
+                        return c_ns
+                c_ns = c_ns.next
+            # 2) the namespace used by an ancestor itself (skipped for the
+            # start element)
+            if c_node is not c_element and c_node.ns is not NULL:
+                # optimise: the node may have the namespace itself
+                c_ns = c_node.ns
+                if c_ns.href is not NULL and tree.xmlStrcmp(c_href, c_ns.href) == 0:
+                    if c_ns.prefix is NULL and is_attribute:
+                        # for attributes, continue searching a named
+                        # prefix, but keep the first default namespace
+                        # declaration that we found
+                        if c_default_ns is NULL:
+                            c_default_ns = c_ns
+                    elif tree.xmlSearchNs(
+                        c_element.doc, c_element, c_ns.prefix) is c_ns:
+                        # start node is in namespace scope => found!
+                        return c_ns
+        c_node = c_node.parent
+    # nothing found => use a matching default namespace or fail
+    if c_default_ns is not NULL:
+        # only accept the remembered default declaration if a lookup of the
+        # NULL prefix from the start element returns that same declaration
+        if tree.xmlSearchNs(c_element.doc, c_element, NULL) is c_default_ns:
+            return c_default_ns
+    return NULL
+
+cdef int _replaceNodeByChildren(_Document doc, xmlNode* c_node) except -1:
+    # Replace c_node in its parent's child list by the children of c_node.
+    # A node without children is simply unlinked.  Always returns 0.
+    # NOTE: this does not deallocate the node, just unlink it!
+    # NOTE(review): c_parent is dereferenced below without a NULL check;
+    # presumably callers only pass nodes that have a parent - confirm.
+    cdef xmlNode* c_parent
+    cdef xmlNode* c_child
+    if c_node.children is NULL:
+        tree.xmlUnlinkNode(c_node)
+        return 0
+
+    c_parent = c_node.parent
+    # fix parent links of children
+    c_child = c_node.children
+    while c_child is not NULL:
+        c_child.parent = c_parent
+        c_child = c_child.next
+
+    # fix namespace references of children if their parent's namespace
+    # declarations get lost
+    if c_node.nsDef is not NULL:
+        c_child = c_node.children
+        while c_child is not NULL:
+            moveNodeToDocument(doc, doc._c_doc, c_child)
+            c_child = c_child.next
+
+    # fix sibling links to/from child slice
+    if c_node.prev is NULL:
+        # c_node was the first child: the parent now starts with its children
+        c_parent.children = c_node.children
+    else:
+        c_node.prev.next = c_node.children
+        c_node.children.prev = c_node.prev
+    if c_node.next is NULL:
+        # c_node was the last child: the parent now ends with its last child
+        c_parent.last = c_node.last
+    else:
+        c_node.next.prev = c_node.last
+        c_node.last.next = c_node.next
+
+    # unlink c_node
+    c_node.children = c_node.last = NULL
+    c_node.parent = c_node.next = c_node.prev = NULL
+    return 0
+
+cdef object _attributeValue(xmlNode* c_element, xmlAttr* c_attrib_node):
+    u"""Return the value of the attribute node ``c_attrib_node`` as read
+    from ``c_element`` by xmlGetNsProp() and converted by funicode().
+    """
+    c_ns_uri = _getNs(<xmlNode*>c_attrib_node)
+    c_text = tree.xmlGetNsProp(c_element, c_attrib_node.name, c_ns_uri)
+    try:
+        return funicode(c_text)
+    finally:
+        # the buffer obtained from xmlGetNsProp() is released in any case
+        tree.xmlFree(c_text)
+
+cdef object _attributeValueFromNsName(xmlNode* c_element,
+                                      const_xmlChar* c_href, const_xmlChar* c_name):
+    u"""Read the attribute ``c_name`` in namespace ``c_href`` from
+    ``c_element``.
+
+    Returns None if xmlGetNsProp() yields NULL, otherwise the value as
+    converted by funicode().
+    """
+    c_value = tree.xmlGetNsProp(c_element, c_name, c_href)
+    if c_value is not NULL:
+        try:
+            return funicode(c_value)
+        finally:
+            # release the buffer handed out by xmlGetNsProp()
+            tree.xmlFree(c_value)
+    return None
+
+cdef object _getNodeAttributeValue(xmlNode* c_node, key, default):
+    u"""Look up the attribute ``key`` on ``c_node``.
+
+    ``key`` is split into namespace and local name by _getNsTag().
+    Returns ``default`` if xmlGetNsProp() yields NULL, otherwise the
+    value as converted by funicode().
+    """
+    ns, tag = _getNsTag(key)
+    c_href = <const_xmlChar*>NULL if ns is None else _xcstr(ns)
+    c_value = tree.xmlGetNsProp(c_node, _xcstr(tag), c_href)
+    if c_value is not NULL:
+        try:
+            return funicode(c_value)
+        finally:
+            # release the buffer handed out by xmlGetNsProp()
+            tree.xmlFree(c_value)
+    # XXX free namespace that is not in use..?
+    return default
+
+cdef inline object _getAttributeValue(_Element element, key, default):
+    u"""Element-level shortcut for _getNodeAttributeValue(): look up
+    ``key`` on the C node of ``element``.
+    """
+    cdef xmlNode* c_node = element._c_node
+    return _getNodeAttributeValue(c_node, key, default)
+
+cdef int _setAttributeValue(_Element element, key, value) except -1:
+    u"""Set the attribute ``key`` of ``element`` to ``value``.
+
+    ``key`` is split into namespace and local name by _getNsTag().
+    Unless ``element._doc._parser._for_html`` is set, the local name is
+    checked by _attributeValidOrRaise().  QName values are resolved
+    against the element by _resolveQNameText(), all other values are
+    converted by _utf8().
+    """
+    cdef xmlNs* c_ns = NULL
+    ns, tag = _getNsTag(key)
+    if not element._doc._parser._for_html:
+        _attributeValidOrRaise(tag)
+    c_tag = _xcstr(tag)
+    if not isinstance(value, QName):
+        value = _utf8(value)
+    else:
+        value = _resolveQNameText(element, value)
+    c_value = _xcstr(value)
+    if ns is not None:
+        # namespaced attribute: find or create a declaration for it
+        c_ns = element._doc._findOrBuildNodeNs(element._c_node, _xcstr(ns), NULL, 1)
+    tree.xmlSetNsProp(element._c_node, c_ns, c_tag, c_value)
+    return 0
+
+cdef int _delAttribute(_Element element, key) except -1:
+    u"""Delete the attribute ``key`` from ``element``.
+
+    Raises KeyError with ``key`` if _delAttributeFromNsName() reports
+    that there was nothing to delete.
+    """
+    ns, tag = _getNsTag(key)
+    c_href = <const_xmlChar*>NULL if ns is None else _xcstr(ns)
+    if not _delAttributeFromNsName(element._c_node, c_href, _xcstr(tag)):
+        return 0
+    raise KeyError, key
+
+cdef int _delAttributeFromNsName(xmlNode* c_node, const_xmlChar* c_href, const_xmlChar* c_name):
+    u"""Remove the attribute ``c_name`` in namespace ``c_href`` from
+    ``c_node``.
+
+    Returns 0 after removing the attribute and -1 if xmlHasNsProp() did
+    not find it.
+    """
+    c_found = tree.xmlHasNsProp(c_node, c_name, c_href)
+    if c_found is not NULL:
+        tree.xmlRemoveProp(c_found)
+        return 0
+    # XXX free namespace that is not in use..?
+    return -1
+
+cdef list _collectAttributes(xmlNode* c_node, int collecttype):
+    u"""Return a list with one entry per attribute node of ``c_node``.
+
+    ``collecttype`` selects the entries: 1 gives the names as built by
+    _namespacedName(), 2 gives the values as read by _attributeValue(),
+    any other value gives (name, value) tuples.
+    """
+    cdef Py_ssize_t total = 0
+    cdef Py_ssize_t pos = 0
+
+    # first pass: count the attribute nodes to size the result list
+    c_attr = c_node.properties
+    while c_attr is not NULL:
+        if c_attr.type == tree.XML_ATTRIBUTE_NODE:
+            total += 1
+        c_attr = c_attr.next
+    if total == 0:
+        return []
+
+    # second pass: fill the preallocated list in place
+    collected = [None] * total
+    c_attr = c_node.properties
+    while c_attr is not NULL:
+        if c_attr.type == tree.XML_ATTRIBUTE_NODE:
+            if collecttype == 1:
+                entry = _namespacedName(<xmlNode*>c_attr)
+            elif collecttype == 2:
+                entry = _attributeValue(c_node, c_attr)
+            else:
+                entry = (_namespacedName(<xmlNode*>c_attr),
+                         _attributeValue(c_node, c_attr))
+            collected[pos] = entry
+            pos += 1
+        c_attr = c_attr.next
+    return collected
+
+# Matches an XML declaration at the start of a string that carries an
+# 'encoding' pseudo-attribute.  Group 1 captures the declaration up to
+# (but excluding) the whitespace before 'encoding'; group 2 captures an
+# immediately following '?>' including leading whitespace, or is empty.
+cdef object __RE_XML_ENCODING = re.compile(
+    ur'^(<\?xml[^>]+)\s+encoding\s*=\s*["\'][^"\']*["\'](\s*\?>|)', re.U)
+
+# bound methods of the compiled pattern, looked up once at module level
+cdef object __REPLACE_XML_ENCODING = __RE_XML_ENCODING.sub
+cdef object __HAS_XML_ENCODING = __RE_XML_ENCODING.match
+
+cdef object _stripEncodingDeclaration(object xml_string):
+    u"""Return ``xml_string`` with the encoding declaration cut out of a
+    leading XML declaration.
+
+    This is a hack to remove the XML encoding declaration from unicode
+    strings: the match of __RE_XML_ENCODING is replaced by its groups 1
+    and 2.
+    """
+    keep_groups = ur'\g<1>\g<2>'
+    return __REPLACE_XML_ENCODING(keep_groups, xml_string)
+
+cdef bint _hasEncodingDeclaration(object xml_string) except -1:
+    u"""Tell whether a (unicode) string starts with an XML declaration
+    that has an encoding declaration, i.e. whether __RE_XML_ENCODING
+    matches it.
+    """
+    found = __HAS_XML_ENCODING(xml_string)
+    return found is not None
+
+cdef inline bint _hasText(xmlNode* c_node):
+    u"""True if _textNodeOrSkip() finds a text node at the start of the
+    children of ``c_node``.  False for a NULL node.
+    """
+    if c_node is NULL:
+        return 0
+    return _textNodeOrSkip(c_node.children) is not NULL
+
+cdef inline bint _hasTail(xmlNode* c_node):
+    u"""True if _textNodeOrSkip() finds a text node right behind
+    ``c_node``.  False for a NULL node.
+    """
+    if c_node is NULL:
+        return 0
+    return _textNodeOrSkip(c_node.next) is not NULL
+
+cdef _collectText(xmlNode* c_node):
+    u"""Join the content of the run of text nodes that starts at c_node.
+
+    Returns None if there is no text node at all, the empty string if
+    all text nodes of the run are empty, and the string built by
+    funicode() otherwise.
+    """
+    cdef Py_ssize_t text_count = 0
+    cdef xmlChar* c_last_content = NULL
+    cdef xmlNode* c_cursor
+    # first pass: count the text nodes and remember the last non-empty one
+    c_node = _textNodeOrSkip(c_node)
+    c_cursor = c_node
+    while c_cursor is not NULL:
+        if c_cursor.content[0] != c'\0':
+            c_last_content = c_cursor.content
+        text_count += 1
+        c_cursor = _textNodeOrSkip(c_cursor.next)
+
+    # the two most common cases: nothing but empty text, or one single node
+    if c_last_content is NULL:
+        if text_count > 0:
+            return ''
+        return None
+    if text_count == 1:
+        return funicode(c_last_content)
+
+    # several text nodes: concatenate them, this is not performance critical
+    joined = b''
+    while c_node is not NULL:
+        joined += <unsigned char*>c_node.content
+        c_node = _textNodeOrSkip(c_node.next)
+    return funicode(<const_xmlChar*><unsigned char*>joined)
+
+cdef void _removeText(xmlNode* c_node):
+    u"""Unlink and free the run of text nodes that starts at c_node, as
+    delimited by _textNodeOrSkip().
+    """
+    cdef xmlNode* c_following
+    c_node = _textNodeOrSkip(c_node)
+    while c_node is not NULL:
+        # look up the successor before the current node is freed
+        c_following = _textNodeOrSkip(c_node.next)
+        tree.xmlUnlinkNode(c_node)
+        tree.xmlFreeNode(c_node)
+        c_node = c_following
+
+cdef int _setNodeText(xmlNode* c_node, value) except -1:
+    u"""Replace the leading text of ``c_node`` by ``value``.
+
+    ``value`` may be None (the text is only removed), a string (converted
+    by _utf8()) or a CDATA instance.  Any other value is passed to
+    _utf8(), which is expected to raise the appropriate error.
+
+    The new text node is created before the existing text is removed, so
+    that an invalid value or a failed allocation leaves the current text
+    untouched.  Raises MemoryError if libxml2 cannot create the new node.
+    """
+    cdef xmlNode* c_text_node = NULL
+    if value is not None:
+        if python._isString(value):
+            text = _utf8(value)
+            c_text_node = tree.xmlNewDocText(c_node.doc, _xcstr(text))
+        elif isinstance(value, CDATA):
+            c_text_node = tree.xmlNewCDataBlock(
+                c_node.doc, _xcstr((<CDATA>value)._utf8_data),
+                python.PyBytes_GET_SIZE((<CDATA>value)._utf8_data))
+        else:
+            # this will raise the right error
+            _utf8(value)
+            return -1
+        if c_text_node is NULL:
+            raise MemoryError()
+    # remove all text nodes at the start first
+    _removeText(c_node.children)
+    if c_text_node is NULL:
+        # value was None: nothing to add
+        return 0
+    # now add new text node with value at start
+    if c_node.children is NULL:
+        tree.xmlAddChild(c_node, c_text_node)
+    else:
+        tree.xmlAddPrevSibling(c_node.children, c_text_node)
+    return 0
+
+cdef int _setTailText(xmlNode* c_node, value) except -1:
+    u"""Replace the tail text that follows ``c_node`` by ``value``.
+
+    ``value`` may be None (the tail is only removed) or anything that
+    _utf8() accepts.
+
+    The new text node is created before the existing tail is removed, so
+    that an invalid value or a failed allocation leaves the current tail
+    untouched.  Raises MemoryError if libxml2 cannot create the new node.
+    """
+    cdef xmlNode* c_text_node = NULL
+    if value is not None:
+        text = _utf8(value)
+        c_text_node = tree.xmlNewDocText(c_node.doc, _xcstr(text))
+        if c_text_node is NULL:
+            raise MemoryError()
+    # remove all text nodes that directly follow the node first
+    _removeText(c_node.next)
+    if c_text_node is NULL:
+        # value was None: nothing to add
+        return 0
+    # XXX what if we're the top element?
+    tree.xmlAddNextSibling(c_node, c_text_node)
+    return 0
+
+cdef bytes _resolveQNameText(_Element element, value):
+    u"""Build the byte string for the qualified name ``value`` as seen
+    from ``element``.
+
+    ``value`` is split into namespace and local name by _getNsTag().
+    Without a namespace, the local name is returned as is.  Otherwise a
+    namespace declaration is looked up (or built) for the element and
+    'prefix:name' is returned.  If that declaration has no prefix, the
+    bare local name is returned.
+    """
+    cdef xmlNs* c_ns
+    ns, tag = _getNsTag(value)
+    if ns is None:
+        return tag
+    c_ns = element._doc._findOrBuildNodeNs(
+        element._c_node, _xcstr(ns), NULL, 0)
+    if c_ns.prefix is NULL:
+        # A declaration without prefix is a default namespace declaration.
+        # Passing a NULL pointer to '%s' must be avoided.
+        # NOTE(review): assumes an unprefixed name is the intended spelling
+        # in that case - confirm against _findOrBuildNodeNs().
+        return tag
+    return python.PyBytes_FromFormat('%s:%s', c_ns.prefix, _cstr(tag))
+
+cdef inline bint _hasChild(xmlNode* c_node):
+    u"""True if _findChildForwards() finds a first child for ``c_node``.
+    False for a NULL node.
+    """
+    if c_node is NULL:
+        return 0
+    return _findChildForwards(c_node, 0) is not NULL
+
+cdef inline Py_ssize_t _countElements(xmlNode* c_node):
+    u"""Count the nodes accepted by _isElement() among ``c_node`` and all
+    of its following siblings.  Returns 0 for a NULL node.
+    """
+    cdef Py_ssize_t total = 0
+    while c_node is not NULL:
+        if _isElement(c_node):
+            total += 1
+        c_node = c_node.next
+    return total
+
+cdef int _findChildSlice(
+    slice sliceobject, xmlNode* c_parent,
+    xmlNode** c_start_node, Py_ssize_t* c_step, Py_ssize_t* c_length) except -1:
+    u"""Resolve a slice over the children of ``c_parent``.
+
+    The results are written to the pointer arguments: the node at which
+    the slice starts, the step size and the length of the slice.  For a
+    parent without children, the start node is NULL and the length is 0.
+    """
+    cdef Py_ssize_t first = 0, last = 0, n_children
+    n_children = _countElements(c_parent.children)
+    if n_children != 0:
+        python.PySlice_GetIndicesEx(
+            sliceobject, n_children, &first, &last, c_step, c_length)
+        # search from whichever end of the child list is closer
+        if first > n_children / 2:
+            c_start_node[0] = _findChildBackwards(c_parent, n_children - first - 1)
+        else:
+            c_start_node[0] = _findChild(c_parent, first)
+        return 0
+
+    # no children: only the step is taken from the slice
+    c_start_node[0] = NULL
+    c_length[0] = 0
+    if sliceobject.step is None:
+        c_step[0] = 1
+    else:
+        python._PyEval_SliceIndex(sliceobject.step, c_step)
+    return 0
+
+cdef bint _isFullSlice(slice sliceobject) except -1:
+    u"""Conservative guess if this slice is a full slice as in ``s[:]``.
+
+    True only if start and stop are both None and the step is either
+    None or evaluates to 1.  False for a None slice object.
+    """
+    cdef Py_ssize_t c_step_value = 0
+    if sliceobject is None:
+        return 0
+    if sliceobject.start is not None or sliceobject.stop is not None:
+        return 0
+    if sliceobject.step is None:
+        return 1
+    python._PyEval_SliceIndex(sliceobject.step, &c_step_value)
+    return c_step_value == 1
+
+cdef _collectChildren(_Element element):
+    u"""Return a list with an object from _elementFactory() for each
+    child of ``element`` that _isElement() accepts, in document order.
+    """
+    cdef xmlNode* c_child = element._c_node.children
+    cdef list children = []
+    if c_child is NULL:
+        return children
+    # move on to the first accepted child if the first node is something else
+    if not _isElement(c_child):
+        c_child = _nextElement(c_child)
+    while c_child is not NULL:
+        children.append(_elementFactory(element._doc, c_child))
+        c_child = _nextElement(c_child)
+    return children
+
+cdef inline xmlNode* _findChild(xmlNode* c_node, Py_ssize_t index):
+    u"""Return the child of c_node at ``index``.  A negative index is
+    counted from the end, with -1 mapping to the last child.
+    """
+    if index >= 0:
+        return _findChildForwards(c_node, index)
+    return _findChildBackwards(c_node, -index - 1)
+    
+cdef inline xmlNode* _findChildForwards(xmlNode* c_node, Py_ssize_t index):
+    u"""Return the child of c_node at position ``index``, counting only
+    nodes accepted by _isElement() from the first child on.  Returns
+    NULL if there is no such child.
+    """
+    cdef xmlNode* c_cur = c_node.children
+    cdef Py_ssize_t seen = 0
+    while c_cur is not NULL:
+        if _isElement(c_cur):
+            if seen == index:
+                return c_cur
+            seen += 1
+        c_cur = c_cur.next
+    return NULL
+
+cdef inline xmlNode* _findChildBackwards(xmlNode* c_node, Py_ssize_t index):
+    u"""Return the child of c_node at position ``index``, counting only
+    nodes accepted by _isElement() from the last child backwards.
+    Returns NULL if there is no such child.
+    """
+    cdef xmlNode* c_cur = c_node.last
+    cdef Py_ssize_t seen = 0
+    while c_cur is not NULL:
+        if _isElement(c_cur):
+            if seen == index:
+                return c_cur
+            seen += 1
+        c_cur = c_cur.prev
+    return NULL
+    
+cdef inline xmlNode* _textNodeOrSkip(xmlNode* c_node) nogil:
+    u"""Return c_node or the first following sibling that is a text or
+    CDATA section node, stepping over XInclude start/end nodes only.
+    Return NULL as soon as any other node type is met, or when the
+    siblings run out.
+
+    This is used to skip over XInclude nodes when collecting adjacent
+    text nodes.
+    """
+    while c_node is not NULL:
+        if c_node.type == tree.XML_TEXT_NODE or \
+               c_node.type == tree.XML_CDATA_SECTION_NODE:
+            return c_node
+        if c_node.type != tree.XML_XINCLUDE_START and \
+               c_node.type != tree.XML_XINCLUDE_END:
+            # neither text nor ignorable
+            return NULL
+        c_node = c_node.next
+    return NULL
+
+cdef inline xmlNode* _nextElement(xmlNode* c_node):
+    u"""Return the closest following sibling of c_node that _isElement()
+    accepts, or NULL if there is none or c_node is NULL.
+    """
+    if c_node is not NULL:
+        c_node = c_node.next
+        while c_node is not NULL and not _isElement(c_node):
+            c_node = c_node.next
+    return c_node
+
+cdef inline xmlNode* _previousElement(xmlNode* c_node):
+    u"""Return the closest preceding sibling of c_node that _isElement()
+    accepts, or NULL if there is none or c_node is NULL.
+    """
+    if c_node is not NULL:
+        c_node = c_node.prev
+        while c_node is not NULL and not _isElement(c_node):
+            c_node = c_node.prev
+    return c_node
+
+cdef inline xmlNode* _parentElement(xmlNode* c_node):
+    u"""Return the parent of c_node if both c_node and its parent are
+    accepted by _isElement(); return NULL otherwise.
+    """
+    cdef xmlNode* c_parent
+    if c_node is not NULL and _isElement(c_node):
+        c_parent = c_node.parent
+        if c_parent is not NULL and _isElement(c_parent):
+            return c_parent
+    return NULL
+
+cdef inline bint _tagMatches(xmlNode* c_node, const_xmlChar* c_href, const_xmlChar* c_name):
+    u"""Tests if the node matches namespace URI and tag name.
+
+    A NULL node never matches.  A node that is not an element node only
+    matches if both c_href and c_name are NULL.  An element node matches
+    if it matches both c_href and c_name.
+
+    c_name is matched if it is NULL or equals the node name (same
+    pointer or same string).
+
+    c_href is matched as follows:
+    * if c_href is NULL and c_name is NULL, any namespace matches
+    * if c_href is NULL and c_name is given, the node must not have a
+      namespace
+    * otherwise, a node without namespace matches the empty string and
+      a node with namespace matches the equal string
+    """
+    if c_node is NULL:
+        return 0
+    if c_node.type != tree.XML_ELEMENT_NODE:
+        # not an element, only succeed if we match everything
+        return c_name is NULL and c_href is NULL
+
+    if c_name is not NULL:
+        if c_href is NULL and _getNs(c_node) is not NULL:
+            # a plain name does not match a namespaced node
+            return 0
+        if not (c_node.name == c_name or
+                tree.xmlStrcmp(c_node.name, c_name) == 0):
+            return 0
+
+    if c_href is NULL:
+        # name accepted and no namespace requested
+        return 1
+
+    c_node_href = _getNs(c_node)
+    if c_node_href is NULL:
+        return c_href[0] == c'\0'
+    return tree.xmlStrcmp(c_node_href, c_href) == 0
+
+cdef inline bint _tagMatchesExactly(xmlNode* c_node, qname* c_qname):
+    u"""Tests if namespace URI and name of the node match c_qname.
+
+    The namespace of the node is read with _getNs(); the comparison
+    itself is done by _nsTagMatchesExactly(), which compares the names
+    by address (!) and therefore expects the name in c_qname to be taken
+    from the doc dict.
+    """
+    c_node_href = _getNs(c_node)
+    return _nsTagMatchesExactly(c_node_href, c_node.name, c_qname)
+
+cdef inline bint _nsTagMatchesExactly(const_xmlChar* c_node_href,
+                                      const_xmlChar* c_node_name,
+                                      qname* c_qname):
+    u"""Tests if name and namespace URI match those of c_qname.
+
+    In contrast to _tagMatches(), names are only compared by address,
+    so the name in c_qname is expected to be taken from the doc dict.
+
+    The name matches if any of the following is true:
+    * c_qname.c_name is NULL
+    * c_node_name points to the same address (!) as c_qname.c_name
+
+    The namespace matches if any of the following is true:
+    * c_qname.href is NULL
+    * the href of c_qname is the empty string and c_node_href is NULL
+      or empty
+    * c_node_href equals the href string of c_qname
+    """
+    cdef char* c_expected_href
+    if c_qname.c_name is not NULL:
+        if c_qname.c_name is not c_node_name:
+            return 0
+    if c_qname.href is NULL:
+        return 1
+    c_expected_href = python.__cstr(c_qname.href)
+    if c_expected_href[0] != '\0':
+        if c_node_href is NULL:
+            return 0
+        return tree.xmlStrcmp(<const_xmlChar*>c_expected_href, c_node_href) == 0
+    # empty href requested: the node must not have a namespace
+    return c_node_href is NULL or c_node_href[0] == '\0'
+
+cdef Py_ssize_t _mapTagsToQnameMatchArray(xmlDoc* c_doc, list ns_tags,
+                                          qname* c_ns_tags, bint force_into_dict) except -1:
+    u"""Map a sequence of (namespace, name) pairs to a qname array for efficient
+    matching with _tagMatchesExactly() above.
+
+    Returns the number of entries written to ``c_ns_tags``.  With
+    ``force_into_dict`` unset, names that are not in the dict of the
+    document are skipped.  Raises MemoryError if a name cannot be added
+    to the dict.
+
+    Note that each qname struct in the array owns its href byte string object
+    if it is not NULL.
+    """
+    cdef Py_ssize_t count = 0, i
+    cdef bytes ns, tag
+    for ns, tag in ns_tags:
+        if tag is None:
+            # no name given: stored as a NULL name
+            c_tag = <const_xmlChar*>NULL
+        elif force_into_dict:
+            # look the name up in the dict of the document, adding it if needed
+            c_tag = tree.xmlDictLookup(c_doc.dict, _xcstr(tag), len(tag))
+            if c_tag is NULL:
+                # clean up before raising the error
+                for i in xrange(count):
+                    cpython.ref.Py_XDECREF(c_ns_tags[i].href)
+                raise MemoryError()
+        else:
+            # read-only lookup in the dict of the document
+            c_tag = tree.xmlDictExists(c_doc.dict, _xcstr(tag), len(tag))
+            if c_tag is NULL:
+                # not in the dict => not in the document
+                continue
+        c_ns_tags[count].c_name = c_tag
+        if ns is None:
+            c_ns_tags[count].href = NULL
+        else:
+            cpython.ref.Py_INCREF(ns) # keep an owned reference!
+            c_ns_tags[count].href = <python.PyObject*>ns
+        count += 1
+    return count
+
+cdef int _removeNode(_Document doc, xmlNode* c_node) except -1:
+    u"""Unlink c_node from its tree, taking its tail text along, and try
+    to free it together with its subnodes.  If attemptDeallocation()
+    declines, make sure the node is self-contained instead.
+    """
+    # remember where the tail text starts before the node is unlinked
+    cdef xmlNode* c_tail_start = c_node.next
+    tree.xmlUnlinkNode(c_node)
+    _moveTail(c_tail_start, c_node)
+    if attemptDeallocation(c_node):
+        return 0
+    # make namespaces absolute
+    moveNodeToDocument(doc, c_node.doc, c_node)
+    return 0
+
+cdef int _removeSiblings(xmlNode* c_element, tree.xmlElementType node_type, bint with_tail) except -1:
+    # Unlink all siblings of c_element that have the type node_type and try
+    # to deallocate them.  With with_tail set, the text that follows such
+    # a sibling is removed as well.  Always returns 0.
+    cdef xmlNode* c_node
+    cdef xmlNode* c_next
+    # first pass: the siblings that follow c_element
+    c_node = c_element.next
+    while c_node is not NULL:
+        # look up the next candidate before the current node is unlinked
+        c_next = _nextElement(c_node)
+        if c_node.type == node_type:
+            if with_tail:
+                _removeText(c_node.next)
+            tree.xmlUnlinkNode(c_node)
+            attemptDeallocation(c_node)
+        c_node = c_next
+    # second pass: the siblings that precede c_element, walking backwards
+    c_node = c_element.prev
+    while c_node is not NULL:
+        c_next = _previousElement(c_node)
+        if c_node.type == node_type:
+            if with_tail:
+                _removeText(c_node.next)
+            tree.xmlUnlinkNode(c_node)
+            attemptDeallocation(c_node)
+        c_node = c_next
+    return 0
+
+cdef void _moveTail(xmlNode* c_tail, xmlNode* c_target):
+    u"""Tail support: move the run of text nodes that starts at c_tail
+    behind c_target, one node after the other.
+    """
+    cdef xmlNode* c_following
+    c_tail = _textNodeOrSkip(c_tail)
+    while c_tail is not NULL:
+        # find the next text node before the current one changes its place
+        c_following = _textNodeOrSkip(c_tail.next)
+        # continue behind whatever xmlAddNextSibling() hands back
+        c_target = tree.xmlAddNextSibling(c_target, c_tail)
+        c_tail = c_following
+
+cdef int _copyTail(xmlNode* c_tail, xmlNode* c_target) except -1:
+    u"""Tail copying support: copy the run of text nodes that starts at
+    c_tail and add the copies behind c_target.
+
+    Raises MemoryError if a node cannot be copied.
+    """
+    cdef xmlNode* c_copy
+    c_tail = _textNodeOrSkip(c_tail)
+    while c_tail is not NULL:
+        if c_target.doc is c_tail.doc:
+            c_copy = tree.xmlCopyNode(c_tail, 0)
+        else:
+            # the copy must belong to the document of the target
+            c_copy = tree.xmlDocCopyNode(c_tail, c_target.doc, 0)
+        if c_copy is NULL:
+            raise MemoryError()
+        c_target = tree.xmlAddNextSibling(c_target, c_copy)
+        c_tail = _textNodeOrSkip(c_tail.next)
+    return 0
+
+cdef int _copyNonElementSiblings(xmlNode* c_node, xmlNode* c_target) except -1:
+    u"""Copy the processing instructions and comments that directly
+    surround c_node to the corresponding places around c_target.
+
+    The copies are created for the document of c_target and keep the
+    order of the originals, both before and after the node.  Raises
+    MemoryError if a node cannot be copied.
+    """
+    cdef xmlNode* c_copy
+    cdef xmlNode* c_sibling = c_node
+    cdef xmlNode* c_last = c_target
+    # rewind to the start of the PI/comment run that precedes c_node
+    while c_sibling.prev != NULL and \
+            (c_sibling.prev.type == tree.XML_PI_NODE or \
+                 c_sibling.prev.type == tree.XML_COMMENT_NODE):
+        c_sibling = c_sibling.prev
+    # copy that run in order, each copy goes right in front of c_target
+    while c_sibling != c_node:
+        c_copy = tree.xmlDocCopyNode(c_sibling, c_target.doc, 1)
+        if c_copy is NULL:
+            raise MemoryError()
+        tree.xmlAddPrevSibling(c_target, c_copy)
+        c_sibling = c_sibling.next
+    # copy the PI/comment run that follows c_node
+    while c_sibling.next != NULL and \
+            (c_sibling.next.type == tree.XML_PI_NODE or \
+                 c_sibling.next.type == tree.XML_COMMENT_NODE):
+        c_sibling = c_sibling.next
+        c_copy = tree.xmlDocCopyNode(c_sibling, c_target.doc, 1)
+        if c_copy is NULL:
+            raise MemoryError()
+        # add behind the previously added copy; adding directly behind
+        # c_target each time would reverse the order of the run
+        tree.xmlAddNextSibling(c_last, c_copy)
+        c_last = c_copy
+    return 0
+
+cdef int _deleteSlice(_Document doc, xmlNode* c_node,
+                      Py_ssize_t count, Py_ssize_t step) except -1:
+    u"""Remove up to ``count`` nodes with _removeNode(), starting at
+    ``c_node`` and advancing by ``step`` positions each time.  A step
+    that is not positive walks backwards by its absolute value.  Does
+    nothing for a NULL start node.
+    """
+    cdef xmlNode* c_following
+    cdef Py_ssize_t removed = 0, hop
+    cdef _node_to_node_function advance
+    if c_node is NULL:
+        return 0
+    if step <= 0:
+        advance = _previousElement
+        step = -step
+    else:
+        advance = _nextElement
+    # now start deleting nodes
+    c_following = c_node
+    while c_node is not NULL and removed < count:
+        # locate the next victim before the current one is removed
+        for hop in range(step):
+            c_following = advance(c_following)
+        _removeNode(doc, c_node)
+        removed += 1
+        c_node = c_following
+    return 0
+
+cdef int _replaceSlice(_Element parent, xmlNode* c_node,
+                       Py_ssize_t slicelength, Py_ssize_t step,
+                       bint left_to_right, elements) except -1:
+    u"""Replace the slice of ``slicelength`` elements starting at ``c_node``
+    with positive step width ``step`` by the Elements in ``elements``.  The
+    direction is given by the boolean argument ``left_to_right``.
+
+    ``c_node`` may be NULL to indicate the end of the children list.
+
+    Raises ValueError if ``step`` is greater than 1 and the number of
+    elements differs from ``slicelength``.
+    """
+    cdef xmlNode* c_orig_neighbour
+    cdef xmlNode* c_next
+    cdef xmlDoc*  c_source_doc
+    cdef _Element element
+    cdef Py_ssize_t seqlength, i, c
+    cdef _node_to_node_function next_element
+    assert step > 0
+    # select the stepping function for the requested direction
+    if left_to_right:
+        next_element = _nextElement
+    else:
+        next_element = _previousElement
+
+    # materialise other iterables so that len() works below
+    if not isinstance(elements, (list, tuple)):
+        elements = list(elements)
+
+    if step > 1:
+        # *replacing* children stepwise with list => check size!
+        seqlength = len(elements)
+        if seqlength != slicelength:
+            raise ValueError, u"attempt to assign sequence of size %d " \
+                u"to extended slice of size %d" % (seqlength, slicelength)
+
+    if c_node is NULL:
+        # no children yet => add all elements straight away
+        if left_to_right:
+            for element in elements:
+                assert element is not None, u"Node must not be None"
+                _appendChild(parent, element)
+        else:
+            for element in elements:
+                assert element is not None, u"Node must not be None"
+                _prependChild(parent, element)
+        return 0
+
+    # remove the elements first as some might be re-added
+    if left_to_right:
+        # L->R, remember left neighbour
+        c_orig_neighbour = _previousElement(c_node)
+    else:
+        # R->L, remember right neighbour
+        c_orig_neighbour = _nextElement(c_node)
+
+    # We remove the original slice elements one by one. Since we hold
+    # a Python reference to all elements that we will insert, it is
+    # safe to let _removeNode() try (and fail) to free them even if
+    # the element itself or one of its descendents will be reinserted.
+    c = 0
+    c_next = c_node
+    while c_node is not NULL and c < slicelength:
+        # find the next slice member before the current one is removed
+        for i in range(step):
+            c_next = next_element(c_next)
+        _removeNode(parent._doc, c_node)
+        c += 1
+        c_node = c_next
+
+    # make sure each element is inserted only once
+    elements = iter(elements)
+
+    # find the first node right of the new insertion point
+    if left_to_right:
+        if c_orig_neighbour is not NULL:
+            c_node = next_element(c_orig_neighbour)
+        else:
+            # before the first element
+            c_node = _findChildForwards(parent._c_node, 0)
+    elif c_orig_neighbour is NULL:
+        # at the end, but reversed stepping
+        # append one element and go to the next insertion point
+        for element in elements:
+            assert element is not None, u"Node must not be None"
+            _appendChild(parent, element)
+            c_node = element._c_node
+            if slicelength > 0:
+                slicelength -= 1
+                for i in range(1, step):
+                    c_node = next_element(c_node)
+            # only the first element is consumed here, the shared iterator
+            # keeps the rest for the loops below
+            break
+
+    if left_to_right:
+        # adjust step size after removing slice as we are not stepping
+        # over the newly inserted elements
+        step -= 1
+
+    # now insert elements where we removed them
+    if c_node is not NULL:
+        for element in elements:
+            assert element is not None, u"Node must not be None"
+            _assertValidNode(element)
+            # move element and tail over
+            c_source_doc = element._c_node.doc
+            c_next = element._c_node.next
+            tree.xmlAddPrevSibling(c_node, element._c_node)
+            _moveTail(c_next, element._c_node)
+
+            # integrate element into new document
+            moveNodeToDocument(parent._doc, c_source_doc, element._c_node)
+
+            # stop at the end of the slice
+            if slicelength > 0:
+                slicelength = slicelength - 1
+                for i in range(step):
+                    c_node = next_element(c_node)
+                if c_node is NULL:
+                    break
+        else:
+            # everything inserted
+            return 0
+
+    # append the remaining elements at the respective end
+    if left_to_right:
+        for element in elements:
+            assert element is not None, u"Node must not be None"
+            _assertValidNode(element)
+            _appendChild(parent, element)
+    else:
+        for element in elements:
+            assert element is not None, u"Node must not be None"
+            _assertValidNode(element)
+            _prependChild(parent, element)
+
+    return 0
+
+cdef int _appendChild(_Element parent, _Element child) except -1:
+    u"""Move ``child`` to the end of ``parent``'s children and return 0.
+    Raises ValueError if ``child`` is ``parent`` or one of its ancestors."""
+    c_node = child._c_node
+    c_source_doc = c_node.doc  # remember the document the node comes from
+    # prevent cycles: walk up from parent and reject child if it is on that path
+    c_parent = parent._c_node
+    while c_parent:
+        if c_parent is c_node:
+            raise ValueError("cannot append parent to itself")
+        c_parent = c_parent.parent
+    # store possible text node (the sibling following child before the move)
+    c_next = c_node.next
+    # move node itself: unlink from its current position, then re-link
+    tree.xmlUnlinkNode(c_node)
+    tree.xmlAddChild(parent._c_node, c_node)
+    _moveTail(c_next, c_node)
+    # uh oh, elements may be pointing to different doc when
+    # parent element has moved; change them too..
+    moveNodeToDocument(parent._doc, c_source_doc, c_node)
+    return 0
+
+cdef int _prependChild(_Element parent, _Element child) except -1:
+    u"""Insert ``child`` before the node that _findChildForwards(parent, 0)
+    returns, or append it if there is none.  Raises ValueError on cycles."""
+    c_node = child._c_node
+    c_source_doc = c_node.doc  # remember the document the node comes from
+    # prevent cycles: walk up from parent and reject child if it is on that path
+    c_parent = parent._c_node
+    while c_parent:
+        if c_parent is c_node:
+            raise ValueError("cannot append parent to itself")
+        c_parent = c_parent.parent
+    # store possible text node (the sibling following child before the move)
+    c_next = c_node.next
+    # move node itself
+    c_child = _findChildForwards(parent._c_node, 0)
+    if c_child is NULL:
+        tree.xmlUnlinkNode(c_node)  # nothing to insert before: plain append
+        tree.xmlAddChild(parent._c_node, c_node)
+    else:
+        tree.xmlAddPrevSibling(c_child, c_node)
+    _moveTail(c_next, c_node)
+    # uh oh, elements may be pointing to different doc when
+    # parent element has moved; change them too..
+    moveNodeToDocument(parent._doc, c_source_doc, c_node)
+    return 0
+
+cdef int _appendSibling(_Element element, _Element sibling) except -1:
+    u"""Move ``sibling`` directly behind ``element`` and return 0.
+    A no-op when both wrap the same node.  NOTE(review): no cycle check here."""
+    c_node = sibling._c_node
+    if element._c_node is c_node:
+        return 0  # nothing to do
+    c_source_doc = c_node.doc  # remember the document the node comes from
+    # store possible text node (the sibling following the node before the move)
+    c_next = c_node.next
+    # move node itself
+    tree.xmlAddNextSibling(element._c_node, c_node)
+    _moveTail(c_next, c_node)
+    # uh oh, elements may be pointing to different doc when
+    # parent element has moved; change them too..
+    moveNodeToDocument(element._doc, c_source_doc, c_node)
+    return 0
+
+cdef int _prependSibling(_Element element, _Element sibling) except -1:
+    u"""Move ``sibling`` directly in front of ``element`` and return 0.
+    A no-op when both wrap the same node.  NOTE(review): no cycle check here."""
+    c_node = sibling._c_node
+    if element._c_node is c_node:
+        return 0  # nothing to do
+    c_source_doc = c_node.doc  # remember the document the node comes from
+    # store possible text node (the sibling following the node before the move)
+    c_next = c_node.next
+    # move node itself
+    tree.xmlAddPrevSibling(element._c_node, c_node)
+    _moveTail(c_next, c_node)
+    # uh oh, elements may be pointing to different doc when
+    # parent element has moved; change them too..
+    moveNodeToDocument(element._doc, c_source_doc, c_node)
+    return 0
+
+cdef inline int isutf8(const_xmlChar* s):
+    # Return 1 if the NUL-terminated string has any byte with the high bit set.
+    cdef const_xmlChar* c_pos = s
+    while c_pos[0] != c'\0':
+        if c_pos[0] & 0x80:
+            return 1
+        c_pos += 1
+    return 0
+
+cdef int check_string_utf8(bytes pystring):
+    u"""Check if a string looks like valid UTF-8 XML content.  Returns 0
+    for ASCII, 1 if any byte has the high bit set (such bytes are skipped,
+    not validated as UTF-8) and -1 for errors, i.e. a 7-bit byte (including
+    NUL) that tree.xmlIsChar_ch() rejects.
+    """
+    cdef const_xmlChar* s = _xcstr(pystring)
+    cdef const_xmlChar* c_end = s + len(pystring)  # one past the last byte
+    cdef bint is_non_ascii = 0
+    while s < c_end:
+        if s[0] & 0x80:
+            # skip over multi byte sequences
+            while s < c_end and s[0] & 0x80:
+                s += 1
+            is_non_ascii = 1
+        if  s < c_end and not tree.xmlIsChar_ch(s[0]):
+            return -1 # invalid!
+        s += 1
+    return is_non_ascii
+
+cdef inline object funicodeOrNone(const_xmlChar* s):
+    return None if s is NULL else funicode(s)  # NULL pointer maps to None
+
+cdef inline object funicodeOrEmpty(const_xmlChar* s):
+    return '' if s is NULL else funicode(s)  # NULL pointer maps to ''
+
+cdef object funicode(const_xmlChar* s):  # NUL-terminated UTF-8 -> Python string
+    cdef Py_ssize_t slen
+    cdef const_xmlChar* spos
+    cdef bint is_non_ascii
+    if python.LXML_UNICODE_STRINGS:
+        return s.decode('UTF-8')  # always hand out unicode in this mode
+    spos = s
+    is_non_ascii = 0
+    while spos[0] != c'\0':  # scan up to the first non-ASCII byte or the NUL
+        if spos[0] & 0x80:
+            is_non_ascii = 1
+            break
+        spos += 1
+    slen = spos - s
+    if spos[0] != c'\0':
+        slen += tree.xmlStrlen(spos)  # stopped early: add the unscanned rest
+    if is_non_ascii:
+        return s[:slen].decode('UTF-8')
+    return <bytes>s[:slen]  # pure ASCII is returned as a byte string
+
+cdef bytes _utf8(object s):
+    """Validate user input and return it encoded as UTF-8 bytes.
+    Raises ValueError for bytes/unicode input containing non-XML characters
+    and for bytes input containing non-ASCII characters; raises TypeError
+    when the argument is not bytes, bytearray or unicode."""
+    cdef int invalid
+    cdef bytes utf8_string
+    if not python.IS_PYTHON3 and type(s) is bytes:
+        utf8_string = <bytes>s
+        invalid = check_string_utf8(utf8_string)  # 1 (non-ASCII) and -1 both reject
+    elif isinstance(s, unicode):
+        utf8_string = (<unicode>s).encode('utf8')
+        invalid = check_string_utf8(utf8_string) == -1 # non-XML?
+    elif isinstance(s, (bytes, bytearray)):
+        utf8_string = bytes(s)
+        invalid = check_string_utf8(utf8_string)  # 1 (non-ASCII) and -1 both reject
+    else:
+        raise TypeError("Argument must be bytes or unicode, got '%.200s'" % type(s).__name__)
+    if invalid:
+        raise ValueError(
+            "All strings must be XML compatible: Unicode or ASCII, no NULL bytes or control characters")
+    return utf8_string
+
+cdef bytes _utf8orNone(object s):
+    return None if s is None else _utf8(s)  # None passes through unvalidated
+
+cdef bint _isFilePath(const_xmlChar* c_path):
+    u"simple heuristic: 1 if c_path looks like a file path, 0 for scheme:// URLs"
+    cdef xmlChar c  # NOTE(review): never used below
+    # test if it looks like an absolute Unix path or a Windows network path
+    if c_path[0] == c'/':
+        return 1
+
+    # test if it looks like an absolute Windows path or URL
+    if (c_path[0] >= c'a' and c_path[0] <= c'z') or \
+            (c_path[0] >= c'A' and c_path[0] <= c'Z'):
+        c_path += 1
+        if c_path[0] == c':' and c_path[1] in b'\0\\':
+            return 1  # C: or C:\...
+
+        # test if it looks like a URL with scheme:// (only letters count as scheme)
+        while (c_path[0] >= c'a' and c_path[0] <= c'z') or \
+                (c_path[0] >= c'A' and c_path[0] <= c'Z'):
+            c_path += 1
+        if c_path[0] == c':' and c_path[1] == c'/' and c_path[2] == c'/':
+            return 0
+
+    # assume it's a relative path
+    return 1
+
+cdef object _encodeFilename(object filename):
+    u"""Return a filename as bytes (None and bytes pass through unchanged);
+    raises TypeError for anything that is not None, bytes or unicode."""
+    if filename is None:
+        return None
+    elif isinstance(filename, bytes):
+        return filename
+    elif isinstance(filename, unicode):
+        filename8 = (<unicode>filename).encode('utf8')
+        if _isFilePath(<unsigned char*>filename8):
+            try:
+                return python.PyUnicode_AsEncodedString(
+                    filename, _C_FILENAME_ENCODING, NULL)
+            except UnicodeEncodeError:
+                pass  # not representable in that encoding: fall back to UTF-8
+        return filename8
+    else:
+        raise TypeError("Argument must be string or unicode.")
+
+cdef object _decodeFilename(const_xmlChar* c_path):
+    u"""Decode a NUL-terminated C filename; its length comes from xmlStrlen().
+    """
+    return _decodeFilenameWithLength(c_path, tree.xmlStrlen(c_path))
+
+cdef object _decodeFilenameWithLength(const_xmlChar* c_path, size_t c_len):
+    u"""Decode c_len bytes of c_path into a unicode string, trying the
+    filename encoding (file paths only), then UTF-8, then latin-1."""
+    if _isFilePath(c_path):
+        try:
+            return python.PyUnicode_Decode(
+                <const_char*>c_path, c_len, _C_FILENAME_ENCODING, NULL)
+        except UnicodeDecodeError:
+            pass  # fall through to the UTF-8 attempt below
+    try:
+        return (<unsigned char*>c_path)[:c_len].decode('UTF-8')
+    except UnicodeDecodeError:
+        # this is a stupid fallback, but it might still work...
+        return (<unsigned char*>c_path)[:c_len].decode('latin-1', 'replace')
+
+cdef object _encodeFilenameUTF8(object filename):
+    u"""Recode filename as UTF-8 bytes (None passes through).  Bytes input is
+    tried as ASCII, then the filename encoding, then UTF-8; raises
+    UnicodeDecodeError if none fits, TypeError for other argument types."""
+    cdef char* c_filename
+    if filename is None:
+        return None
+    elif isinstance(filename, bytes):
+        if not check_string_utf8(<bytes>filename):
+            # plain ASCII!
+            return filename
+        c_filename = _cstr(<bytes>filename)
+        try:
+            # try to decode with default encoding
+            filename = python.PyUnicode_Decode(
+                c_filename, len(<bytes>filename),
+                _C_FILENAME_ENCODING, NULL)
+        except UnicodeDecodeError as decode_exc:
+            try:
+                # try if it's proper UTF-8
+                (<bytes>filename).decode('utf8')
+                return filename  # already valid UTF-8 bytes: return unchanged
+            except UnicodeDecodeError:
+                raise decode_exc # otherwise re-raise original exception
+    if isinstance(filename, unicode):  # unicode input, or bytes decoded above
+        return (<unicode>filename).encode('utf8')
+    else:
+        raise TypeError("Argument must be string or unicode.")
+
+cdef tuple _getNsTag(tag):
+    u"""Given a tag, return the tuple (namespace URI, tag name).
+    The namespace URI is None if none is provided, also for an empty '{}'.
+    """
+    return __getNsTag(tag, 0)
+
+cdef tuple _getNsTagWithEmptyNs(tag):
+    u"""Given a tag, return the tuple (namespace URI, tag name).  The
+    namespace URI is None if no namespace part is provided, or the empty
+    byte string if the namespace part is '{}'.
+    """
+    return __getNsTag(tag, 1)
+
+cdef tuple __getNsTag(tag, bint empty_ns):  # split '{ns}name' into (ns, name) bytes
+    cdef char* c_tag
+    cdef char* c_ns_end
+    cdef Py_ssize_t taglen
+    cdef Py_ssize_t nslen
+    cdef bytes ns = None
+    # _isString() is much faster than isinstance()
+    if not _isString(tag) and isinstance(tag, QName):
+        tag = (<QName>tag).text
+    tag = _utf8(tag)  # validates the input and yields UTF-8 bytes
+    c_tag = _cstr(tag)
+    if c_tag[0] == c'{':
+        c_tag += 1  # step over the opening brace
+        c_ns_end = cstring_h.strchr(c_tag, c'}')
+        if c_ns_end is NULL:
+            raise ValueError, u"Invalid tag name"
+        nslen  = c_ns_end - c_tag
+        taglen = python.PyBytes_GET_SIZE(tag) - nslen - 2  # minus ns and both braces
+        if taglen == 0:
+            raise ValueError, u"Empty tag name"
+        if nslen > 0:
+            ns = <bytes>c_tag[:nslen]
+        elif empty_ns:
+            ns = b''  # report '{}' as empty namespace instead of None
+        tag = <bytes>c_ns_end[1:taglen+1]  # everything after the closing brace
+    elif python.PyBytes_GET_SIZE(tag) == 0:
+        raise ValueError, u"Empty tag name"
+    return ns, tag
+
+cdef inline int _pyXmlNameIsValid(name_utf8):
+    return _xmlNameIsValid(_xcstr(name_utf8))  # Python-object front end
+
+cdef inline int _pyHtmlNameIsValid(name_utf8):
+    return _htmlNameIsValid(_xcstr(name_utf8))  # Python-object front end
+
+cdef inline int _xmlNameIsValid(const_xmlChar* c_name):
+    return tree.xmlValidateNCName(c_name, 0) == 0  # true when libxml2 returns 0
+
+cdef int _htmlNameIsValid(const_xmlChar* c_name):  # 1 if valid, else 0
+    if c_name is NULL or c_name[0] == c'\0':
+        return 0  # NULL and empty names are invalid
+    while c_name[0] != c'\0':
+        if c_name[0] in b'&<>/"\'\t\n\x0B\x0C\r ':
+            return 0  # markup characters, quotes and whitespace are rejected
+        c_name += 1
+    return 1
+
+cdef bint _characterReferenceIsValid(const_xmlChar* c_name):  # text after the '#'
+    cdef bint is_hex
+    if c_name[0] == c'x':
+        c_name += 1  # hexadecimal form: skip the lowercase 'x' marker
+        is_hex = 1
+    else:
+        is_hex = 0
+    if c_name[0] == c'\0':
+        return 0  # at least one digit is required
+    while c_name[0] != c'\0':
+        if c_name[0] < c'0' or c_name[0] > c'9':
+            if not is_hex:
+                return 0  # decimal form accepts 0-9 only
+            if not (c'a' <= c_name[0] <= c'f'):
+                if not (c'A' <= c_name[0] <= c'F'):
+                    return 0  # not a hex digit either
+        c_name += 1
+    return 1
+
+cdef int _tagValidOrRaise(tag_utf) except -1:
+    # Raise ValueError unless the UTF-8 encoded tag name is a valid XML name.
+    if _pyXmlNameIsValid(tag_utf):
+        return 0
+    raise ValueError(u"Invalid tag name %r" % (<bytes>tag_utf).decode('utf8'))
+
+cdef int _htmlTagValidOrRaise(tag_utf) except -1:
+    # Raise ValueError unless the UTF-8 encoded tag name is a valid HTML name.
+    if _pyHtmlNameIsValid(tag_utf):
+        return 0
+    raise ValueError(u"Invalid HTML tag name %r" % (<bytes>tag_utf).decode('utf8'))
+
+cdef int _attributeValidOrRaise(name_utf) except -1:
+    # Raise ValueError unless the UTF-8 encoded attribute name is a valid XML name.
+    if _pyXmlNameIsValid(name_utf):
+        return 0
+    raise ValueError(u"Invalid attribute name %r" % (<bytes>name_utf).decode('utf8'))
+
+cdef int _prefixValidOrRaise(tag_utf) except -1:
+    # Raise ValueError unless the UTF-8 encoded prefix is a valid XML name.
+    if _pyXmlNameIsValid(tag_utf):
+        return 0
+    raise ValueError(u"Invalid namespace prefix %r" % (<bytes>tag_utf).decode('utf8'))
+
+cdef int _uriValidOrRaise(uri_utf) except -1:
+    # Raise ValueError unless xmlParseURI() can parse the UTF-8 encoded URI.
+    cdef uri.xmlURI* c_parsed = uri.xmlParseURI(_cstr(uri_utf))
+    if c_parsed is not NULL:
+        uri.xmlFreeURI(c_parsed)  # only parsed for validation; release at once
+        return 0
+    raise ValueError(u"Invalid namespace URI %r" % (<bytes>uri_utf).decode('utf8'))
+
+cdef inline object _namespacedName(xmlNode* c_node):
+    return _namespacedNameFromNsName(_getNs(c_node), c_node.name)  # '{ns}name' or 'name'
+
+cdef object _namespacedNameFromNsName(const_xmlChar* href, const_xmlChar* name):
+    if href is NULL:
+        return funicode(name)  # no namespace: plain name
+    elif python.LXML_UNICODE_STRINGS and not python.IS_PYPY:
+        return python.PyUnicode_FromFormat("{%s}%s", href, name)
+    else:
+        s = python.PyBytes_FromFormat("{%s}%s", href, name)
+        if python.LXML_UNICODE_STRINGS or isutf8(_xcstr(s)):
+            return (<bytes>s).decode('utf8')
+        else:
+            return s  # pure ASCII stays a byte string
+
+cdef _getFilenameForFile(source):
+    u"""Given a Python File or Gzip object, give filename back.
+
+    Returns None if no filename can be determined.  Lookups are best effort:
+    ordinary errors are ignored, KeyboardInterrupt/SystemExit propagate.
+    """
+    # urllib2 provides a geturl() method
+    try:
+        return source.geturl()
+    except Exception:
+        pass
+    # file instances have a name attribute
+    try:
+        filename = source.name
+        if _isString(filename):
+            return os_path_abspath(filename)
+    except Exception:
+        pass
+    # gzip file instances have a filename attribute (before Py3k)
+    try:
+        filename = source.filename
+        if _isString(filename):
+            return os_path_abspath(filename)
+    except Exception:
+        pass
+    return None  # can't determine filename
diff --git a/lib/lxml/builder.py b/lib/lxml/builder.py
new file mode 100644
index 00000000..ad61a80e
--- /dev/null
+++ b/lib/lxml/builder.py
@@ -0,0 +1,238 @@
+#
+# Element generator factory by Fredrik Lundh.
+#
+# Source:
+#    http://online.effbot.org/2006_11_01_archive.htm#et-builder
+#    http://effbot.python-hosting.com/file/stuff/sandbox/elementlib/builder.py
+#
+# --------------------------------------------------------------------
+# The ElementTree toolkit is
+#
+# Copyright (c) 1999-2004 by Fredrik Lundh
+#
+# By obtaining, using, and/or copying this software and/or its
+# associated documentation, you agree that you have read, understood,
+# and will comply with the following terms and conditions:
+#
+# Permission to use, copy, modify, and distribute this software and
+# its associated documentation for any purpose and without fee is
+# hereby granted, provided that the above copyright notice appears in
+# all copies, and that both that copyright notice and this permission
+# notice appear in supporting documentation, and that the name of
+# Secret Labs AB or the author not be used in advertising or publicity
+# pertaining to distribution of the software without specific, written
+# prior permission.
+#
+# SECRET LABS AB AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH REGARD
+# TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANT-
+# ABILITY AND FITNESS.  IN NO EVENT SHALL SECRET LABS AB OR THE AUTHOR
+# BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY
+# DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,
+# WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
+# ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE
+# OF THIS SOFTWARE.
+# --------------------------------------------------------------------
+
+"""
+The ``E`` Element factory for generating XML documents.
+"""
+
+import lxml.etree as ET
+
+try:
+    from functools import partial
+except ImportError:
+    # fake it for pre-2.5 releases; only the one-argument form used below
+    def partial(func, tag):
+        return lambda *args, **kwargs: func(tag, *args, **kwargs)
+
+try:
+    callable
+except NameError:
+    # Python 3: no callable() builtin available here, test for __call__ instead
+    def callable(f):
+        return hasattr(f, '__call__')
+
+try:
+    basestring
+except NameError:
+    basestring = str  # name is undefined here: fall back to str
+
+try:
+    unicode
+except NameError:
+    unicode = str  # name is undefined here: fall back to str
+
+
+class ElementMaker(object):
+    """Element generator factory.
+
+    Unlike the ordinary Element factory, the E factory allows you to pass in
+    more than just a tag and some optional attributes; you can also pass in
+    text and other elements.  The text is added as either text or tail
+    attributes, and elements are inserted at the right spot.  Some small
+    examples::
+
+        >>> from lxml import etree as ET
+        >>> from lxml.builder import E
+
+        >>> ET.tostring(E("tag"))
+        '<tag/>'
+        >>> ET.tostring(E("tag", "text"))
+        '<tag>text</tag>'
+        >>> ET.tostring(E("tag", "text", key="value"))
+        '<tag key="value">text</tag>'
+        >>> ET.tostring(E("tag", E("subtag", "text"), "tail"))
+        '<tag><subtag>text</subtag>tail</tag>'
+
+    For simple tags, the factory also allows you to write ``E.tag(...)`` instead
+    of ``E('tag', ...)``::
+
+        >>> ET.tostring(E.tag())
+        '<tag/>'
+        >>> ET.tostring(E.tag("text"))
+        '<tag>text</tag>'
+        >>> ET.tostring(E.tag(E.subtag("text"), "tail"))
+        '<tag><subtag>text</subtag>tail</tag>'
+
+    Here's a somewhat larger example; this shows how to generate HTML
+    documents, using a mix of prepared factory functions for inline elements,
+    nested ``E.tag`` calls, and embedded XHTML fragments::
+
+        # some common inline elements
+        A = E.a
+        I = E.i
+        B = E.b
+
+        def CLASS(v):
+            # helper function, 'class' is a reserved word
+            return {'class': v}
+
+        page = (
+            E.html(
+                E.head(
+                    E.title("This is a sample document")
+                ),
+                E.body(
+                    E.h1("Hello!", CLASS("title")),
+                    E.p("This is a paragraph with ", B("bold"), " text in it!"),
+                    E.p("This is another paragraph, with a ",
+                        A("link", href="http://www.python.org"), "."),
+                    E.p("Here are some reserved characters: <spam&egg>."),
+                    ET.XML("<p>And finally, here is an embedded XHTML fragment.</p>"),
+                )
+            )
+        )
+
+        print(ET.tostring(page))
+
+    Here's a prettyprinted version of the output from the above script::
+
+        <html>
+          <head>
+            <title>This is a sample document</title>
+          </head>
+          <body>
+            <h1 class="title">Hello!</h1>
+            <p>This is a paragraph with <b>bold</b> text in it!</p>
+            <p>This is another paragraph, with a <a href="http://www.python.org">link</a>.</p>
+            <p>Here are some reserved characters: &lt;spam&amp;egg&gt;.</p>
+            <p>And finally, here is an embedded XHTML fragment.</p>
+          </body>
+        </html>
+
+    For namespace support, you can pass a namespace map (``nsmap``)
+    and/or a specific target ``namespace`` to the ElementMaker class::
+
+        >>> E = ElementMaker(namespace="http://my.ns/")
+        >>> print(ET.tostring( E.test ))
+        <test xmlns="http://my.ns/"/>
+
+        >>> E = ElementMaker(namespace="http://my.ns/", nsmap={'p':'http://my.ns/'})
+        >>> print(ET.tostring( E.test ))
+        <p:test xmlns:p="http://my.ns/"/>
+    """
+    # typemap maps a Python type to a handler called as handler(elem, item)
+    def __init__(self, typemap=None,
+                 namespace=None, nsmap=None, makeelement=None):
+        if namespace is not None:
+            self._namespace = '{' + namespace + '}'  # Clark-notation tag prefix
+        else:
+            self._namespace = None
+
+        if nsmap:
+            self._nsmap = dict(nsmap)  # private copy of the caller's mapping
+        else:
+            self._nsmap = None
+
+        if makeelement is not None:
+            assert callable(makeelement)
+            self._makeelement = makeelement
+        else:
+            self._makeelement = ET.Element  # default element factory
+
+        # initialize type map for this element factory
+        # (a copy is used, so the defaults added below never touch the caller's dict)
+        if typemap:
+            typemap = typemap.copy()
+        else:
+            typemap = {}
+        # string handler: extend the tail of the last child, or the text if childless
+        def add_text(elem, item):
+            try:
+                elem[-1].tail = (elem[-1].tail or "") + item
+            except IndexError:
+                elem.text = (elem.text or "") + item
+        if str not in typemap:
+            typemap[str] = add_text
+        if unicode not in typemap:
+            typemap[unicode] = add_text
+        # dict handler: set attributes; non-string values go through their type handler
+        def add_dict(elem, item):
+            attrib = elem.attrib
+            for k, v in item.items():
+                if isinstance(v, basestring):
+                    attrib[k] = v
+                else:
+                    attrib[k] = typemap[type(v)](None, v)  # handler result is the value
+        if dict not in typemap:
+            typemap[dict] = add_dict
+
+        self._typemap = typemap
+    # Build element ``tag``: keyword arguments become attributes, children are added
+    def __call__(self, tag, *children, **attrib):
+        get = self._typemap.get
+        # tags already in '{ns}name' form keep their own namespace
+        if self._namespace is not None and tag[0] != '{':
+            tag = self._namespace + tag
+        elem = self._makeelement(tag, nsmap=self._nsmap)
+        if attrib:
+            get(dict)(elem, attrib)
+
+        for item in children:
+            if callable(item):
+                item = item()  # e.g. a bare ``E.tag`` partial: call it to get the element
+            t = get(type(item))
+            if t is None:
+                if ET.iselement(item):
+                    elem.append(item)
+                    continue
+                for basetype in type(item).__mro__:
+                    # See if the typemap knows of any of this type's bases.
+                    t = get(basetype)
+                    if t is not None:
+                        break
+                else:
+                    raise TypeError("bad argument type: %s(%r)" %
+                                    (type(item).__name__, item))
+            v = t(elem, item)
+            if v:
+                get(type(v))(elem, v)  # a truthy handler result is dispatched once more
+
+        return elem
+    # E.tag(...) shorthand: attributes not found otherwise yield a factory for that tag
+    def __getattr__(self, tag):
+        return partial(self, tag)
+
+# create the module-level factory object using the default constructor arguments
+E = ElementMaker()
diff --git a/lib/lxml/classlookup.pxi b/lib/lxml/classlookup.pxi
new file mode 100644
index 00000000..82740a51
--- /dev/null
+++ b/lib/lxml/classlookup.pxi
@@ -0,0 +1,565 @@
+# Configurable Element class lookup
+
+################################################################################
+# Custom Element classes
+
+cdef public class ElementBase(_Element) [ type LxmlElementBaseType,
+                                          object LxmlElementBase ]:
+    u"""ElementBase(*children, attrib=None, nsmap=None, **_extra)
+
+    The public Element class.  All custom Element classes must inherit
+    from this one.  To create an Element, use the `Element()` factory.
+
+    BIG FAT WARNING: Subclasses *must not* override __init__ or
+    __new__ as it is absolutely undefined when these objects will be
+    created or destroyed.  All persistent state of Elements must be
+    stored in the underlying XML.  If you really need to initialize
+    the object after creation, you can implement an ``_init(self)``
+    method that will be called directly after object creation.
+
+    Subclasses of this class can be instantiated to create a new
+    Element.  By default, the tag name will be the class name and the
+    namespace will be empty.  You can modify this with the following
+    class attributes:
+
+    * TAG - the tag name, possibly containing a namespace in Clark
+      notation
+
+    * NAMESPACE - the default namespace URI, unless provided as part
+      of the TAG attribute.
+
+    * HTML - flag if the class is an HTML tag, as opposed to an XML
+      tag.  This only applies to un-namespaced tags and defaults to
+      false (i.e. XML).
+
+    * PARSER - the parser that provides the configuration for the
+      newly created document.  Providing an HTML parser here will
+      default to creating an HTML element.
+
+    In user code, the latter three are commonly inherited in class
+    hierarchies that implement a common namespace.
+    """
+    def __init__(self, *children, attrib=None, nsmap=None, **_extra):
+        u"""ElementBase(*children, attrib=None, nsmap=None, **_extra)
+        """
+        cdef bint is_html = 0
+        cdef _BaseParser parser
+        cdef _Element last_child
+        # don't use normal attribute access as it might be overridden
+        _getattr = object.__getattribute__
+        try:
+            namespace = _utf8(_getattr(self, 'NAMESPACE'))
+        except AttributeError:
+            namespace = None
+        try:
+            ns, tag = _getNsTag(_getattr(self, 'TAG'))
+            if ns is not None:
+                namespace = ns  # a namespace given in TAG wins over NAMESPACE
+        except AttributeError:
+            tag = _utf8(_getattr(_getattr(self, '__class__'), '__name__'))
+            if b'.' in tag:
+                tag = tag.split(b'.')[-1]  # keep only the last dotted component
+        try:
+            parser = _getattr(self, 'PARSER')
+        except AttributeError:
+            parser = None
+            for child in children:  # borrow the parser of the first Element child
+                if isinstance(child, _Element):
+                    parser = (<_Element>child)._doc._parser
+                    break
+        if isinstance(parser, HTMLParser):
+            is_html = 1
+        if namespace is None:  # the HTML flag is only read for un-namespaced tags
+            try:
+                is_html = _getattr(self, 'HTML')
+            except AttributeError:
+                pass
+        _initNewElement(self, is_html, tag, namespace, parser,
+                        attrib, nsmap, _extra)
+        last_child = None
+        for child in children:
+            if _isString(child):
+                if last_child is None:  # no child element yet: extend own text
+                    _setNodeText(self._c_node,
+                                 (_collectText(self._c_node.children) or '') + child)
+                else:  # otherwise extend the tail of the last child added
+                    _setTailText(last_child._c_node,
+                                 (_collectText(last_child._c_node.next) or '') + child)
+            elif isinstance(child, _Element):
+                last_child = child
+                _appendChild(self, last_child)
+            elif isinstance(child, type) and issubclass(child, ElementBase):
+                last_child = child()  # a bare ElementBase subclass is instantiated
+                _appendChild(self, last_child)
+            else:
+                raise TypeError, "Invalid child type: %r" % type(child)
+
+cdef class CommentBase(_Comment):
+    u"""All custom Comment classes must inherit from this one.
+
+    To create an XML Comment instance, use the ``Comment()`` factory.
+
+    Subclasses *must not* override __init__ or __new__ as it is
+    absolutely undefined when these objects will be created or
+    destroyed.  All persistent state of Comments must be stored in the
+    underlying XML.  If you really need to initialize the object after
+    creation, you can implement an ``_init(self)`` method that will be
+    called after object creation.
+    """
+    def __init__(self, text):
+        # copied from Comment() factory
+        cdef _Document doc
+        cdef xmlDoc*   c_doc
+        if text is None:
+            text = b''  # None means an empty comment
+        else:
+            text = _utf8(text)
+        c_doc = _newXMLDoc()  # each instance gets a fresh document of its own
+        doc = _documentFactory(c_doc, None)
+        self._c_node = _createComment(c_doc, _xcstr(text))
+        if self._c_node is NULL:
+            raise MemoryError()
+        tree.xmlAddChild(<xmlNode*>c_doc, self._c_node)  # attach node to the document
+        _registerProxy(self, doc, self._c_node)
+        self._init()  # post-creation hook described in the class docstring
+
+cdef class PIBase(_ProcessingInstruction):
+    u"""All custom Processing Instruction classes must inherit from this one.
+
+    To create an XML ProcessingInstruction instance, use the ``PI()``
+    factory.
+
+    Subclasses *must not* override __init__ or __new__ as it is
+    absolutely undefined when these objects will be created or
+    destroyed.  All persistent state of PIs must be stored in the
+    underlying XML.  If you really need to initialize the object after
+    creation, you can implement an ``_init(self)`` method that will be
+    called after object creation.
+    """
+    def __init__(self, target, text=None):
+        # copied from PI() factory
+        cdef _Document doc
+        cdef xmlDoc*   c_doc
+        target = _utf8(target)
+        if text is None:
+            text = b''  # None means no PI content
+        else:
+            text = _utf8(text)
+        c_doc = _newXMLDoc()  # each instance gets a fresh document of its own
+        doc = _documentFactory(c_doc, None)
+        self._c_node = _createPI(c_doc, _xcstr(target), _xcstr(text))
+        if self._c_node is NULL:
+            raise MemoryError()
+        tree.xmlAddChild(<xmlNode*>c_doc, self._c_node)  # attach node to the document
+        _registerProxy(self, doc, self._c_node)
+        self._init()  # post-creation hook described in the class docstring
+
+cdef class EntityBase(_Entity):
+    u"""All custom Entity classes must inherit from this one.
+
+    To create an XML Entity instance, use the ``Entity()`` factory.
+
+    Subclasses *must not* override __init__ or __new__ as it is
+    absolutely undefined when these objects will be created or
+    destroyed.  All persistent state of Entities must be stored in the
+    underlying XML.  If you really need to initialize the object after
+    creation, you can implement an ``_init(self)`` method that will be
+    called after object creation.
+    """
+    def __init__(self, name):
+        cdef _Document doc
+        cdef xmlDoc*   c_doc
+        name_utf = _utf8(name)
+        c_name = _xcstr(name_utf)
+        if c_name[0] == c'#':  # character reference: validate what follows the '#'
+            if not _characterReferenceIsValid(c_name + 1):
+                raise ValueError, u"Invalid character reference: '%s'" % name
+        elif not _xmlNameIsValid(c_name):  # named entity: must be a valid XML name
+            raise ValueError, u"Invalid entity reference: '%s'" % name
+        c_doc = _newXMLDoc()  # each instance gets a fresh document of its own
+        doc = _documentFactory(c_doc, None)
+        self._c_node = _createEntity(c_doc, c_name)
+        if self._c_node is NULL:
+            raise MemoryError()
+        tree.xmlAddChild(<xmlNode*>c_doc, self._c_node)  # attach node to the document
+        _registerProxy(self, doc, self._c_node)
+        self._init()  # post-creation hook described in the class docstring
+
+
+cdef int _validateNodeClass(xmlNode* c_node, cls) except -1:
+    # Raise TypeError unless cls subclasses the base class for c_node's node type.
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        expected = ElementBase
+    elif c_node.type == tree.XML_COMMENT_NODE:
+        expected = CommentBase
+    elif c_node.type == tree.XML_ENTITY_REF_NODE:
+        expected = EntityBase
+    elif c_node.type == tree.XML_PI_NODE:
+        expected = PIBase
+    else:
+        assert 0, u"Unknown node type: %s" % c_node.type
+    # name the classes themselves: type(expected)/type(cls) only give the metaclass
+    if not (isinstance(cls, type) and issubclass(cls, expected)):
+        raise TypeError("result of class lookup must be subclass of %s, got %s"
+                        % (expected, cls if isinstance(cls, type) else type(cls)))
+    return 0
+
+
+################################################################################
+# Element class lookup
+
+ctypedef public object (*_element_class_lookup_function)(object, _Document, xmlNode*)
+
+# base class that stores the C lookup function of an element class lookup scheme
+cdef public class ElementClassLookup [ type LxmlElementClassLookupType,
+                                       object LxmlElementClassLookup ]:
+    u"""ElementClassLookup(self)
+    Superclass of Element class lookups.
+    """
+    cdef _element_class_lookup_function _lookup_function  # C function pointer
+    def __cinit__(self):
+        self._lookup_function = NULL # use default lookup
+
+cdef public class FallbackElementClassLookup(ElementClassLookup) \
+         [ type LxmlFallbackElementClassLookupType,
+           object LxmlFallbackElementClassLookup ]:
+    u"""FallbackElementClassLookup(self, fallback=None)
+
+    Superclass of Element class lookups with additional fallback.
+    """
+    cdef readonly ElementClassLookup fallback  # lookup object, readable from Python
+    cdef _element_class_lookup_function _fallback_function  # its C lookup function
+    def __cinit__(self):
+        # fall back to default lookup
+        self._fallback_function = _lookupDefaultElementClass
+
+    def __init__(self, ElementClassLookup fallback=None):
+        if fallback is not None:
+            self._setFallback(fallback)
+        else:
+            self._fallback_function = _lookupDefaultElementClass
+
+    cdef void _setFallback(self, ElementClassLookup lookup):
+        u"""Sets the fallback scheme for this lookup method.
+        """
+        self.fallback = lookup
+        self._fallback_function = lookup._lookup_function
+        if self._fallback_function is NULL:  # lookup has no function of its own
+            self._fallback_function = _lookupDefaultElementClass
+
+    def set_fallback(self, ElementClassLookup lookup not None):
+        u"""set_fallback(self, lookup)
+
+        Sets the fallback scheme for this lookup method.
+        """
+        self._setFallback(lookup)
+
+cdef inline object _callLookupFallback(FallbackElementClassLookup lookup,
+                                       _Document doc, xmlNode* c_node):
+    return lookup._fallback_function(lookup.fallback, doc, c_node)  # the stored fallback object is passed on as 'state'
+
+
+################################################################################
+# default lookup scheme
+
+cdef class ElementDefaultClassLookup(ElementClassLookup):
+    u"""ElementDefaultClassLookup(self, element=None, comment=None, pi=None, entity=None)
+    Lookup scheme that returns one fixed class per node type, the default
+    classes unless others are configured.
+
+    Use the keyword arguments ``element``, ``comment``, ``pi`` and
+    ``entity`` to replace the class returned for the respective node type.
+    """
+    cdef readonly object element_class
+    cdef readonly object comment_class
+    cdef readonly object pi_class
+    cdef readonly object entity_class
+    def __cinit__(self):
+        self._lookup_function = _lookupDefaultElementClass
+
+    def __init__(self, element=None, comment=None, pi=None, entity=None):
+        # elements: default class unless a valid subclass was passed
+        if element is None:
+            element = _Element
+        elif not issubclass(element, ElementBase):
+            raise TypeError, u"element class must be subclass of ElementBase"
+        self.element_class = element
+
+        # comments
+        if comment is None:
+            comment = _Comment
+        elif not issubclass(comment, CommentBase):
+            raise TypeError, u"comment class must be subclass of CommentBase"
+        self.comment_class = comment
+
+        # entity references
+        if entity is None:
+            entity = _Entity
+        elif not issubclass(entity, EntityBase):
+            raise TypeError, u"Entity class must be subclass of EntityBase"
+        self.entity_class = entity
+
+        # PIs: None is stored as is, the lookup function treats it as
+        # "no class configured" and chooses the PI class itself
+        if pi is not None and not issubclass(pi, PIBase):
+            raise TypeError, u"PI class must be subclass of PIBase"
+        # either a PIBase subclass or None at this point
+        self.pi_class = pi
+
+cdef object _lookupDefaultElementClass(state, _Document _doc, xmlNode* c_node):
+    u"Lookup function that returns the default class for a node, honouring the classes configured on 'state'."
+    # 'state' is expected to be either None (built-in classes only) or
+    # the ElementDefaultClassLookup instance that holds the configured
+    # classes
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        if state is None:
+            return _Element
+        return (<ElementDefaultClassLookup>state).element_class
+    elif c_node.type == tree.XML_COMMENT_NODE:
+        if state is None:
+            return _Comment
+        return (<ElementDefaultClassLookup>state).comment_class
+    elif c_node.type == tree.XML_ENTITY_REF_NODE:
+        if state is None:
+            return _Entity
+        return (<ElementDefaultClassLookup>state).entity_class
+    elif c_node.type == tree.XML_PI_NODE:
+        if state is not None and (<ElementDefaultClassLookup>state).pi_class is not None:
+            return (<ElementDefaultClassLookup>state).pi_class
+        # no PI class configured: an xml-stylesheet PI that mentions an
+        # XSLT content type gets the XSLT specific PI class
+        if c_node.name is not NULL and c_node.content is not NULL and \
+               tree.xmlStrcmp(c_node.name, <unsigned char*>"xml-stylesheet") == 0:
+            if tree.xmlStrstr(c_node.content, <unsigned char*>"text/xsl") is not NULL or \
+                   tree.xmlStrstr(c_node.content, <unsigned char*>"text/xml") is not NULL:
+                return _XSLTProcessingInstruction
+        return _ProcessingInstruction
+    else:
+        assert 0, u"Unknown node type: %s" % c_node.type
+
+
+################################################################################
+# attribute based lookup scheme
+
+cdef class AttributeBasedElementClassLookup(FallbackElementClassLookup):
+    u"""AttributeBasedElementClassLookup(self, attribute_name, class_mapping, fallback=None)
+    Checks an attribute of an Element and looks up the value in a
+    class dictionary.
+
+    Arguments:
+      - attribute name - '{ns}name' style string
+      - class mapping  - Python dict mapping attribute values to Element classes
+      - fallback       - optional fallback lookup mechanism
+
+    A None key in the class mapping will be checked if the attribute is
+    missing.
+    """
+    cdef object _class_mapping  # dict copy of the mapping passed to __init__()
+    cdef tuple _pytag  # (ns, name) pair returned by _getNsTag()
+    cdef const_xmlChar* _c_ns  # NULL when the attribute name has no namespace
+    cdef const_xmlChar* _c_name
+    def __cinit__(self):
+        self._lookup_function = _attribute_class_lookup
+
+    def __init__(self, attribute_name, class_mapping,
+                 ElementClassLookup fallback=None):
+        self._pytag = _getNsTag(attribute_name)
+        ns, name = self._pytag
+        if ns is None:
+            self._c_ns = NULL
+        else:
+            self._c_ns = _xcstr(ns)  # presumably points into 'ns', which self._pytag keeps referenced - TODO confirm
+        self._c_name = _xcstr(name)
+        self._class_mapping = dict(class_mapping)
+
+        FallbackElementClassLookup.__init__(self, fallback)
+
+cdef object _attribute_class_lookup(state, _Document doc, xmlNode* c_node):
+    cdef AttributeBasedElementClassLookup lookup
+    cdef python.PyObject* dict_result
+
+    lookup = <AttributeBasedElementClassLookup>state
+    if c_node.type == tree.XML_ELEMENT_NODE:  # only elements are looked up by attribute
+        value = _attributeValueFromNsName(
+            c_node, lookup._c_ns, lookup._c_name)
+        dict_result = python.PyDict_GetItem(lookup._class_mapping, value)  # NULL if 'value' is not a key of the mapping
+        if dict_result is not NULL:
+            cls = <object>dict_result
+            _validateNodeClass(c_node, cls)  # raises if the mapped class does not fit the node type
+            return cls
+    return _callLookupFallback(lookup, doc, c_node)  # other node types and unmapped values use the fallback
+
+
+################################################################################
+#  per-parser lookup scheme
+
+cdef class ParserBasedElementClassLookup(FallbackElementClassLookup):
+    u"""ParserBasedElementClassLookup(self, fallback=None)
+    Element class lookup that delegates to the class lookup set on the document's parser.
+    """
+    def __cinit__(self):
+        self._lookup_function = _parser_class_lookup  # uses the fallback if the parser has no class lookup
+
+cdef object _parser_class_lookup(state, _Document doc, xmlNode* c_node):
+    if doc._parser._class_lookup is None:
+        return _callLookupFallback(<FallbackElementClassLookup>state, doc, c_node)
+    return doc._parser._class_lookup._lookup_function(
+        doc._parser._class_lookup, doc, c_node)
+
+
+################################################################################
+#  custom class lookup based on node type, namespace, name
+
+cdef class CustomElementClassLookup(FallbackElementClassLookup):
+    u"""CustomElementClassLookup(self, fallback=None)
+    Element class lookup based on a subclass method.
+
+    You can inherit from this class and override the method::
+
+        lookup(self, type, doc, namespace, name)
+
+    to look up the element class for a node. Arguments of the method:
+    * type:      one of 'element', 'comment', 'PI', 'entity'
+    * doc:       document that the node is in
+    * namespace: namespace URI of the node (or None for comments/PIs/entities)
+    * name:      name of the element/entity, None for comments, target for PIs
+
+    If you return None from this method, the fallback will be called.
+    """
+    def __cinit__(self):
+        self._lookup_function = _custom_class_lookup
+
+    def lookup(self, type, doc, namespace, name):
+        u"lookup(self, type, doc, namespace, name)"
+        return None  # default implementation makes no decision, so the fallback is used
+
+cdef object _custom_class_lookup(state, _Document doc, xmlNode* c_node):
+    u"Lookup function that asks the lookup() method of the CustomElementClassLookup passed as state."
+    cdef CustomElementClassLookup lookup = <CustomElementClassLookup>state
+
+    # translate the libxml2 node type into the type name that lookup()
+    # receives; any other node type is reported as an element
+    element_type = u"element"
+    if c_node.type == tree.XML_COMMENT_NODE:
+        element_type = u"comment"
+    elif c_node.type == tree.XML_PI_NODE:
+        element_type = u"PI"
+    elif c_node.type == tree.XML_ENTITY_REF_NODE:
+        element_type = u"entity"
+
+    name = funicode(c_node.name) if c_node.name is not NULL else None
+    c_str = tree._getNs(c_node)
+    if c_str is NULL:
+        ns = None
+    else:
+        ns = funicode(c_str)
+
+    cls = lookup.lookup(element_type, doc, ns, name)
+    if cls is None:
+        # lookup() made no decision
+        return _callLookupFallback(lookup, doc, c_node)
+    _validateNodeClass(c_node, cls)
+    return cls
+
+
+################################################################################
+# read-only tree based class lookup
+
+cdef class PythonElementClassLookup(FallbackElementClassLookup):
+    u"""PythonElementClassLookup(self, fallback=None)
+    Element class lookup based on a subclass method.
+
+    This class lookup scheme allows access to the entire XML tree in
+    read-only mode.  To use it, re-implement the ``lookup(self, doc,
+    root)`` method in a subclass::
+
+        from lxml import etree, pyclasslookup
+
+        class MyElementClass(etree.ElementBase):
+            honkey = True
+
+        class MyLookup(pyclasslookup.PythonElementClassLookup):
+            def lookup(self, doc, root):
+                if root.tag == "sometag":
+                    return MyElementClass
+                else:
+                    for child in root:
+                        if child.tag == "someothertag":
+                            return MyElementClass
+                # delegate to default
+                return None
+
+    If you return None from this method, the fallback will be called.
+
+    The first argument is the opaque document instance that contains
+    the Element.  The second argument is a lightweight Element proxy
+    implementation that is only valid during the lookup.  Do not try
+    to keep a reference to it.  Once the lookup is done, the proxy
+    will be invalid.
+
+    Also, you cannot wrap such a read-only Element in an ElementTree,
+    and you must take care not to keep a reference to them outside of
+    the `lookup()` method.
+
+    Note that the API of the Element objects is not complete.  It is
+    purely read-only and does not support all features of the normal
+    `lxml.etree` API (such as XPath, extended slicing or some
+    iteration methods).
+
+    See http://codespeak.net/lxml/element_classes.html
+    """
+    def __cinit__(self):
+        self._lookup_function = _python_class_lookup  # C function that calls lookup() below
+
+    def lookup(self, doc, element):
+        u"""lookup(self, doc, element)
+
+        Override this method to implement your own lookup scheme; return None to use the fallback.
+        """
+        return None  # default implementation makes no decision
+
+cdef object _python_class_lookup(state, _Document doc, tree.xmlNode* c_node):
+    u"Lookup function that calls lookup() of the PythonElementClassLookup passed as state with a read-only proxy."
+    cdef PythonElementClassLookup lookup = <PythonElementClassLookup>state
+    cdef _ReadOnlyElementProxy proxy = _newReadOnlyProxy(None, c_node)
+    try:
+        cls = lookup.lookup(doc, proxy)
+    finally:
+        # also release the proxy if lookup() raised: it is documented as valid only during the lookup
+        _freeReadOnlyProxies(proxy)
+    if cls is not None:
+        _validateNodeClass(c_node, cls)
+        return cls
+    return _callLookupFallback(lookup, doc, c_node)
+
+################################################################################
+# Global setup
+
+cdef _element_class_lookup_function LOOKUP_ELEMENT_CLASS  # module-wide lookup function, set below
+cdef object ELEMENT_CLASS_LOOKUP_STATE  # state object stored together with LOOKUP_ELEMENT_CLASS
+
+cdef void _setElementClassLookupFunction(
+    _element_class_lookup_function function, object state):
+    global LOOKUP_ELEMENT_CLASS, ELEMENT_CLASS_LOOKUP_STATE
+    if function is NULL:  # NULL selects the module default lookup and its function
+        state    = DEFAULT_ELEMENT_CLASS_LOOKUP
+        function = DEFAULT_ELEMENT_CLASS_LOOKUP._lookup_function
+
+    ELEMENT_CLASS_LOOKUP_STATE = state
+    LOOKUP_ELEMENT_CLASS = function
+
+def set_element_class_lookup(ElementClassLookup lookup = None):
+    u"""set_element_class_lookup(lookup = None)
+
+    Install the lookup scheme that is used globally for Element classes.
+    """
+    if lookup is not None and lookup._lookup_function is not NULL:
+        _setElementClassLookupFunction(lookup._lookup_function, lookup)
+    else:
+        _setElementClassLookupFunction(NULL, None)
+
+# default setup: delegate the class lookup to the parser of each document
+cdef ParserBasedElementClassLookup DEFAULT_ELEMENT_CLASS_LOOKUP
+DEFAULT_ELEMENT_CLASS_LOOKUP = ParserBasedElementClassLookup()
+
+set_element_class_lookup(DEFAULT_ELEMENT_CLASS_LOOKUP)
diff --git a/lib/lxml/cleanup.pxi b/lib/lxml/cleanup.pxi
new file mode 100644
index 00000000..5388ffb6
--- /dev/null
+++ b/lib/lxml/cleanup.pxi
@@ -0,0 +1,210 @@
+# functions for tree cleanup and removing elements from subtrees
+
+def cleanup_namespaces(tree_or_element):
+    u"""cleanup_namespaces(tree_or_element)
+
+    Drop every namespace declaration in the subtree that none of its
+    elements or attributes makes use of.
+    """
+    cdef _Element root = _rootNodeOrRaise(tree_or_element)
+    # the clean-up works directly on the C node of the root element
+    _removeUnusedNamespaceDeclarations(root._c_node)
+
+def strip_attributes(tree_or_element, *attribute_names):
+    u"""strip_attributes(tree_or_element, *attribute_names)
+
+    Remove the attributes with the given names from an Element (or
+    ElementTree) and from all of its descendants.
+
+    Attribute names can contain wildcards as in `_Element.iter`.
+
+    Example usage::
+
+        strip_attributes(root_element,
+                         'simpleattr',
+                         '{http://some/ns}attrname',
+                         '{http://other/ns}*')
+    """
+    cdef _MultiTagMatcher matcher
+    # the root node is resolved before the names are looked at, exactly
+    # one call to _rootNodeOrRaise() happens for every input
+    cdef _Element element = _rootNodeOrRaise(tree_or_element)
+
+    if attribute_names:
+        matcher = _MultiTagMatcher(attribute_names)
+        matcher.cacheTags(element._doc)
+        # skip the tree walk when the matcher reports that it rejects
+        # all attributes
+        if not matcher.rejectsAllAttributes():
+            _strip_attributes(element._c_node, matcher)
+
+cdef _strip_attributes(xmlNode* c_node, _MultiTagMatcher matcher):
+    cdef xmlAttr* c_attr
+    cdef xmlAttr* c_next_attr
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)  # opens the traversal that END_FOR_EACH_ELEMENT_FROM closes below
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        c_attr = c_node.properties
+        while c_attr is not NULL:
+            c_next_attr = c_attr.next  # fetch the successor before c_attr may be removed
+            if matcher.matchesAttribute(c_attr):
+                tree.xmlRemoveProp(c_attr)
+            c_attr = c_next_attr
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+
+def strip_elements(tree_or_element, *tag_names, bint with_tail=True):
+    u"""strip_elements(tree_or_element, *tag_names, with_tail=True)
+
+    Delete all elements with the provided tag names from a tree or
+    subtree.  This will remove the elements and their entire subtree,
+    including all their attributes, text content and descendants.  It
+    will also remove the tail text of the element unless you
+    explicitly set the ``with_tail`` keyword argument option to False.
+
+    Tag names can contain wildcards as in `_Element.iter`.
+
+    Note that this will not delete the element (or ElementTree root
+    element) that you passed even if it matches.  It will only treat
+    its descendants.  If you want to include the root element, check
+    its tag name directly before even calling this function.
+
+    Example usage::
+
+        strip_elements(some_element,
+            'simpletagname',             # non-namespaced tag
+            '{http://some/ns}tagname',   # namespaced tag
+            '{http://some/other/ns}*',   # any tag from a namespace
+            lxml.etree.Comment           # comments
+            )
+    """
+    cdef _MultiTagMatcher matcher
+    cdef _Element element
+    cdef _Document doc
+
+    # resolve document and root node up front, so that both calls run
+    # even when no tag names were passed
+    doc = _documentOrRaise(tree_or_element)
+    element = _rootNodeOrRaise(tree_or_element)
+    if not tag_names:
+        return
+
+    matcher = _MultiTagMatcher(tag_names)
+    matcher.cacheTags(doc)
+    if matcher.rejectsAll():
+        return
+
+    if isinstance(tree_or_element, _ElementTree):
+        # include PIs and comments next to the root node
+        if matcher.matchesType(tree.XML_COMMENT_NODE):
+            _removeSiblings(element._c_node, tree.XML_COMMENT_NODE, with_tail)
+        if matcher.matchesType(tree.XML_PI_NODE):
+            _removeSiblings(element._c_node, tree.XML_PI_NODE, with_tail)
+    # the root element itself is kept, only nodes below it are removed
+    # (_strip_elements() inspects the children of each element)
+    _strip_elements(doc, element._c_node, matcher, with_tail)
+
+cdef _strip_elements(_Document doc, xmlNode* c_node, _MultiTagMatcher matcher,
+                     bint with_tail):
+    cdef xmlNode* c_child
+    cdef xmlNode* c_next
+
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)  # opens the traversal that END_FOR_EACH_ELEMENT_FROM closes below
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        # we run through the children here to prevent any problems
+        # with the tree iteration which would occur if we unlinked the
+        # c_node itself
+        c_child = _findChildForwards(c_node, 0)
+        while c_child is not NULL:
+            c_next = _nextElement(c_child)  # remember the successor before c_child is unlinked
+            if matcher.matches(c_child):
+                if c_child.type == tree.XML_ELEMENT_NODE:
+                    if not with_tail:
+                        tree.xmlUnlinkNode(c_child)  # presumably detached first so that _removeNode() leaves the tail text in place - TODO confirm
+                    _removeNode(doc, c_child)
+                else:
+                    if with_tail:
+                        _removeText(c_child.next)  # text that follows the matched non-element node
+                    tree.xmlUnlinkNode(c_child)
+                    attemptDeallocation(c_child)
+            c_child = c_next
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+
+
+def strip_tags(tree_or_element, *tag_names):
+    u"""strip_tags(tree_or_element, *tag_names)
+
+    Delete all elements with the provided tag names from a tree or
+    subtree.  This will remove the elements and their attributes, but
+    *not* their text/tail content or descendants.  Instead, it will
+    merge the text content and children of the element into its
+    parent.
+
+    Tag names can contain wildcards as in `_Element.iter`.
+
+    Note that this will not delete the element (or ElementTree root
+    element) that you passed even if it matches.  It will only treat
+    its descendants.
+
+    Example usage::
+
+        strip_tags(some_element,
+            'simpletagname',             # non-namespaced tag
+            '{http://some/ns}tagname',   # namespaced tag
+            '{http://some/other/ns}*',   # any tag from a namespace
+            Comment                      # comments (including their text!)
+            )
+    """
+    cdef _MultiTagMatcher matcher
+    cdef _Element element
+    cdef _Document doc
+
+    # resolve document and root node up front, so that both calls run
+    # even when no tag names were passed
+    doc = _documentOrRaise(tree_or_element)
+    element = _rootNodeOrRaise(tree_or_element)
+    if not tag_names:
+        return
+
+    matcher = _MultiTagMatcher(tag_names)
+    matcher.cacheTags(doc)
+    if matcher.rejectsAll():
+        return
+
+    if isinstance(tree_or_element, _ElementTree):
+        # include PIs and comments next to the root node
+        if matcher.matchesType(tree.XML_COMMENT_NODE):
+            _removeSiblings(element._c_node, tree.XML_COMMENT_NODE, 0)
+        if matcher.matchesType(tree.XML_PI_NODE):
+            _removeSiblings(element._c_node, tree.XML_PI_NODE, 0)
+    # the root element itself is kept, only nodes below it are treated
+    # (_strip_tags() inspects the children of each element)
+    _strip_tags(doc, element._c_node, matcher)
+
+cdef _strip_tags(_Document doc, xmlNode* c_node, _MultiTagMatcher matcher):
+    cdef xmlNode* c_child
+    cdef xmlNode* c_next
+    cdef Py_ssize_t i  # NOTE(review): 'i' is not used anywhere in this function
+
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)  # opens the traversal that END_FOR_EACH_ELEMENT_FROM closes below
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        # we run through the children here to prevent any problems
+        # with the tree iteration which would occur if we unlinked the
+        # c_node itself
+        c_child = _findChildForwards(c_node, 0)
+        while c_child is not NULL:
+            if not matcher.matches(c_child):
+                c_child = _nextElement(c_child)
+                continue
+            if c_child.type == tree.XML_ELEMENT_NODE:
+                c_next = _findChildForwards(c_child, 0) or _nextElement(c_child)  # continue with a child of the stripped element if it has one, else with its successor
+                _replaceNodeByChildren(doc, c_child)
+                if not attemptDeallocation(c_child):
+                    if c_child.nsDef is not NULL:
+                        # make namespaces absolute
+                        moveNodeToDocument(doc, doc._c_doc, c_child)
+                c_child = c_next
+            else:
+                c_next = _nextElement(c_child)  # fetch the successor before the node is unlinked
+                tree.xmlUnlinkNode(c_child)
+                attemptDeallocation(c_child)
+                c_child = c_next
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
diff --git a/lib/lxml/cssselect.py b/lib/lxml/cssselect.py
new file mode 100644
index 00000000..e8effaa2
--- /dev/null
+++ b/lib/lxml/cssselect.py
@@ -0,0 +1,103 @@
+"""CSS Selectors based on XPath.
+
+This module supports selecting XML/HTML tags based on CSS selectors.
+See the `CSSSelector` class for details.
+
+This is a thin wrapper around cssselect 0.7 or later.
+"""
+
+import sys
+from lxml import etree
+
+## Work-around the lack of absolute import in Python 2.4
+#from __future__ import absolute_import
+#from cssselect import ...
+try:
+    external_cssselect = __import__('cssselect')
+except ImportError:
+    raise ImportError('cssselect seems not to be installed. '
+                      'See http://packages.python.org/cssselect/')
+
+SelectorSyntaxError = external_cssselect.SelectorSyntaxError
+ExpressionError = external_cssselect.ExpressionError
+SelectorError = external_cssselect.SelectorError
+
+
+__all__ = ['SelectorSyntaxError', 'ExpressionError', 'SelectorError',
+           'CSSSelector']
+
+
+class LxmlTranslator(external_cssselect.GenericTranslator):
+    """
+    A custom CSS selector to XPath translator with lxml-specific extensions.
+    """
+    def xpath_contains_function(self, xpath, function):
+        # Defined there, removed in later drafts:
+        # http://www.w3.org/TR/2001/CR-css3-selectors-20011113/#content-selectors
+        if function.argument_types() not in (['STRING'], ['IDENT']):
+            raise ExpressionError(
+                "Expected a single string or ident for :contains(), got %r"
+                % function.arguments)
+        value = function.arguments[0].value
+        return xpath.add_condition(
+            'contains(__lxml_internal_css:lower-case(string(.)), %s)'
+            % self.xpath_literal(value.lower()))
+
+
+class LxmlHTMLTranslator(LxmlTranslator, external_cssselect.HTMLTranslator):
+    """
+    The lxml extensions of `LxmlTranslator` combined with cssselect's HTML translator.
+    """
+
+
+def _make_lower_case(context, s):
+    return s.lower()  # registered below as the XPath function 'lower-case'; 'context' is not used
+
+ns = etree.FunctionNamespace('http://codespeak.net/lxml/css/')
+ns.prefix = '__lxml_internal_css'
+ns['lower-case'] = _make_lower_case
+
+
+class CSSSelector(etree.XPath):
+    """A CSS selector.
+
+    Usage::
+
+        >>> from lxml import etree, cssselect
+        >>> select = cssselect.CSSSelector("a tag > child")
+
+        >>> root = etree.XML("<a><b><c/><tag><child>TEXT</child></tag></b></a>")
+        >>> [ el.tag for el in select(root) ]
+        ['child']
+
+    To use CSS namespaces, you need to pass a prefix-to-namespace
+    mapping as ``namespaces`` keyword argument::
+
+        >>> rdfns = 'http://www.w3.org/1999/02/22-rdf-syntax-ns#'
+        >>> select_ns = cssselect.CSSSelector('root > rdf|Description',
+        ...                                   namespaces={'rdf': rdfns})
+
+        >>> rdf = etree.XML((
+        ...     '<root xmlns:rdf="%s">'
+        ...       '<rdf:Description>blah</rdf:Description>'
+        ...     '</root>') % rdfns)
+        >>> [(el.tag, el.text) for el in select_ns(rdf)]
+        [('{http://www.w3.org/1999/02/22-rdf-syntax-ns#}Description', 'blah')]
+
+    """
+    def __init__(self, css, namespaces=None, translator='xml'):
+        if translator == 'xml':
+            translator = LxmlTranslator()
+        elif translator == 'html':
+            translator = LxmlHTMLTranslator()
+        elif translator == 'xhtml':
+            translator = LxmlHTMLTranslator(xhtml=True)
+        path = translator.css_to_xpath(css)
+        etree.XPath.__init__(self, path, namespaces=namespaces)
+        self.css = css
+
+    def __repr__(self):
+        return '<%s %s for %r>' % (
+            self.__class__.__name__,
+            hex(abs(id(self)))[2:],
+            self.css)
diff --git a/lib/lxml/cvarargs.pxd b/lib/lxml/cvarargs.pxd
new file mode 100644
index 00000000..824c1f0c
--- /dev/null
+++ b/lib/lxml/cvarargs.pxd
@@ -0,0 +1,8 @@
+cdef extern from "stdarg.h":
+    ctypedef void *va_list  # declaration for Cython only; the C type itself comes from stdarg.h
+    void va_start(va_list ap, void *last) nogil
+    void va_end(va_list ap) nogil
+
+cdef extern from "etree_defs.h":
+    cdef int va_int(va_list ap) nogil  # presumably fetches the next int argument from 'ap' - TODO confirm in etree_defs.h
+    cdef char *va_charptr(va_list ap) nogil  # presumably fetches the next char* argument from 'ap' - TODO confirm
diff --git a/lib/lxml/debug.pxi b/lib/lxml/debug.pxi
new file mode 100644
index 00000000..47b8497b
--- /dev/null
+++ b/lib/lxml/debug.pxi
@@ -0,0 +1,91 @@
+
+@cython.final
+@cython.internal
+cdef class _MemDebug:
+    """Debugging support for the memory allocation in libxml2.
+    """
+    def bytes_used(self):
+        """bytes_used(self)
+
+        Returns the total amount of memory (in bytes) currently used by libxml2.
+        Note that libxml2 constrains this value to a C int, which limits
+        the accuracy on 64 bit systems.
+        """
+        return tree.xmlMemUsed()
+
+    def blocks_used(self):
+        """blocks_used(self)
+
+        Returns the total number of memory blocks currently allocated by libxml2.
+        Note that libxml2 constrains this value to a C int, which limits
+        the accuracy on 64 bit systems.
+        """
+        return tree.xmlMemBlocks()
+
+    def dict_size(self):
+        """dict_size(self)
+
+        Returns the current size of the global name dictionary used by libxml2
+        for the current thread.  Each thread has its own dictionary.
+        """
+        c_dict = __GLOBAL_PARSER_CONTEXT._getThreadDict(NULL)
+        if c_dict is NULL:
+            raise MemoryError()
+        return tree.xmlDictSize(c_dict)
+
+    def dump(self, output_file=None, byte_count=None):
+        """dump(self, output_file=None, byte_count=None)
+
+        Dumps the current memory blocks allocated by libxml2 to a file.
+
+        The optional parameter 'output_file' specifies the file path.  It defaults
+        to the file ".memorylist" in the current directory.
+
+        The optional parameter 'byte_count' limits the number of bytes in the dump.
+        Note that this parameter is ignored when lxml is compiled against a libxml2
+        version before 2.7.0.
+        """
+        cdef Py_ssize_t c_count
+        if output_file is None:
+            output_file = b'.memorylist'
+        elif isinstance(output_file, unicode):
+            output_file = output_file.encode(sys.getfilesystemencoding())  # keep the encoded path: fopen() and the error message below work on bytes
+
+        f = stdio.fopen(output_file, "w")
+        if f is NULL:
+            raise IOError("Failed to create file %s" % output_file.decode(sys.getfilesystemencoding()))
+        try:
+            if byte_count is None:
+                tree.xmlMemDisplay(f)
+            else:
+                c_count = byte_count
+                tree.xmlMemDisplayLast(f, c_count)
+        finally:
+            stdio.fclose(f)
+
+    def show(self, output_file=None, block_count=None):
+        """show(self, output_file=None, block_count=None)
+
+        Dumps the current memory blocks allocated by libxml2 to a file.
+        The output file format is suitable for line diffing.
+
+        The optional parameter 'output_file' specifies the file path.  It defaults
+        to the file ".memorydump" in the current directory.
+
+        The optional parameter 'block_count' limits the number of blocks
+        in the dump.
+        """
+        if output_file is None:
+            output_file = b'.memorydump'
+        elif isinstance(output_file, unicode):
+            output_file = output_file.encode(sys.getfilesystemencoding())  # keep the encoded path: fopen() and the error message below work on bytes
+
+        f = stdio.fopen(output_file, "w")
+        if f is NULL:
+            raise IOError("Failed to create file %s" % output_file.decode(sys.getfilesystemencoding()))
+        try:
+            tree.xmlMemShow(f, block_count if block_count is not None else tree.xmlMemBlocks())
+        finally:
+            stdio.fclose(f)
+
+memory_debugger = _MemDebug()
diff --git a/lib/lxml/docloader.pxi b/lib/lxml/docloader.pxi
new file mode 100644
index 00000000..dd515b7f
--- /dev/null
+++ b/lib/lxml/docloader.pxi
@@ -0,0 +1,175 @@
+# Custom resolver API
+
+ctypedef enum _InputDocumentDataType:
+    PARSER_DATA_INVALID   # initial value assigned in _InputDocument.__cinit__
+    PARSER_DATA_EMPTY     # assigned by Resolver.resolve_empty()
+    PARSER_DATA_STRING    # assigned by Resolver.resolve_string()
+    PARSER_DATA_FILENAME  # assigned by Resolver.resolve_filename()
+    PARSER_DATA_FILE      # assigned by Resolver.resolve_file()
+
+@cython.final
+@cython.internal
+cdef class _InputDocument:  # result object built by the Resolver.resolve_*() methods
+    cdef _InputDocumentDataType _type  # tells which resolve_*() method filled this object
+    cdef bytes _data_bytes  # document content, set by resolve_string()
+    cdef object _filename   # from _encodeFilename() / _getFilenameForFile(); may stay unset
+    cdef object _file       # file-like object, set by resolve_file()
+    cdef bint _close_file   # the 'close' flag given to resolve_file()
+
+    def __cinit__(self):
+        self._type = PARSER_DATA_INVALID  # stays invalid until a resolve_*() method overwrites it
+
+
+cdef class Resolver:
+    u"This is the base class of all resolvers."
+    def resolve(self, system_url, public_id, context):
+        u"""resolve(self, system_url, public_id, context)
+
+        Override this method to resolve an external source by
+        ``system_url`` and ``public_id``.  The third argument is an
+        opaque context object.  Return the result of one of the
+        ``resolve_*()`` methods.  This base implementation always
+        returns None.
+        """
+        return None
+
+    def resolve_empty(self, context):
+        u"""resolve_empty(self, context)
+
+        Return an empty input document.
+
+        Pass context as parameter.
+        """
+        cdef _InputDocument doc_ref
+        doc_ref = _InputDocument()
+        doc_ref._type = PARSER_DATA_EMPTY
+        return doc_ref
+
+    def resolve_string(self, string, context, *, base_url=None):
+        u"""resolve_string(self, string, context, base_url=None)
+
+        Return a parsable string as input document.
+
+        Pass data string and context as parameters.  Unicode strings are
+        encoded as UTF-8; other non-bytes objects raise TypeError.  The source
+        URL or filename can be passed as the ``base_url`` keyword argument.
+        """
+        cdef _InputDocument doc_ref
+        if isinstance(string, unicode):
+            string = (<unicode>string).encode('utf8')
+        elif not isinstance(string, bytes):
+            raise TypeError, "argument must be a byte string or unicode string"
+        doc_ref = _InputDocument()
+        doc_ref._type = PARSER_DATA_STRING
+        doc_ref._data_bytes = string
+        if base_url is not None:
+            doc_ref._filename = _encodeFilename(base_url)
+        return doc_ref
+
+    def resolve_filename(self, filename, context):
+        u"""resolve_filename(self, filename, context)
+
+        Return the name of a parsable file as input document.
+
+        Pass filename and context as parameters.  You can also pass a
+        URL with an HTTP, FTP or file target.
+        """
+        cdef _InputDocument doc_ref
+        doc_ref = _InputDocument()
+        doc_ref._type = PARSER_DATA_FILENAME
+        doc_ref._filename = _encodeFilename(filename)
+        return doc_ref
+
+    def resolve_file(self, f, context, *, base_url=None, bint close=True):
+        u"""resolve_file(self, f, context, base_url=None, close=True)
+
+        Return an open file-like object as input document.
+
+        Pass open file and context as parameters.  You can pass the
+        base URL or filename of the file through the ``base_url``
+        keyword argument.  If the ``close`` flag is True (the
+        default), the file will be closed after reading.  Objects
+        without a ``read`` attribute are rejected with a TypeError.
+        Note that using ``.resolve_filename()`` is more efficient,
+        especially in threaded environments.
+        """
+        cdef _InputDocument doc_ref
+        try:
+            f.read  # attribute lookup only (duck-typing check); nothing is read here
+        except AttributeError:
+            raise TypeError, u"Argument is not a file-like object"
+        doc_ref = _InputDocument()
+        doc_ref._type = PARSER_DATA_FILE
+        if base_url is not None:
+            doc_ref._filename = _encodeFilename(base_url)
+        else:
+            doc_ref._filename = _getFilenameForFile(f)  # no base_url given: derive a name from the file object
+        doc_ref._close_file = close
+        doc_ref._file = f
+        return doc_ref
+
+@cython.final
+@cython.internal
+cdef class _ResolverRegistry:  # set of Resolver objects plus an optional fallback resolver
+    cdef object _resolvers
+    cdef Resolver _default_resolver  # consulted by resolve() only after all registered resolvers returned None
+    def __cinit__(self, Resolver default_resolver=None):
+        self._resolvers = set()  # a set: duplicates collapse and iteration order is unspecified
+        self._default_resolver = default_resolver
+
+    def add(self, Resolver resolver not None):
+        u"""add(self, resolver)
+
+        Register a resolver.
+
+        For each requested entity, the 'resolve' method of the resolver will
+        be called and the result will be passed to the parser.  If this method
+        returns None, the request will be delegated to other resolvers or the
+        default resolver.  The resolvers will be tested in an arbitrary order
+        until the first match is found.
+        """
+        self._resolvers.add(resolver)
+
+    def remove(self, resolver):
+        u"remove(self, resolver)"
+        self._resolvers.discard(resolver)  # discard(): removing an unregistered resolver is not an error
+
+    cdef _ResolverRegistry _copy(self):  # new registry with the same default resolver and a copy of the set
+        cdef _ResolverRegistry registry
+        registry = _ResolverRegistry(self._default_resolver)
+        registry._resolvers = self._resolvers.copy()  # shallow: the Resolver objects themselves are shared
+        return registry
+
+    def copy(self):
+        u"copy(self)"
+        return self._copy()
+
+    def resolve(self, system_url, public_id, context):
+        u"resolve(self, system_url, public_id, context)"
+        for resolver in self._resolvers:
+            result = resolver.resolve(system_url, public_id, context)
+            if result is not None:
+                return result  # first non-None answer wins
+        if self._default_resolver is None:
+            return None  # nobody resolved the request and there is no fallback
+        return self._default_resolver.resolve(system_url, public_id, context)
+
+    def __repr__(self):
+        return repr(self._resolvers)  # shows the registered resolvers only, not the default one
+
+@cython.internal
+cdef class _ResolverContext(_ExceptionContext):  # exception context that also carries resolvers and a temp store
+    cdef _ResolverRegistry _resolvers  # assigned by _initResolverContext()
+    cdef _TempStore _storage  # assigned by _initResolverContext(); emptied by clear()
+
+    cdef void clear(self):
+        _ExceptionContext.clear(self)  # explicit base-class call first, then the local storage
+        self._storage.clear()
+
+cdef _initResolverContext(_ResolverContext context,  # fills in the two fields declared on _ResolverContext
+                          _ResolverRegistry resolvers):
+    if resolvers is None:
+        context._resolvers = _ResolverRegistry()  # fresh, empty registry without a default resolver
+    else:
+        context._resolvers = resolvers  # used as-is (not copied), so it is shared with the caller
+    context._storage = _TempStore()
diff --git a/lib/lxml/doctestcompare.py b/lib/lxml/doctestcompare.py
new file mode 100644
index 00000000..3cd5ce48
--- /dev/null
+++ b/lib/lxml/doctestcompare.py
@@ -0,0 +1,505 @@
+"""
+lxml-based doctest output comparison.
+
+Note: normally, you should just import the `lxml.usedoctest` and
+`lxml.html.usedoctest` modules from within a doctest, instead of this
+one::
+
+    >>> import lxml.usedoctest # for XML output
+
+    >>> import lxml.html.usedoctest # for HTML output
+
+To use this module directly, you must call ``lxml.doctestcompare.install()``,
+which will cause doctest to use this in all subsequent calls.
+
+This changes the way output is checked and comparisons are made for
+XML or HTML-like content.
+
+XML or HTML content is noticed because the example starts with ``<``
+(it's HTML if it starts with ``<html``).  You can also use the
+``PARSE_HTML`` and ``PARSE_XML`` flags to force parsing.
+
+Some rough wildcard-like things are allowed.  Whitespace is generally
+ignored (except in attributes).  In text (attributes and text in the
+body) you can use ``...`` as a wildcard.  In an example it also
+matches any trailing tags in the element, though it does not match
+leading tags.  You may create a tag ``<any>`` or include an ``any``
+attribute in the tag.  An ``any`` tag matches any tag, while the
+attribute matches any and all attributes.
+
+When a match fails, the reformatted example and the actual output are
+displayed (indented), and a rough diff-like output is given.  Anything
+marked with ``-`` is in the output but wasn't supposed to be, and
+similarly ``+`` means it's in the example but wasn't in the output.
+
+You can disable parsing on one line with ``# doctest:+NOPARSE_MARKUP``
+"""
+
+from lxml import etree
+import sys
+import re
+import doctest
+import cgi
+
+__all__ = ['PARSE_HTML', 'PARSE_XML', 'NOPARSE_MARKUP', 'LXMLOutputChecker',
+           'LHTMLOutputChecker', 'install', 'temp_install']
+
+try:
+    _basestring = basestring
+except NameError:
+    _basestring = (str, bytes)
+
+_IS_PYTHON_3 = sys.version_info[0] >= 3
+
+PARSE_HTML = doctest.register_optionflag('PARSE_HTML')
+PARSE_XML = doctest.register_optionflag('PARSE_XML')
+NOPARSE_MARKUP = doctest.register_optionflag('NOPARSE_MARKUP')
+
+OutputChecker = doctest.OutputChecker
+
+def strip(v):
+    """Return ``v.strip()``; ``None`` is passed through unchanged."""
+    if v is not None:
+        return v.strip()
+    return None
+
+def norm_whitespace(v):  # replace each run of 2+ spaces/tabs/newlines by one space (single chars are kept)
+    return _norm_whitespace_re.sub(' ', v)
+
+_html_parser = etree.HTMLParser(recover=False, remove_blank_text=True)
+
+def html_fromstring(html):  # parse with the shared module-level _html_parser (recover=False, blank text removed)
+    return etree.fromstring(html, _html_parser)
+
+# We use this to distinguish repr()s from elements:
+_repr_re = re.compile(r'^<[^>]+ (at|object) ')
+_norm_whitespace_re = re.compile(r'[ \t\n][ \t\n]+')
+
+class LXMLOutputChecker(OutputChecker):
+
+    empty_tags = (
+        'param', 'img', 'area', 'br', 'basefont', 'input',
+        'base', 'meta', 'link', 'col')
+
+    def get_default_parser(self):
+        return etree.XML
+
+    def check_output(self, want, got, optionflags):  # NOTE: _RestoreChecker.install_clone() copies this code object onto another function
+        alt_self = getattr(self, '_temp_override_self', None)  # attribute set by _RestoreChecker on the checker it patched
+        if alt_self is not None:
+            super_method = self._temp_call_super_check_output  # _RestoreChecker.call_super: runs the saved original code
+            self = alt_self  # from here on behave as the temporarily installed checker
+        else:
+            super_method = OutputChecker.check_output
+        parser = self.get_parser(want, got, optionflags)
+        if not parser:
+            return super_method(  # no markup parser applies: plain doctest comparison
+                self, want, got, optionflags)
+        try:
+            want_doc = parser(want)
+        except etree.XMLSyntaxError:
+            return False  # an example that does not parse never matches
+        try:
+            got_doc = parser(got)
+        except etree.XMLSyntaxError:
+            return False  # output that does not parse never matches
+        return self.compare_docs(want_doc, got_doc)
+
+    def get_parser(self, want, got, optionflags):
+        """Return the parser callable for comparing want/got, or None for plain text."""
+        if NOPARSE_MARKUP & optionflags:
+            return None
+        if PARSE_HTML & optionflags:
+            return html_fromstring
+        if PARSE_XML & optionflags:
+            return etree.XML
+        # Sniff '<html' case-insensitively on BOTH sides, so '<HTML>' output counts as HTML too.
+        if (want.strip().lower().startswith('<html')
+                and got.strip().lower().startswith('<html')):
+            return html_fromstring
+        if self._looks_like_markup(want) and self._looks_like_markup(got):
+            return self.get_default_parser()
+        return None
+
+    def _looks_like_markup(self, s):
+        """True if stripped ``s`` starts with '<' and does not match ``_repr_re``."""
+        text = s.strip()
+        return text.startswith('<') and not _repr_re.search(text)
+
+    def compare_docs(self, want, got):
+        """Recursively compare element ``got`` against the example element ``want``."""
+        if not self.tag_compare(want.tag, got.tag):
+            return False
+        if not self.text_compare(want.text, got.text, True):
+            return False
+        if not self.text_compare(want.tail, got.tail, True):
+            return False
+        if 'any' not in want.attrib:
+            expected_keys = sorted(want.attrib.keys())
+            if expected_keys != sorted(got.attrib.keys()):
+                return False
+            for key in expected_keys:
+                if not self.text_compare(want.attrib[key], got.attrib[key], False):
+                    return False
+        if want.text == '...' and not len(want):
+            return True  # a bare '...' body: the children of got are not looked at
+        expected, actual = list(want), list(got)
+        while expected or actual:
+            if not (expected and actual):
+                return False
+            head = expected.pop(0)
+            if not self.compare_docs(head, actual.pop(0)):
+                return False
+            # got is exhausted and this example child ends in '...': stop comparing here
+            if not actual and head.tail == '...':
+                break
+        return True
+
+    def text_compare(self, want, got, strip):
+        """Match ``got`` against ``want``, treating '...' in ``want`` as a wildcard.
+
+        ``None`` counts as ''.  With ``strip`` set, both sides are first
+        passed through norm_whitespace() and stripped at the ends.
+        """
+        want, got = want or '', got or ''
+        if strip:
+            want = norm_whitespace(want).strip()
+            got = norm_whitespace(got).strip()
+        pattern = ('^%s$' % re.escape(want)).replace(r'\.\.\.', '.*')
+        return bool(re.search(pattern, got))
+
+    def tag_compare(self, want, got):
+        """Compare tag names; 'any' and a '{...}' namespace act as wildcards."""
+        if want == 'any':
+            return True
+        if not (isinstance(want, _basestring) and isinstance(got, _basestring)):
+            # non-string tags (presumably comment/PI factories): plain equality
+            return want == got
+        want = want or ''
+        got = got or ''
+        if not want.startswith('{...}'):
+            return want == got
+        # Ellipsis on the namespace: only the part after the last '}' has to agree
+        return want.split('}')[-1] == got.split('}')[-1]
+
+    def output_difference(self, example, got, optionflags):
+        """Describe how ``got`` differs from ``example.want``.
+
+        Falls back to the stock doctest report (preceded by the parse
+        errors, if any) when no parser applies or a side fails to parse.
+        """
+        want = example.want
+        parser = self.get_parser(want, got, optionflags)
+        errors = []
+        if parser is not None:
+            try:
+                want_doc = parser(want)
+            except etree.XMLSyntaxError:
+                errors.append('In example: %s' % sys.exc_info()[1])
+            try:
+                got_doc = parser(got)
+            except etree.XMLSyntaxError:
+                errors.append('In actual output: %s' % sys.exc_info()[1])
+        if parser is None or errors:
+            value = OutputChecker.output_difference(
+                self, example, got, optionflags)
+            return '\n'.join(errors + [value]) if errors else value
+        # Both sides parsed: show them re-formatted, followed by the merged diff
+        html = parser is html_fromstring
+        return '\n'.join([
+            'Expected:',
+            self.format_doc(want_doc, html, 2),
+            'Got:',
+            self.format_doc(got_doc, html, 2),
+            'Diff:',
+            self.collect_diff(want_doc, got_doc, html, 2),
+        ])
+
+    def html_empty_tag(self, el, html=True):
+        """True if ``el`` is to be rendered without an end tag.
+
+        That takes HTML mode, a tag listed in ``empty_tags`` and an
+        element that has neither text nor children.
+        """
+        if not html or el.tag not in self.empty_tags:
+            return False
+        return not (el.text or len(el))
+
+    def format_doc(self, doc, html, indent, prefix=''):
+        """Pretty-print ``doc`` as indented markup text.
+
+        Leaf elements are written on a single line; elements with children
+        get start tag, text, children, end tag and tail on separate lines.
+
+        ``prefix`` (the diff output passes '-' or '+') is put in front of the
+        start tag of ``doc`` itself only; children are rendered two columns
+        deeper and without it.  Whitespace-only text and tails are dropped.
+        """
+        pad = ' ' * indent
+        is_leaf = not len(doc)
+        parts = [pad, prefix, self.format_tag(doc)]
+        if is_leaf:
+            # No children...
+            if not self.html_empty_tag(doc, html):
+                if strip(doc.text):
+                    parts.append(self.format_text(doc.text))
+                parts.append(self.format_end_tag(doc))
+            if strip(doc.tail):
+                parts.append(self.format_text(doc.tail))
+            parts.append('\n')
+            return ''.join(parts)
+        # With children: every piece goes on a line of its own
+        if not self.html_empty_tag(doc, html):
+            parts.append('\n')
+            if strip(doc.text):
+                parts += [pad, self.format_text(doc.text), '\n']
+            for child in doc:
+                parts.append(self.format_doc(child, html, indent+2))
+            parts += [pad, self.format_end_tag(doc), '\n']
+        if strip(doc.tail):
+            parts += [pad, self.format_text(doc.tail), '\n']
+        return ''.join(parts)
+
+    def format_text(self, text, strip=True):
+        """Escape &, <, > and " in ``text`` (None gives ''), stripping it first if asked."""
+        if text is None:
+            return ''
+        text = text.strip() if strip else text  # escaping below == cgi.escape(text, 1), removed in Python 3.8
+        return text.replace('&', '&amp;').replace('<', '&lt;').replace('>', '&gt;').replace('"', '&quot;')
+
+    def format_tag(self, el):
+        """Render the start tag of ``el`` with its attributes sorted."""
+        if isinstance(el, etree.CommentBase):
+            # FIXME: probably PIs should be handled specially too?
+            return '<!--'
+        attrs = ['%s="%s"' % (name, self.format_text(value, False))
+                 for name, value in sorted(el.attrib.items())]
+        if attrs:
+            return '<%s %s>' % (el.tag, ' '.join(attrs))
+        return '<%s>' % el.tag
+    
+    def format_end_tag(self, el):
+        """Render the end tag of ``el`` ('-->' closes a comment)."""
+        if not isinstance(el, etree.CommentBase):
+            return '</%s>' % el.tag
+        return '-->'  # FIXME: probably PIs should be handled specially too?
+
+    def collect_diff(self, want, got, html, indent):
+        """Render ``want`` and ``got`` merged into one annotated tree.
+
+        Mismatching tags/text show up as 'want (got: got)'.  Children are
+        paired by position; surplus children of ``got`` are prefixed '-',
+        surplus children of ``want`` are prefixed '+'.
+        """
+        pad = ' ' * indent
+        is_leaf = not len(want) and not len(got)
+        parts = [pad, self.collect_diff_tag(want, got)]
+        if is_leaf:
+            if not self.html_empty_tag(got, html):
+                parts.append(self.collect_diff_text(want.text, got.text))
+                parts.append(self.collect_diff_end_tag(want, got))
+            parts.append(self.collect_diff_text(want.tail, got.tail))
+            parts.append('\n')
+            return ''.join(parts)
+        parts.append('\n')
+        if strip(want.text) or strip(got.text):
+            parts += [pad, self.collect_diff_text(want.text, got.text), '\n']
+        # Walk both child lists in step until both are used up
+        want_children = list(want)
+        got_children = list(got)
+        while want_children or got_children:
+            if not want_children:
+                # only present in the actual output
+                parts.append(self.format_doc(got_children.pop(0), html, indent+2, '-'))
+            elif not got_children:
+                # only present in the example
+                parts.append(self.format_doc(want_children.pop(0), html, indent+2, '+'))
+            else:
+                parts.append(self.collect_diff(
+                    want_children.pop(0), got_children.pop(0), html, indent+2))
+        parts += [pad, self.collect_diff_end_tag(want, got), '\n']
+        if strip(want.tail) or strip(got.tail):
+            parts += [pad, self.collect_diff_text(want.tail, got.tail), '\n']
+        return ''.join(parts)
+
+    def collect_diff_tag(self, want, got):
+        """Render the start tag for the diff output.
+
+        Attributes found only in ``got`` get a '-' and attributes found
+        only in ``want`` a '+', unless ``want`` is an 'any' tag or carries
+        an 'any' attribute; then extra attributes are shown unmarked.
+        """
+        matches = self.tag_compare(want.tag, got.tag)
+        label = got.tag if matches else '%s (got: %s)' % (want.tag, got.tag)
+        wildcard = want.tag == 'any' or 'any' in want.attrib
+        attrs = []
+        for name, value in sorted(got.attrib.items()):
+            if name in want.attrib:
+                text = self.collect_diff_text(want.attrib[name], value, False)
+                attrs.append('%s="%s"' % (name, text))
+            elif wildcard:
+                attrs.append('%s="%s"' % (name, self.format_text(value, False)))
+            else:
+                attrs.append('-%s="%s"' % (name, self.format_text(value, False)))
+        if not wildcard:
+            for name, value in sorted(want.attrib.items()):
+                if name not in got.attrib:
+                    attrs.append('+%s="%s"' % (name, self.format_text(value, False)))
+        if attrs:
+            return '<%s %s>' % (label, ' '.join(attrs))
+        return '<%s>' % label
+
+    def collect_diff_end_tag(self, want, got):
+        """Render the end tag for the diff output, flagging a tag mismatch as 'want (got: got)'."""
+        # Decide via tag_compare(), as collect_diff_tag() does, so wildcard tags are not flagged here.
+        if self.tag_compare(want.tag, got.tag):
+            return '</%s>' % got.tag
+        return '</%s (got: %s)>' % (want.tag, got.tag)
+
+    def collect_diff_text(self, want, got, strip=True):
+        """Format ``got`` when it matches ``want``, else 'want (got: got)'."""
+        if not self.text_compare(want, got, strip):
+            return self.format_text('%s (got: %s)' % (want, got), strip)
+        if not got:
+            return ''
+        return self.format_text(got, strip)
+
+class LHTMLOutputChecker(LXMLOutputChecker):  # same checker, but markup without explicit flags is parsed as HTML
+    def get_default_parser(self):
+        return html_fromstring
+    
+def install(html=False):
+    """
+    Install doctestcompare for all future doctests.
+
+    This rebinds ``doctest.OutputChecker``: a true ``html`` selects
+    ``LHTMLOutputChecker`` (HTML parser by default), anything else
+    ``LXMLOutputChecker`` (XML parser by default).
+    """
+    # The previous value of doctest.OutputChecker is not saved here.
+    checker_class = LHTMLOutputChecker if html else LXMLOutputChecker
+    doctest.OutputChecker = checker_class
+
+def temp_install(html=False, del_module=None):
+    """
+    Use this *inside* a doctest to enable this checker for this
+    doctest only.  If html is true, then by default the HTML parser
+    will be used; otherwise the XML parser is used.  A module named by
+    del_module is removed from sys.modules when the checker is restored.
+    Raises LookupError when not called from within a running doctest.
+    """
+    if html:
+        Checker = LHTMLOutputChecker
+    else:
+        Checker = LXMLOutputChecker
+    frame = _find_doctest_frame()
+    dt_self = frame.f_locals['self']
+    checker = Checker()
+    old_checker = dt_self._checker
+    dt_self._checker = checker
+    # The unfortunate thing is that there is a local variable 'check'
+    # in the function that runs the doctests, that is a bound method
+    # into the output checker.  We have to update that.  We can't
+    # modify the frame, so we have to modify the object in place.  The
+    # only way to do this is to actually change the func_code
+    # attribute of the method.  We change it, and then wait for
+    # __record_outcome to be run, which signals the end of the __run
+    # method, at which point we restore the previous check_output
+    # implementation.
+    if _IS_PYTHON_3:
+        check_func = frame.f_locals['check'].__func__
+        checker_check_func = checker.check_output.__func__
+    else:
+        check_func = frame.f_locals['check'].im_func
+        checker_check_func = checker.check_output.im_func
+    # Because we can't patch up func_globals, this is the only global
+    # in check_output that we care about:
+    doctest.etree = etree
+    _RestoreChecker(dt_self, old_checker, checker,
+                    check_func, checker_check_func,
+                    del_module)
+
+class _RestoreChecker(object):  # installs the temporary patches in __init__ and undoes them in __call__
+    def __init__(self, dt_self, old_checker, new_checker, check_func, clone_func,
+                 del_module):
+        self.dt_self = dt_self  # the object temp_install() found as 'self' in the doctest frame
+        self.checker = old_checker
+        self.checker._temp_call_super_check_output = self.call_super  # read back by check_output()
+        self.checker._temp_override_self = new_checker  # read back by check_output()
+        self.check_func = check_func  # function whose code object gets swapped out
+        self.clone_func = clone_func  # function that donates the replacement code object
+        self.del_module = del_module  # optional sys.modules key to drop in uninstall_module()
+        self.install_clone()
+        self.install_dt_self()
+    def install_clone(self):  # remember check_func's code, then run clone_func's code in its place
+        if _IS_PYTHON_3:
+            self.func_code = self.check_func.__code__
+            self.func_globals = self.check_func.__globals__  # saved, but not read anywhere in this class
+            self.check_func.__code__ = self.clone_func.__code__
+        else:
+            self.func_code = self.check_func.func_code
+            self.func_globals = self.check_func.func_globals  # saved, but not read anywhere in this class
+            self.check_func.func_code = self.clone_func.func_code
+    def uninstall_clone(self):  # put the remembered code object back
+        if _IS_PYTHON_3:
+            self.check_func.__code__ = self.func_code
+        else:
+            self.check_func.func_code = self.func_code
+    def install_dt_self(self):  # make this object stand in for the runner's name-mangled __record_outcome
+        self.prev_func = self.dt_self._DocTestRunner__record_outcome
+        self.dt_self._DocTestRunner__record_outcome = self
+    def uninstall_dt_self(self):
+        self.dt_self._DocTestRunner__record_outcome = self.prev_func
+    def uninstall_module(self):  # no-op unless del_module was given
+        if self.del_module:
+            import sys
+            del sys.modules[self.del_module]
+            if '.' in self.del_module:
+                package, module = self.del_module.rsplit('.', 1)
+                package_mod = sys.modules[package]
+                delattr(package_mod, module)  # also drop the attribute on the parent package
+    def __call__(self, *args, **kw):  # invoked in place of __record_outcome: undo every patch, then delegate
+        self.uninstall_clone()
+        self.uninstall_dt_self()
+        del self.checker._temp_override_self
+        del self.checker._temp_call_super_check_output
+        result = self.prev_func(*args, **kw)
+        self.uninstall_module()  # only after the outcome has been recorded
+        return result
+    def call_super(self, *args, **kw):  # run check_func with its original code temporarily restored
+        self.uninstall_clone()
+        try:
+            return self.check_func(*args, **kw)
+        finally:
+            self.install_clone()  # re-apply the clone even if the call raised
+            
+def _find_doctest_frame():
+    """Return the closest calling frame that has a local named 'BOOM'."""
+    import sys
+    frame = sys._getframe(1)
+    # A local called 'BOOM' is the sign of doctest
+    while frame is not None and 'BOOM' not in frame.f_locals:
+        frame = frame.f_back
+    if frame is None:
+        raise LookupError(
+            "Could not find doctest (only use this function *inside* a doctest)")
+    return frame
+    
+__test__ = {
+    'basic': '''
+    >>> temp_install()
+    >>> print """<xml a="1" b="2">stuff</xml>"""
+    <xml b="2" a="1">...</xml>
+    >>> print """<xml xmlns="http://example.com"><tag   attr="bar"   /></xml>"""
+    <xml xmlns="...">
+      <tag attr="..." />
+    </xml>
+    >>> print """<xml>blahblahblah<foo /></xml>""" # doctest: +NOPARSE_MARKUP, +ELLIPSIS
+    <xml>...foo /></xml>
+    '''}
+
+if __name__ == '__main__':
+    import doctest
+    doctest.testmod()
+    
+    
diff --git a/lib/lxml/dtd.pxi b/lib/lxml/dtd.pxi
new file mode 100644
index 00000000..d1913b42
--- /dev/null
+++ b/lib/lxml/dtd.pxi
@@ -0,0 +1,468 @@
+# support for DTD validation
+from lxml.includes cimport dtdvalid
+
+class DTDError(LxmlError):
+    u"""Base class for DTD errors.
+    """
+    pass
+
+class DTDParseError(DTDError):
+    u"""Error while parsing a DTD.
+    """
+    pass
+
+class DTDValidateError(DTDError):
+    u"""Error while validating an XML document with a DTD.
+    """
+    pass
+
+cdef inline int _assertValidDTDNode(node, void *c_node) except -1:  # NULL-pointer guard called first by the DTD proxy accessors
+    assert c_node is not NULL, u"invalid DTD proxy at %s" % id(node)
+
+
+@cython.final
+@cython.internal
+@cython.freelist(8)
+cdef class _DTDElementContentDecl:  # read-only proxy around one xmlElementContent node
+    cdef DTD _dtd  # handed on to the proxies created by 'left' and 'right'
+    cdef tree.xmlElementContent* _c_node  # checked against NULL before every access
+
+    def __repr__(self):
+        return "<%s.%s object name=%r type=%r occur=%r at 0x%x>" % (self.__class__.__module__, self.__class__.__name__, self.name, self.type, self.occur, id(self))
+
+    property name:  # unicode name, or None if the C name pointer is NULL
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           return funicode(self._c_node.name) if self._c_node.name is not NULL else None
+
+    property type:  # "pcdata", "element", "seq" or "or"; None for any other value
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           cdef int type = self._c_node.type
+           if type == tree.XML_ELEMENT_CONTENT_PCDATA:
+               return "pcdata"
+           elif type == tree.XML_ELEMENT_CONTENT_ELEMENT:
+               return "element"
+           elif type == tree.XML_ELEMENT_CONTENT_SEQ:
+               return "seq"
+           elif type == tree.XML_ELEMENT_CONTENT_OR:
+               return "or"
+           else:
+               return None
+
+    property occur:  # "once", "opt", "mult" or "plus"; None for any other value
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           cdef int occur = self._c_node.ocur  # NOTE(review): 'ocur' presumably is the C struct's own spelling - confirm in the tree declarations
+           if occur == tree.XML_ELEMENT_CONTENT_ONCE:
+               return "once"
+           elif occur == tree.XML_ELEMENT_CONTENT_OPT:
+               return "opt"
+           elif occur == tree.XML_ELEMENT_CONTENT_MULT:
+               return "mult"
+           elif occur == tree.XML_ELEMENT_CONTENT_PLUS:
+               return "plus"
+           else:
+               return None
+
+    property left:  # new proxy for the c1 child, or None if c1 is NULL
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           c1 = self._c_node.c1
+           if c1:
+               node = <_DTDElementContentDecl>_DTDElementContentDecl.__new__(_DTDElementContentDecl)
+               node._dtd = self._dtd
+               node._c_node = <tree.xmlElementContent*>c1
+               return node
+           else:
+               return None
+
+    property right:  # new proxy for the c2 child, or None if c2 is NULL
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           c2 = self._c_node.c2
+           if c2:
+               node = <_DTDElementContentDecl>_DTDElementContentDecl.__new__(_DTDElementContentDecl)
+               node._dtd = self._dtd
+               node._c_node = <tree.xmlElementContent*>c2
+               return node
+           else:
+               return None
+
+
+@cython.final
+@cython.internal
+@cython.freelist(8)
+cdef class _DTDAttributeDecl:  # read-only proxy around one xmlAttribute declaration node
+    cdef DTD _dtd  # assigned by _DTDElementDecl.iterattributes()
+    cdef tree.xmlAttribute* _c_node  # checked against NULL before every access
+
+    def __repr__(self):
+        return "<%s.%s object name=%r elemname=%r prefix=%r type=%r default=%r default_value=%r at 0x%x>" % (self.__class__.__module__, self.__class__.__name__, self.name, self.elemname, self.prefix, self.type, self.default, self.default_value, id(self))
+
+    property name:  # unicode name, or None if the C pointer is NULL
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           return funicode(self._c_node.name) if self._c_node.name is not NULL else None
+
+    property elemname:  # value of the C 'elem' field, or None if it is NULL
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           return funicode(self._c_node.elem) if self._c_node.elem is not NULL else None
+
+    property prefix:  # value of the C 'prefix' field, or None if it is NULL
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           return funicode(self._c_node.prefix) if self._c_node.prefix is not NULL else None
+
+    property type:  # lower-case name of the attribute type constant; None for an unknown value
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           cdef int type = self._c_node.atype
+           if type == tree.XML_ATTRIBUTE_CDATA:
+               return "cdata"
+           elif type == tree.XML_ATTRIBUTE_ID:
+               return "id"
+           elif type == tree.XML_ATTRIBUTE_IDREF:
+               return "idref"
+           elif type == tree.XML_ATTRIBUTE_IDREFS:
+               return "idrefs"
+           elif type == tree.XML_ATTRIBUTE_ENTITY:
+               return "entity"
+           elif type == tree.XML_ATTRIBUTE_ENTITIES:
+               return "entities"
+           elif type == tree.XML_ATTRIBUTE_NMTOKEN:
+               return "nmtoken"
+           elif type == tree.XML_ATTRIBUTE_NMTOKENS:
+               return "nmtokens"
+           elif type == tree.XML_ATTRIBUTE_ENUMERATION:
+               return "enumeration"
+           elif type == tree.XML_ATTRIBUTE_NOTATION:
+               return "notation"
+           else:
+               return None
+
+    property default:  # "none", "required", "implied" or "fixed"; None for any other value
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           cdef int default = self._c_node.def_  # NOTE(review): trailing underscore presumably avoids the 'def' keyword - confirm in the tree declarations
+           if default == tree.XML_ATTRIBUTE_NONE:
+               return "none"
+           elif default == tree.XML_ATTRIBUTE_REQUIRED:
+               return "required"
+           elif default == tree.XML_ATTRIBUTE_IMPLIED:
+               return "implied"
+           elif default == tree.XML_ATTRIBUTE_FIXED:
+               return "fixed"
+           else:
+               return None
+
+    property default_value:  # value of the C 'defaultValue' field, or None if it is NULL
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           return funicode(self._c_node.defaultValue) if self._c_node.defaultValue is not NULL else None
+
+    def itervalues(self):  # generator over the names in the linked list that starts at _c_node.tree
+        _assertValidDTDNode(self, self._c_node)
+        cdef tree.xmlEnumeration *c_node = self._c_node.tree
+        while c_node is not NULL:
+            yield funicode(c_node.name)
+            c_node = c_node.next
+
+    def values(self):  # the same names as itervalues(), collected into a list
+        return list(self.itervalues())
+
+
+@cython.final
+@cython.internal
+@cython.freelist(8)
+cdef class _DTDElementDecl:  # read-only proxy around one xmlElement declaration node
+    cdef DTD _dtd  # handed on to the content and attribute proxies created below
+    cdef tree.xmlElement* _c_node  # checked against NULL before every access
+
+    def __repr__(self):
+        return "<%s.%s object name=%r prefix=%r type=%r at 0x%x>" % (self.__class__.__module__, self.__class__.__name__, self.name, self.prefix, self.type, id(self))
+
+    property name:  # unicode name, or None if the C pointer is NULL
+        def __get__(self):
+            _assertValidDTDNode(self, self._c_node)
+            return funicode(self._c_node.name) if self._c_node.name is not NULL else None
+
+    property prefix:  # value of the C 'prefix' field, or None if it is NULL
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           return funicode(self._c_node.prefix) if self._c_node.prefix is not NULL else None
+
+    property type:  # "undefined", "empty", "any", "mixed" or "element"; None for any other value
+        def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           cdef int type = self._c_node.etype
+           if type == tree.XML_ELEMENT_TYPE_UNDEFINED:
+               return "undefined"
+           elif type == tree.XML_ELEMENT_TYPE_EMPTY:
+               return "empty"
+           elif type == tree.XML_ELEMENT_TYPE_ANY:
+               return "any"
+           elif type == tree.XML_ELEMENT_TYPE_MIXED:
+               return "mixed"
+           elif type == tree.XML_ELEMENT_TYPE_ELEMENT:
+               return "element"
+           else:
+               return None
+
+    property content:  # new _DTDElementContentDecl for the content pointer, or None if it is NULL
+       def __get__(self):
+           _assertValidDTDNode(self, self._c_node)
+           cdef tree.xmlElementContent *content = self._c_node.content
+           if content:
+               node = <_DTDElementContentDecl>_DTDElementContentDecl.__new__(_DTDElementContentDecl)
+               node._dtd = self._dtd
+               node._c_node = content
+               return node
+           else:
+               return None
+
+    def iterattributes(self):  # generator yielding one new _DTDAttributeDecl per node of the attribute list
+        _assertValidDTDNode(self, self._c_node)
+        cdef tree.xmlAttribute *c_node = self._c_node.attributes
+        while c_node:
+            node = <_DTDAttributeDecl>_DTDAttributeDecl.__new__(_DTDAttributeDecl)
+            node._dtd = self._dtd
+            node._c_node = c_node
+            yield node
+            c_node = c_node.nexth  # the list is chained through the 'nexth' field
+
+    def attributes(self):  # the same proxies as iterattributes(), collected into a list
+        return list(self.iterattributes())
+
+
+@cython.final
+@cython.internal
+@cython.freelist(8)
+cdef class _DTDEntityDecl:
+    # Python-level view on a libxml2 entity declaration (``xmlEntity``).
+    # ``_dtd`` references the DTD object this node was obtained from.
+    cdef DTD _dtd
+    cdef tree.xmlEntity* _c_node
+    def __repr__(self):
+        cls = self.__class__
+        return "<%s.%s object name=%r at 0x%x>" % (
+            cls.__module__, cls.__name__, self.name, id(self))
+
+    property name:
+        # Entity name, or None if the C node has no name.
+        def __get__(self):
+            _assertValidDTDNode(self, self._c_node)
+            if self._c_node.name is NULL:
+                return None
+            return funicode(self._c_node.name)
+
+    property orig:
+        # The C node's ``orig`` field decoded to text, or None if unset.
+        def __get__(self):
+            _assertValidDTDNode(self, self._c_node)
+            if self._c_node.orig is NULL:
+                return None
+            return funicode(self._c_node.orig)
+
+    property content:
+        # The C node's ``content`` field decoded to text, or None if unset.
+        def __get__(self):
+            _assertValidDTDNode(self, self._c_node)
+            if self._c_node.content is NULL:
+                return None
+            return funicode(self._c_node.content)
+
+
+################################################################################
+# DTD
+
+cdef class DTD(_Validator):
+    u"""DTD(self, file=None, external_id=None)
+    A DTD validator.
+
+    Can load from filesystem directly given a filename or file-like object.
+    Alternatively, pass the keyword parameter ``external_id`` to load from a
+    catalog.  The external ID may be a byte string or text; text is encoded
+    as UTF-8 before it is handed to libxml2.
+    """
+    # The libxml2 DTD wrapped by this object; released in __dealloc__().
+    cdef tree.xmlDtd* _c_dtd
+    def __init__(self, file=None, *, external_id=None):
+        # Raises DTDParseError if neither source is given, if ``file`` is
+        # neither a string nor has a ``read`` attribute, or if parsing
+        # yields no DTD.
+        _Validator.__init__(self)
+        if file is not None:
+            if _isString(file):
+                file = _encodeFilename(file)
+                with self._error_log:
+                    self._c_dtd = xmlparser.xmlParseDTD(NULL, _xcstr(file))
+            elif hasattr(file, 'read'):
+                self._c_dtd = _parseDtdFromFilelike(file)
+            else:
+                raise DTDParseError, u"file must be a filename or file-like object"
+        elif external_id is not None:
+            # The C pointer cast below only works on a byte string, so
+            # encode text IDs first; byte strings are passed through as-is.
+            if isinstance(external_id, unicode):
+                external_id = external_id.encode('utf8')
+            with self._error_log:
+                self._c_dtd = xmlparser.xmlParseDTD(<const_xmlChar*>external_id, NULL)
+        else:
+            raise DTDParseError, u"either filename or external ID required"
+
+        if self._c_dtd is NULL:
+            raise DTDParseError(
+                self._error_log._buildExceptionMessage(u"error parsing DTD"),
+                self._error_log)
+
+    property name:
+        # Name stored in the DTD, or None when no DTD is loaded.
+        def __get__(self):
+            if self._c_dtd is NULL:
+                return None
+            return funicodeOrNone(self._c_dtd.name)
+
+    property external_id:
+        # ``ExternalID`` field of the DTD, or None when no DTD is loaded.
+        def __get__(self):
+            if self._c_dtd is NULL:
+                return None
+            return funicodeOrNone(self._c_dtd.ExternalID)
+
+    property system_url:
+        # ``SystemID`` field of the DTD, or None when no DTD is loaded.
+        def __get__(self):
+            if self._c_dtd is NULL:
+                return None
+            return funicodeOrNone(self._c_dtd.SystemID)
+
+    def iterelements(self):
+        u"""Yield a ``_DTDElementDecl`` for every element declaration among
+        the direct children of the DTD.  Yields nothing if no DTD is loaded.
+        """
+        cdef tree.xmlNode *c_node = self._c_dtd.children if self._c_dtd is not NULL else NULL
+        while c_node is not NULL:
+            if c_node.type == tree.XML_ELEMENT_DECL:
+                node = _DTDElementDecl()
+                node._dtd = self
+                node._c_node = <tree.xmlElement*>c_node
+                yield node
+            c_node = c_node.next
+
+    def elements(self):
+        u"""Return everything produced by ``iterelements()`` as a list."""
+        return list(self.iterelements())
+
+    def iterentities(self):
+        u"""Yield a ``_DTDEntityDecl`` for every entity declaration among
+        the direct children of the DTD.  Yields nothing if no DTD is loaded.
+        """
+        cdef tree.xmlNode *c_node = self._c_dtd.children if self._c_dtd is not NULL else NULL
+        while c_node is not NULL:
+            if c_node.type == tree.XML_ENTITY_DECL:
+                node = _DTDEntityDecl()
+                node._dtd = self
+                node._c_node = <tree.xmlEntity*>c_node
+                yield node
+            c_node = c_node.next
+
+    def entities(self):
+        u"""Return everything produced by ``iterentities()`` as a list."""
+        return list(self.iterentities())
+
+    def __dealloc__(self):
+        # Release the libxml2 DTD held by this object.
+        tree.xmlFreeDtd(self._c_dtd)
+
+    def __call__(self, etree):
+        u"""__call__(self, etree)
+
+        Validate doc using the DTD.
+
+        Returns true if the document is valid, false if not.
+
+        Raises DTDError if no validation context could be created and
+        DTDValidateError if the validation run itself did not produce a
+        result.
+        """
+        cdef _Document doc
+        cdef _Element root_node
+        cdef xmlDoc* c_doc
+        cdef dtdvalid.xmlValidCtxt* valid_ctxt
+        # -1 marks "no result"; it is overwritten by xmlValidateDtd() below
+        cdef int ret = -1
+
+        assert self._c_dtd is not NULL, "DTD not initialised"
+        doc = _documentOrRaise(etree)
+        root_node = _rootNodeOrRaise(etree)
+
+        valid_ctxt = dtdvalid.xmlNewValidCtxt()
+        if valid_ctxt is NULL:
+            raise DTDError(u"Failed to create validation context")
+
+        # work around error reporting bug in libxml2 <= 2.9.1 (and later?)
+        # https://bugzilla.gnome.org/show_bug.cgi?id=724903
+        valid_ctxt.error = <dtdvalid.xmlValidityErrorFunc>_nullGenericErrorFunc
+        valid_ctxt.userData = NULL
+
+        try:
+            with self._error_log:
+                # validate against a temporary document built around the
+                # given root node, then dispose of that temporary document
+                c_doc = _fakeRootDoc(doc._c_doc, root_node._c_node)
+                ret = dtdvalid.xmlValidateDtd(valid_ctxt, c_doc, self._c_dtd)
+                _destroyFakeDoc(doc._c_doc, c_doc)
+        finally:
+            # the validation context is freed on success and on error alike
+            dtdvalid.xmlFreeValidCtxt(valid_ctxt)
+
+        if ret == -1:
+            raise DTDValidateError(u"Internal error in DTD validation",
+                                   self._error_log)
+        return ret == 1
+
+
+cdef tree.xmlDtd* _parseDtdFromFilelike(file) except NULL:
+    u"""Read a DTD from a file-like object and return the libxml2 DTD.
+
+    Re-raises any exception stored in the reader's exception context and
+    raises DTDParseError when no DTD was produced.
+    """
+    cdef tree.xmlDtd* c_dtd
+    cdef _ExceptionContext exc_context = _ExceptionContext()
+    cdef _FileReaderContext dtd_parser = _FileReaderContext(file, exc_context, None)
+    cdef _ErrorLog error_log = _ErrorLog()
+
+    with error_log:
+        c_dtd = dtd_parser._readDtd()
+
+    exc_context._raise_if_stored()
+    if c_dtd is not NULL:
+        return c_dtd
+    raise DTDParseError(u"error parsing DTD", error_log)
+
+cdef DTD _dtdFactory(tree.xmlDtd* c_dtd):
+    u"""Build a DTD object around a copy of ``c_dtd``.
+
+    Returns None when ``c_dtd`` is NULL.
+    """
+    # do not run through DTD.__init__()!
+    cdef DTD new_dtd
+    if c_dtd is not NULL:
+        new_dtd = DTD.__new__(DTD)
+        new_dtd._c_dtd = _copyDtd(c_dtd)
+        _Validator.__init__(new_dtd)
+        return new_dtd
+    return None
+
+
+cdef tree.xmlDtd* _copyDtd(tree.xmlDtd* c_orig_dtd) except NULL:
+    """
+    Return a copy of the given DTD.  Raises MemoryError if libxml2 does not
+    return a copy.
+
+    libxml2 (currently) fails to set up the element->attributes links when
+    copying DTDs, so they are rebuilt here for every attribute declaration
+    found among the children of the copy.
+    """
+    c_dtd = tree.xmlCopyDtd(c_orig_dtd)
+    if c_dtd is NULL:
+        raise MemoryError
+    cdef tree.xmlNode* c_child = c_dtd.children
+    while c_child is not NULL:
+        if c_child.type == tree.XML_ATTRIBUTE_DECL:
+            _linkDtdAttribute(c_dtd, <tree.xmlAttribute*>c_child)
+        c_child = c_child.next
+    return c_dtd
+
+
+cdef void _linkDtdAttribute(tree.xmlDtd* c_dtd, tree.xmlAttribute* c_attr):
+    """
+    Create the link to the DTD attribute declaration from the corresponding
+    element declaration.
+
+    The element declaration is looked up in ``c_dtd`` by ``c_attr.elem``.
+    Its attribute declarations form a singly linked list via ``nexth``;
+    ``c_attr`` is spliced into that list unless the walk below already
+    encounters it there.  Does nothing if no element declaration is found.
+    """
+    c_elem = dtdvalid.xmlGetDtdElementDesc(c_dtd, c_attr.elem)
+    if not c_elem:
+        # no such element? something is wrong with the DTD ...
+        return
+    c_pos = c_elem.attributes
+    if not c_pos:
+        # empty list: c_attr becomes its only entry
+        c_elem.attributes = c_attr
+        c_attr.nexth = NULL
+        return
+    # libxml2 keeps namespace declarations first, and we need to make
+    # sure we don't re-insert attributes that are already there
+    if _isDtdNsDecl(c_attr):
+        if not _isDtdNsDecl(c_pos):
+            # the list has no leading namespace declaration: insert at head
+            c_elem.attributes = c_attr
+            c_attr.nexth = c_pos
+            return
+        # advance to the last of the leading namespace declarations,
+        # stopping early if c_attr itself is encountered
+        while c_pos != c_attr and c_pos.nexth and _isDtdNsDecl(c_pos.nexth):
+            c_pos = c_pos.nexth
+    else:
+        # append at end
+        while c_pos != c_attr and c_pos.nexth:
+            c_pos = c_pos.nexth
+    if c_pos == c_attr:
+        # already linked, nothing to do
+        return
+    # splice c_attr in directly after c_pos
+    c_attr.nexth = c_pos.nexth
+    c_pos.nexth = c_attr
+
+
+cdef bint _isDtdNsDecl(tree.xmlAttribute* c_attr):
+    # True when the attribute declaration is named "xmlns" or carries the
+    # prefix "xmlns"; False otherwise.
+    if cstring_h.strcmp(<const_char*>c_attr.name, "xmlns") == 0:
+        return True
+    if c_attr.prefix is NULL:
+        return False
+    return cstring_h.strcmp(<const_char*>c_attr.prefix, "xmlns") == 0
diff --git a/lib/lxml/extensions.pxi b/lib/lxml/extensions.pxi
new file mode 100644
index 00000000..531036ef
--- /dev/null
+++ b/lib/lxml/extensions.pxi
@@ -0,0 +1,855 @@
+# support for extension functions in XPath and XSLT
+
+class XPathError(LxmlError):
+    u"""Base class of all XPath errors.
+    """
+
+class XPathEvalError(XPathError):
+    u"""Error during XPath evaluation.
+    """
+
+class XPathFunctionError(XPathEvalError):
+    u"""Internal error looking up an XPath extension function.
+    """
+
+class XPathResultError(XPathEvalError):
+    u"""Error handling an XPath result.
+    """
+
+# forward declarations
+
+# Callback type used by the (un)register*Functions() methods of
+# _BaseContext: it is called once per function as
+# ``func(ctxt, name_utf, ns_uri_utf)``.
+ctypedef int (*_register_function)(void* ctxt, name_utf, ns_uri_utf)
+# The class body follows further down in this file; _BaseContext.__init__()
+# needs the name before that point.
+cdef class _ExsltRegExp
+
+################################################################################
+# Base class for XSLT and XPath evaluation contexts: functions, namespaces, ...
+
+@cython.internal
+cdef class _BaseContext:
+    u"""Shared state of XSLT and XPath evaluation contexts.
+
+    Keeps the namespace prefixes and extension functions that get registered
+    on a libxml2 XPath context, together with the temporary references,
+    exception context and error log used while an evaluation is running.
+    """
+    cdef xpath.xmlXPathContext* _xpathCtxt
+    cdef _Document _doc
+    # {(ns_utf, name_utf): function} or None
+    cdef dict _extensions
+    # [(prefix_utf, ns_uri_utf), ...] or None
+    cdef list _namespaces
+    # prefixes added by registerNamespace()/registerGlobalNamespaces()
+    cdef list _global_namespaces
+    # original string -> UTF-8 encoded bytes, see _to_utf()
+    cdef dict _utf_refs
+    # {ns_utf: {name_utf: function}}, filled by the register*Functions()
+    cdef dict _function_cache
+    cdef dict _eval_context_dict
+    cdef bint _build_smart_strings
+    # for exception handling and temporary reference keeping:
+    cdef _TempStore _temp_refs
+    cdef set _temp_documents
+    cdef _ExceptionContext _exc
+    cdef _ErrorLog _error_log
+
+    def __cinit__(self):
+        self._xpathCtxt = NULL
+
+    def __init__(self, namespaces, extensions, error_log, enable_regexp,
+                 build_smart_strings):
+        # namespaces: dict or iterable of (prefix, ns_uri) pairs, or None
+        # extensions: dict {(ns_uri, name): function}, an iterable of such
+        #             dicts, or None
+        # Raises ValueError for an extension whose name is None and
+        # TypeError for an empty namespace prefix or URI.
+        cdef _ExsltRegExp _regexp
+        cdef dict new_extensions
+        cdef list ns
+        self._utf_refs = {}
+        self._global_namespaces = []
+        self._function_cache = {}
+        self._eval_context_dict = None
+        self._error_log = error_log
+
+        if extensions is not None:
+            # convert extensions to UTF-8
+            if isinstance(extensions, dict):
+                extensions = (extensions,)
+            # format: [ {(ns, name):function} ] -> {(ns_utf, name_utf):function}
+            new_extensions = {}
+            for extension in extensions:
+                for (ns_uri, name), function in extension.items():
+                    if name is None:
+                        raise ValueError, u"extensions must have non empty names"
+                    ns_utf   = self._to_utf(ns_uri)
+                    name_utf = self._to_utf(name)
+                    new_extensions[(ns_utf, name_utf)] = function
+            extensions = new_extensions or None
+
+        if namespaces is not None:
+            if isinstance(namespaces, dict):
+                namespaces = namespaces.items()
+            if namespaces:
+                ns = []
+                for prefix, ns_uri in namespaces:
+                    # "not x" is also true for None, no separate check needed
+                    if not prefix:
+                        raise TypeError, \
+                            u"empty namespace prefix is not supported in XPath"
+                    if not ns_uri:
+                        raise TypeError, \
+                            u"setting default namespace is not supported in XPath"
+                    prefix_utf = self._to_utf(prefix)
+                    ns_uri_utf = self._to_utf(ns_uri)
+                    ns.append( (prefix_utf, ns_uri_utf) )
+                namespaces = ns
+            else:
+                namespaces = None
+
+        self._doc        = None
+        self._exc        = _ExceptionContext()
+        self._extensions = extensions
+        self._namespaces = namespaces
+        self._temp_refs  = _TempStore()
+        self._temp_documents  = set()
+        self._build_smart_strings = build_smart_strings
+
+        if enable_regexp:
+            # adds the EXSLT regexp functions to self._extensions
+            _regexp = _ExsltRegExp()
+            _regexp._register_in_context(self)
+
+    cdef _BaseContext _copy(self):
+        u"""Create a new context of the same class that gets a copy of the
+        namespace list and of the extension function dict of this one."""
+        cdef _BaseContext context
+        if self._namespaces is not None:
+            namespaces = self._namespaces[:]
+        else:
+            namespaces = None
+        context = self.__class__(namespaces, None, self._error_log, False,
+                                 self._build_smart_strings)
+        if self._extensions is not None:
+            context._extensions = self._extensions.copy()
+        return context
+
+    cdef bytes _to_utf(self, s):
+        u"Convert to UTF-8 and keep a reference to the encoded string"
+        cdef python.PyObject* dict_result
+        if s is None:
+            return None
+        dict_result = python.PyDict_GetItem(self._utf_refs, s)
+        if dict_result is not NULL:
+            return <bytes>dict_result
+        utf = _utf8(s)
+        self._utf_refs[s] = utf
+        if python.IS_PYPY:
+            # use C level refs, PyPy refs are not enough!
+            python.Py_INCREF(utf)
+        return utf
+
+    cdef void _set_xpath_context(self, xpath.xmlXPathContext* xpathCtxt):
+        # Attach the libxml2 context and route its errors to this object.
+        self._xpathCtxt = xpathCtxt
+        xpathCtxt.userData = <void*>self
+        xpathCtxt.error = _receiveXPathError
+
+    @cython.final
+    cdef _register_context(self, _Document doc):
+        # Set the document for the coming evaluation, reset exception state.
+        self._doc = doc
+        self._exc.clear()
+
+    @cython.final
+    cdef _cleanup_context(self):
+        # Drop the per-evaluation state: UTF-8 cache, eval dict, document.
+        #xpath.xmlXPathRegisteredNsCleanup(self._xpathCtxt)
+        #self.unregisterGlobalNamespaces()
+        if python.IS_PYPY:
+            # clean up double refs in PyPy (see "_to_utf()" method)
+            for ref in self._utf_refs.itervalues():
+                python.Py_DECREF(ref)
+        self._utf_refs.clear()
+        self._eval_context_dict = None
+        self._doc = None
+
+    @cython.final
+    cdef _release_context(self):
+        # Detach from the libxml2 context (if any) without freeing it here.
+        if self._xpathCtxt is not NULL:
+            self._xpathCtxt.userData = NULL
+            self._xpathCtxt = NULL
+
+    # namespaces (internal UTF-8 methods with leading '_')
+
+    cdef addNamespace(self, prefix, ns_uri):
+        # Add or replace the prefix in the local namespace list and, if a
+        # libxml2 context is attached, register it there as well.
+        cdef list namespaces
+        if prefix is None:
+            raise TypeError, u"empty prefix is not supported in XPath"
+        prefix_utf = self._to_utf(prefix)
+        ns_uri_utf = self._to_utf(ns_uri)
+        new_item = (prefix_utf, ns_uri_utf)
+        if self._namespaces is None:
+            self._namespaces = [new_item]
+        else:
+            namespaces = []
+            for item in self._namespaces:
+                if item[0] == prefix_utf:
+                    # replace the existing entry in place
+                    item = new_item
+                    new_item = None
+                namespaces.append(item)
+            if new_item is not None:
+                namespaces.append(new_item)
+            self._namespaces = namespaces
+        if self._xpathCtxt is not NULL:
+            xpath.xmlXPathRegisterNs(
+                self._xpathCtxt, _xcstr(prefix_utf), _xcstr(ns_uri_utf))
+
+    cdef registerNamespace(self, prefix, ns_uri):
+        # Register the prefix on the libxml2 context and remember it in the
+        # list that unregisterGlobalNamespaces() cleans up.
+        if prefix is None:
+            raise TypeError, u"empty prefix is not supported in XPath"
+        prefix_utf = self._to_utf(prefix)
+        ns_uri_utf = self._to_utf(ns_uri)
+        self._global_namespaces.append(prefix_utf)
+        xpath.xmlXPathRegisterNs(self._xpathCtxt,
+                                 _xcstr(prefix_utf), _xcstr(ns_uri_utf))
+
+    cdef registerLocalNamespaces(self):
+        # Register all prefixes of the local namespace list.
+        if self._namespaces is None:
+            return
+        for prefix_utf, ns_uri_utf in self._namespaces:
+            xpath.xmlXPathRegisterNs(
+                self._xpathCtxt, _xcstr(prefix_utf), _xcstr(ns_uri_utf))
+
+    cdef registerGlobalNamespaces(self):
+        # Register the prefixes returned by _find_all_extension_prefixes().
+        cdef list ns_prefixes = _find_all_extension_prefixes()
+        if python.PyList_GET_SIZE(ns_prefixes) > 0:
+            for prefix_utf, ns_uri_utf in ns_prefixes:
+                self._global_namespaces.append(prefix_utf)
+                xpath.xmlXPathRegisterNs(
+                    self._xpathCtxt, _xcstr(prefix_utf), _xcstr(ns_uri_utf))
+
+    cdef unregisterGlobalNamespaces(self):
+        # Re-register each remembered prefix with a NULL URI, then forget it.
+        if python.PyList_GET_SIZE(self._global_namespaces) > 0:
+            for prefix_utf in self._global_namespaces:
+                xpath.xmlXPathRegisterNs(self._xpathCtxt,
+                                         _xcstr(prefix_utf), NULL)
+            del self._global_namespaces[:]
+
+    cdef void _unregisterNamespace(self, prefix_utf):
+        xpath.xmlXPathRegisterNs(self._xpathCtxt,
+                                 _xcstr(prefix_utf), NULL)
+
+    # extension functions
+
+    cdef int _addLocalExtensionFunction(self, ns_utf, name_utf, function) except -1:
+        # Store the function in the local extension dict; returns 0.
+        if self._extensions is None:
+            self._extensions = {}
+        self._extensions[(ns_utf, name_utf)] = function
+        return 0
+
+    cdef registerGlobalFunctions(self, void* ctxt,
+                                 _register_function reg_func):
+        # Cache every function of the module-level namespace registries and
+        # pass its name and namespace to reg_func().
+        cdef python.PyObject* dict_result
+        cdef dict d
+        for ns_utf, ns_functions in __FUNCTION_NAMESPACE_REGISTRIES.iteritems():
+            dict_result = python.PyDict_GetItem(
+                self._function_cache, ns_utf)
+            if dict_result is not NULL:
+                d = <dict>dict_result
+            else:
+                d = {}
+                self._function_cache[ns_utf] = d
+            for name_utf, function in ns_functions.iteritems():
+                d[name_utf] = function
+                reg_func(ctxt, name_utf, ns_utf)
+
+    cdef registerLocalFunctions(self, void* ctxt,
+                                _register_function reg_func):
+        # Cache every local extension function and pass its name and
+        # namespace to reg_func().
+        cdef python.PyObject* dict_result
+        cdef dict d
+        if self._extensions is None:
+            return # done
+        last_ns = None
+        d = None
+        for (ns_utf, name_utf), function in self._extensions.iteritems():
+            # only look up the per-namespace dict again when the namespace
+            # object differs from the one of the previous entry
+            if ns_utf is not last_ns or d is None:
+                last_ns = ns_utf
+                dict_result = python.PyDict_GetItem(
+                    self._function_cache, ns_utf)
+                if dict_result is not NULL:
+                    d = <dict>dict_result
+                else:
+                    d = {}
+                    self._function_cache[ns_utf] = d
+            d[name_utf] = function
+            reg_func(ctxt, name_utf, ns_utf)
+
+    cdef unregisterAllFunctions(self, void* ctxt,
+                                      _register_function unreg_func):
+        # Call unreg_func() for every function in the function cache.
+        for ns_utf, functions in self._function_cache.iteritems():
+            for name_utf in functions:
+                unreg_func(ctxt, name_utf, ns_utf)
+
+    cdef unregisterGlobalFunctions(self, void* ctxt,
+                                         _register_function unreg_func):
+        # Call unreg_func() for every cached function that is not one of
+        # the local extension functions.
+        for ns_utf, functions in self._function_cache.items():
+            for name_utf in functions:
+                if self._extensions is None or \
+                       (ns_utf, name_utf) not in self._extensions:
+                    unreg_func(ctxt, name_utf, ns_utf)
+
+    @cython.final
+    cdef _find_cached_function(self, const_xmlChar* c_ns_uri, const_xmlChar* c_name):
+        u"""Lookup an extension function in the cache and return it.
+
+        Parameters: c_ns_uri may be NULL, c_name must not be NULL
+
+        Returns None if the function is not in the cache.
+        """
+        cdef python.PyObject* c_dict
+        cdef python.PyObject* dict_result
+        c_dict = python.PyDict_GetItem(
+            self._function_cache, None if c_ns_uri is NULL else c_ns_uri)
+        if c_dict is not NULL:
+            dict_result = python.PyDict_GetItem(
+                <object>c_dict, <unsigned char*>c_name)
+            if dict_result is not NULL:
+                return <object>dict_result
+        return None
+
+    # Python access to the XPath context for extension functions
+
+    property context_node:
+        # The current context node of the attached XPath context as an
+        # element.  Raises XPathError when no context is attached, there is
+        # no context node, the node belongs to another document, or no
+        # document is set on this object.
+        def __get__(self):
+            cdef xmlNode* c_node
+            if self._xpathCtxt is NULL:
+                raise XPathError, \
+                    u"XPath context is only usable during the evaluation"
+            c_node = self._xpathCtxt.node
+            if c_node is NULL:
+                raise XPathError, u"no context node"
+            if c_node.doc != self._xpathCtxt.doc:
+                raise XPathError, \
+                    u"document-external context nodes are not supported"
+            if self._doc is None:
+                raise XPathError, u"document context is missing"
+            return _elementFactory(self._doc, c_node)
+
+    property eval_context:
+        # A dict that is created on first access and dropped again by
+        # _cleanup_context().
+        def __get__(self):
+            if self._eval_context_dict is None:
+                self._eval_context_dict = {}
+            return self._eval_context_dict
+
+    # Python reference keeping during XPath function evaluation
+
+    @cython.final
+    cdef _release_temp_refs(self):
+        u"Free temporarily referenced objects from this context."
+        self._temp_refs.clear()
+        self._temp_documents.clear()
+
+    @cython.final
+    cdef _hold(self, obj):
+        u"""A way to temporarily hold references to nodes in the evaluator.
+
+        This is needed because otherwise nodes created in XPath extension
+        functions would be reference counted too soon, during the XPath
+        evaluation.  This is most important in the case of exceptions.
+
+        Accepts a single element or a sequence; in a sequence, only the
+        elements are held.  Strings and non-sequences are ignored.
+        """
+        if isinstance(obj, _Element):
+            self._temp_refs.add(obj)
+            self._temp_documents.add((<_Element>obj)._doc)
+            return
+        elif _isString(obj) or not python.PySequence_Check(obj):
+            return
+        for o in obj:
+            if isinstance(o, _Element):
+                self._temp_refs.add(o)
+                self._temp_documents.add((<_Element>o)._doc)
+
+    @cython.final
+    cdef _Document _findDocumentForNode(self, xmlNode* c_node):
+        u"""If an XPath expression returns an element from a different
+        document than the current context document, we call this to
+        see if it was possibly created by an extension and is a known
+        document instance.
+
+        Returns the matching held document, or None if there is none.
+        """
+        cdef _Document doc
+        for doc in self._temp_documents:
+            if doc is not None and doc._c_doc is c_node.doc:
+                return doc
+        return None
+
+
+# libxml2 keeps these error messages in a static array in its code
+# and doesn't give us access to them ...
+#
+# The tuple is indexed by ``error code - XML_XPATH_EXPRESSION_OK`` (see
+# _forwardXPathError() below), so the order of the entries is significant.
+
+cdef tuple LIBXML2_XPATH_ERROR_MESSAGES = (
+    b"Ok",
+    b"Number encoding",
+    b"Unfinished literal",
+    b"Start of literal",
+    b"Expected $ for variable reference",
+    b"Undefined variable",
+    b"Invalid predicate",
+    b"Invalid expression",
+    b"Missing closing curly brace",
+    b"Unregistered function",
+    b"Invalid operand",
+    b"Invalid type",
+    b"Invalid number of arguments",
+    b"Invalid context size",
+    b"Invalid context position",
+    b"Memory allocation error",
+    b"Syntax error",
+    b"Resource error",
+    b"Sub resource error",
+    b"Undefined namespace prefix",
+    b"Encoding error",
+    b"Char out of XML range",
+    b"Invalid or incomplete context",
+    b"Stack usage error",
+)
+
+cdef void _forwardXPathError(void* c_ctxt, xmlerror.xmlError* c_error) with gil:
+    # Build a local copy of the reported error, supplying a message from
+    # LIBXML2_XPATH_ERROR_MESSAGES if libxml2 did not provide one, and pass
+    # it to the error log of the _BaseContext behind ``c_ctxt``.
+    cdef xmlerror.xmlError error
+    cdef int msg_index
+    error.domain = c_error.domain
+    error.code = c_error.code
+    error.level = c_error.level
+    error.line = c_error.line
+    error.int2 = c_error.int1 # column
+    error.file = c_error.file
+
+    if c_error.message is NULL:
+        msg_index = c_error.code - xmlerror.XML_XPATH_EXPRESSION_OK
+        if msg_index < 0 or msg_index >= len(LIBXML2_XPATH_ERROR_MESSAGES):
+            error.message = b"unknown error"
+        else:
+            error.message = _cstr(LIBXML2_XPATH_ERROR_MESSAGES[msg_index])
+    else:
+        error.message = c_error.message
+
+    (<_BaseContext>c_ctxt)._error_log._receive(&error)
+
+cdef void _receiveXPathError(void* c_context, xmlerror.xmlError* error) nogil:
+    # Error callback installed by _BaseContext._set_xpath_context().
+    # Errors are dropped unless __DEBUG is set; without a context object
+    # they go to the generic error forwarder.
+    if __DEBUG:
+        if c_context is not NULL:
+            _forwardXPathError(c_context, error)
+        else:
+            _forwardError(NULL, error)
+
+
+def Extension(module, function_mapping=None, *, ns=None):
+    u"""Extension(module, function_mapping=None, ns=None)
+
+    Collect extension functions from a module or from the methods of an
+    object into a dictionary.
+
+    ``function_mapping`` may be a dict that maps attribute names of
+    ``module`` to XPath function names, or a list of attribute names that
+    are exposed under their own name.  If it is omitted, every name
+    returned by ``dir(module)`` that does not start with an underscore is
+    taken.
+
+    The ``ns`` keyword argument accepts a namespace URI for the XPath
+    functions.
+
+    Returns a dict of the form ``{(ns, xpath_name): attribute}``.
+    """
+    cdef dict functions = {}
+    if isinstance(function_mapping, dict):
+        for attr_name, xpath_name in function_mapping.items():
+            functions[(ns, xpath_name)] = getattr(module, attr_name)
+        return functions
+    if function_mapping is None:
+        function_mapping = [ name for name in dir(module)
+                             if not name.startswith(u'_') ]
+    for attr_name in function_mapping:
+        functions[(ns, attr_name)] = getattr(module, attr_name)
+    return functions
+
+################################################################################
+# EXSLT regexp implementation
+
+@cython.final
+@cython.internal
+cdef class _ExsltRegExp:
+    # Implements the functions "test", "match" and "replace" that are
+    # registered under the EXSLT regular-expressions namespace.
+    # ``_compile_map`` caches compiled patterns by (pattern, ignore_case).
+    cdef dict _compile_map
+    def __cinit__(self):
+        self._compile_map = {}
+
+    cdef _make_string(self, value):
+        # Turn an XPath argument (string, node set list or other value)
+        # into a string.
+        if _isString(value):
+            return value
+        if not isinstance(value, list):
+            return unicode(value)
+        # node set: take recursive text concatenation of first element
+        if python.PyList_GET_SIZE(value) == 0:
+            return u''
+        first = value[0]
+        if _isString(first):
+            return first
+        if not isinstance(first, _Element):
+            return unicode(first)
+        c_text = tree.xmlNodeGetContent((<_Element>first)._c_node)
+        if c_text is NULL:
+            raise MemoryError()
+        try:
+            return funicode(c_text)
+        finally:
+            tree.xmlFree(c_text)
+
+    cdef _compile(self, rexp, ignore_case):
+        # Return the compiled pattern, compiling and caching it on first use.
+        cdef python.PyObject* c_cached
+        rexp = self._make_string(rexp)
+        key = (rexp, ignore_case)
+        c_cached = python.PyDict_GetItem(self._compile_map, key)
+        if c_cached is NULL:
+            py_flags = (re.UNICODE | re.IGNORECASE) if ignore_case else re.UNICODE
+            rexp_compiled = re.compile(rexp, py_flags)
+            self._compile_map[key] = rexp_compiled
+            return rexp_compiled
+        return <object>c_cached
+
+    def test(self, ctxt, s, rexp, flags=u''):
+        # True if the pattern is found anywhere in the string.
+        flags = self._make_string(flags)
+        s = self._make_string(s)
+        rexpc = self._compile(rexp, u'i' in flags)
+        return rexpc.search(s) is not None
+
+    def match(self, ctxt, s, rexp, flags=u''):
+        # Returns a list of <match> elements (children of a new <matches>
+        # element) carrying the matched text, or () if nothing matched.
+        cdef list result_list
+        flags = self._make_string(flags)
+        s = self._make_string(s)
+        rexpc = self._compile(rexp, u'i' in flags)
+        if u'g' in flags:
+            # global: all matches in the string
+            results = rexpc.findall(s)
+            if not results:
+                return ()
+        else:
+            # first match only: the whole match followed by its groups
+            found = rexpc.search(s)
+            if not found:
+                return ()
+            results = [ found.group() ]
+            results.extend( found.groups(u'') )
+        root = Element(u'matches')
+        result_list = []
+        for s_match in results:
+            if python.PyTuple_CheckExact(s_match):
+                # findall() returns tuples for patterns with several groups
+                s_match = u''.join(s_match)
+            elem = SubElement(root, u'match')
+            elem.text = s_match
+            result_list.append(elem)
+        return result_list
+
+    def replace(self, ctxt, s, rexp, flags, replacement):
+        # Substitute all matches with the 'g' flag, else only the first.
+        replacement = self._make_string(replacement)
+        flags = self._make_string(flags)
+        s = self._make_string(s)
+        rexpc = self._compile(rexp, u'i' in flags)
+        count = 0 if u'g' in flags else 1
+        return rexpc.sub(replacement, s, count)
+
+    cdef _register_in_context(self, _BaseContext context):
+        # Add the three functions as local extension functions of context.
+        ns = b"http://exslt.org/regular-expressions"
+        for name_utf, function in ((b"test",    self.test),
+                                   (b"match",   self.match),
+                                   (b"replace", self.replace)):
+            context._addLocalExtensionFunction(ns, name_utf, function)
+
+
+################################################################################
+# helper functions
+
+cdef xpath.xmlXPathObject* _wrapXPathObject(object obj, _Document doc,
+                                            _BaseContext context) except NULL:
+    # Convert a Python value into a new libxml2 XPath object.
+    #
+    # Strings, booleans and numbers become the corresponding XPath value.
+    # None, a single element or a sequence become a node set.  Strings
+    # inside a sequence are added as text nodes, which requires both
+    # ``context`` and ``doc``.
+    #
+    # Raises XPathResultError for values that cannot be converted and
+    # MemoryError if a helper node cannot be created.
+    cdef xpath.xmlNodeSet* resultSet
+    cdef _Element fake_node = None
+    cdef xmlNode* c_node
+
+    if isinstance(obj, unicode):
+        obj = _utf8(obj)
+    if isinstance(obj, bytes):
+        # libxml2 copies the string value
+        return xpath.xmlXPathNewCString(_cstr(obj))
+    # bool is tested before the generic number check below, which would
+    # otherwise also accept it
+    if isinstance(obj, bool):
+        return xpath.xmlXPathNewBoolean(obj)
+    if python.PyNumber_Check(obj):
+        return xpath.xmlXPathNewFloat(obj)
+    if obj is None:
+        # empty node set
+        resultSet = xpath.xmlXPathNodeSetCreate(NULL)
+    elif isinstance(obj, _Element):
+        # node set holding just this element's node
+        resultSet = xpath.xmlXPathNodeSetCreate((<_Element>obj)._c_node)
+    elif python.PySequence_Check(obj):
+        resultSet = xpath.xmlXPathNodeSetCreate(NULL)
+        try:
+            for value in obj:
+                if isinstance(value, _Element):
+                    if context is not None:
+                        context._hold(value)
+                    xpath.xmlXPathNodeSetAdd(resultSet, (<_Element>value)._c_node)
+                else:
+                    if context is None or doc is None:
+                        raise XPathResultError, \
+                              u"Non-Element values not supported at this point - got %r" % value
+                    # support strings by appending text nodes to an Element
+                    if isinstance(value, unicode):
+                        value = _utf8(value)
+                    if isinstance(value, bytes):
+                        if fake_node is None:
+                            # first string: create the parent element that
+                            # takes all text nodes, held by the context
+                            fake_node = _makeElement("text-root", NULL, doc, None,
+                                                     None, None, None, None, None)
+                            context._hold(fake_node)
+                        else:
+                            # append a comment node to keep the text nodes separate
+                            c_node = tree.xmlNewDocComment(doc._c_doc, <unsigned char*>"")
+                            if c_node is NULL:
+                                raise MemoryError()
+                            tree.xmlAddChild(fake_node._c_node, c_node)
+                        context._hold(value)
+                        c_node = tree.xmlNewDocText(doc._c_doc, _xcstr(value))
+                        if c_node is NULL:
+                            raise MemoryError()
+                        tree.xmlAddChild(fake_node._c_node, c_node)
+                        xpath.xmlXPathNodeSetAdd(resultSet, c_node)
+                    else:
+                        raise XPathResultError, \
+                              u"This is not a supported node-set result: %r" % value
+        except:
+            # free the partially filled node set before re-raising
+            xpath.xmlXPathFreeNodeSet(resultSet)
+            raise
+    else:
+        raise XPathResultError, u"Unknown return type: %s" % \
+            python._fqtypename(obj).decode('utf8')
+    return xpath.xmlXPathWrapNodeSet(resultSet)
+
+cdef object _unwrapXPathObject(xpath.xmlXPathObject* xpathObj,
+                               _Document doc, _BaseContext context):
+    # Convert a libxml2 XPath result object into a Python value.
+    #
+    # Node sets and XSLT result tree fragments become lists, booleans,
+    # numbers and strings map to the matching Python value.  Strings are
+    # wrapped as smart strings when the context asks for them.
+    # Raises XPathResultError for undefined/unknown result types and
+    # NotImplementedError for the XPointer/user types.
+    if xpathObj.type == xpath.XPATH_UNDEFINED:
+        raise XPathResultError(u"Undefined xpath result")
+
+    if xpathObj.type == xpath.XPATH_NODESET or \
+            xpathObj.type == xpath.XPATH_XSLT_TREE:
+        return _createNodeSetResult(xpathObj, doc, context)
+
+    if xpathObj.type == xpath.XPATH_BOOLEAN:
+        return xpathObj.boolval
+
+    if xpathObj.type == xpath.XPATH_NUMBER:
+        return xpathObj.floatval
+
+    if xpathObj.type == xpath.XPATH_STRING:
+        text = funicode(xpathObj.stringval)
+        if not context._build_smart_strings:
+            return text
+        # a plain string result has no parent element to refer to
+        return _elementStringResultFactory(text, None, None, 0)
+
+    # result types that are recognised but not supported
+    if xpathObj.type == xpath.XPATH_POINT:
+        raise NotImplementedError(u"XPATH_POINT")
+    if xpathObj.type == xpath.XPATH_RANGE:
+        raise NotImplementedError(u"XPATH_RANGE")
+    if xpathObj.type == xpath.XPATH_LOCATIONSET:
+        raise NotImplementedError(u"XPATH_LOCATIONSET")
+    if xpathObj.type == xpath.XPATH_USERS:
+        raise NotImplementedError(u"XPATH_USERS")
+
+    raise XPathResultError(
+        u"Unknown xpath result %s" % unicode(xpathObj.type))
+
+cdef object _createNodeSetResult(xpath.xmlXPathObject* xpathObj, _Document doc,
+                                 _BaseContext context):
+    # Build the Python list for a node set (or result tree fragment) result.
+    # A missing node set yields an empty list.
+    cdef list entries = []
+    cdef int index
+    # document nodes are only expanded for XSLT result tree fragments
+    cdef bint is_fragment = xpathObj.type == xpath.XPATH_XSLT_TREE
+    if xpathObj.nodesetval is not NULL:
+        for index in range(xpathObj.nodesetval.nodeNr):
+            _unpackNodeSetEntry(entries, xpathObj.nodesetval.nodeTab[index],
+                                doc, context, is_fragment)
+    return entries
+
+cdef _unpackNodeSetEntry(list results, xmlNode* c_node, _Document doc,
+                         _BaseContext context, bint is_fragment):
+    # Append the Python representation of the node set entry 'c_node' to
+    # 'results':
+    #   element-like nodes (per _isElement) -> element proxy
+    #   text, CDATA and attribute nodes     -> string result
+    #   namespace declarations              -> (prefix, href) tuple
+    #   document nodes                      -> their children, but only if
+    #                                          'is_fragment' is set
+    #   XInclude start/end markers          -> skipped
+    # Any other node type raises NotImplementedError.
+    cdef xmlNode* c_child
+    if _isElement(c_node):
+        if c_node.doc != doc._c_doc and c_node.doc._private is NULL:
+            # XXX: works, but maybe not always the right thing to do?
+            # XPath: only runs when extensions create or copy trees
+            #        -> we store Python refs to these, so that is OK
+            # XSLT: can it leak when merging trees from multiple sources?
+            c_node = tree.xmlDocCopyNode(c_node, doc._c_doc, 1)
+            # FIXME: call _instantiateElementFromXPath() instead?
+        results.append(
+            _fakeDocElementFactory(doc, c_node))
+    elif c_node.type == tree.XML_TEXT_NODE or \
+             c_node.type == tree.XML_CDATA_SECTION_NODE or \
+             c_node.type == tree.XML_ATTRIBUTE_NODE:
+        results.append(
+            _buildElementStringResult(doc, c_node, context))
+    elif c_node.type == tree.XML_NAMESPACE_DECL:
+        # namespace entries are really xmlNs structs, hence the casts
+        results.append( (funicodeOrNone((<xmlNs*>c_node).prefix),
+                         funicodeOrNone((<xmlNs*>c_node).href)) )
+    elif c_node.type == tree.XML_DOCUMENT_NODE or \
+            c_node.type == tree.XML_HTML_DOCUMENT_NODE:
+        # ignored for everything but result tree fragments
+        if is_fragment:
+            # unpack the top-level children; they are passed is_fragment=0,
+            # so a document node found among them is ignored
+            c_child = c_node.children
+            while c_child is not NULL:
+                _unpackNodeSetEntry(results, c_child, doc, context, 0)
+                c_child = c_child.next
+    elif c_node.type == tree.XML_XINCLUDE_START or \
+            c_node.type == tree.XML_XINCLUDE_END:
+        pass
+    else:
+        raise NotImplementedError, \
+            u"Not yet implemented result node type: %d" % c_node.type
+
+cdef void _freeXPathObject(xpath.xmlXPathObject* xpathObj):
+    u"""Free the XPath object, but *never* free the *content* of node sets.
+    Python dealloc will do that for us.
+    """
+    if xpathObj.nodesetval is not NULL:
+        # release the node set itself and reset the pointer before the
+        # object is freed below, so that it is not handled a second time
+        xpath.xmlXPathFreeNodeSet(xpathObj.nodesetval)
+        xpathObj.nodesetval = NULL
+    xpath.xmlXPathFreeObject(xpathObj)
+
+cdef _Element _instantiateElementFromXPath(xmlNode* c_node, _Document doc,
+                                           _BaseContext context):
+    # Return an element proxy for 'c_node', a node found while evaluating
+    # an XPath expression against 'doc'.
+    #
+    # Nodes that belong to another document known to the context are bound
+    # to that document.  Nodes from an unknown document are copied into
+    # 'doc' first.
+    # NOTE: this may copy the element - only call this when it can't leak
+    cdef _Document node_doc
+    if c_node.doc != doc._c_doc and c_node.doc._private is NULL:
+        # not from the context document and not from a fake document
+        # either => may still be from a known document, e.g. one
+        # created by an extension function
+        node_doc = context._findDocumentForNode(c_node)
+        if node_doc is None:
+            # not from a known document at all! => can only make a
+            # safety copy here.  'doc' must still be the context document
+            # at this point: it is the target of the copy and the owner
+            # of the proxy created below.
+            c_node = tree.xmlDocCopyNode(c_node, doc._c_doc, 1)
+        else:
+            doc = node_doc
+    return _fakeDocElementFactory(doc, c_node)
+
+################################################################################
+# special str/unicode subclasses
+
+@cython.final
+cdef class _ElementUnicodeResult(unicode):
+    # unicode subclass for XPath string results that remembers where the
+    # string came from.  The fields are filled in by
+    # _elementStringResultFactory().
+    cdef _Element _parent            # element the string belongs to, or None
+    cdef readonly object attrname    # attribute name, None for non-attribute results
+    cdef readonly bint is_tail       # set when the string is the tail text of _parent
+    cdef readonly bint is_text       # set when there is a parent and the string is neither tail nor attribute
+    cdef readonly bint is_attribute  # set when attrname is not None
+
+    def getparent(self):
+        # public accessor for the element stored in _parent
+        return self._parent
+
+class _ElementStringResult(bytes):
+    # bytes counterpart of _ElementUnicodeResult.  _parent, attrname and the
+    # is_* flags are plain instance attributes that
+    # _elementStringResultFactory() assigns after creation.
+    # we need to use a Python class here, bytes cannot be C-subclassed
+    # in Pyrex/Cython
+    def getparent(self):
+        # public accessor for the element stored in _parent
+        return self._parent
+
+cdef object _elementStringResultFactory(string_value, _Element parent,
+                                        attrname, bint is_tail):
+    # Wrap 'string_value' in a smart string that knows its origin.
+    #
+    # bytes values become _ElementStringResult objects, everything else
+    # becomes an _ElementUnicodeResult.  The result counts as an attribute
+    # value when 'attrname' is given, and as element text only if it has a
+    # parent and is neither tail text nor an attribute value.
+    cdef _ElementUnicodeResult uresult
+    cdef bint is_attribute = attrname is not None
+    cdef bint is_text = parent is not None and not (is_tail or is_attribute)
+
+    if type(string_value) is not bytes:
+        uresult = _ElementUnicodeResult(string_value)
+        uresult._parent = parent
+        uresult.attrname = attrname
+        uresult.is_attribute = is_attribute
+        uresult.is_tail = is_tail
+        uresult.is_text = is_text
+        return uresult
+
+    result = _ElementStringResult(string_value)
+    result._parent = parent
+    result.attrname = attrname
+    result.is_attribute = is_attribute
+    result.is_tail = is_tail
+    result.is_text = is_text
+    return result
+
+cdef object _buildElementStringResult(_Document doc, xmlNode* c_node,
+                                      _BaseContext context):
+    # Build the Python string result for a text, CDATA or attribute node.
+    #
+    # Returns the plain unicode value when the context does not ask for
+    # smart strings.  Otherwise the value is wrapped so that it carries the
+    # element it belongs to (if one is found), the attribute name and the
+    # tail flag.
+    cdef _Element parent = None
+    cdef object attrname = None
+    cdef xmlNode* c_element
+    cdef bint is_tail
+
+    if c_node.type == tree.XML_ATTRIBUTE_NODE:
+        attrname = _namespacedName(c_node)
+        is_tail = 0
+        # the content buffer is handed to xmlFree() once it was converted
+        s = tree.xmlNodeGetContent(c_node)
+        try:
+            value = funicode(s)
+        finally:
+            tree.xmlFree(s)
+        c_element = NULL
+    else:
+        #assert c_node.type == tree.XML_TEXT_NODE or c_node.type == tree.XML_CDATA_SECTION_NODE, "invalid node type"
+        # may be tail text or normal text
+        value = funicode(c_node.content)
+        # a result from _previousElement() marks the text as tail text of
+        # that element
+        c_element = _previousElement(c_node)
+        is_tail = c_element is not NULL
+
+    if not context._build_smart_strings:
+        return value
+
+    if c_element is NULL:
+        # non-tail text or attribute text
+        # => walk up the ancestors to the closest element
+        c_element = c_node.parent
+        while c_element is not NULL and not _isElement(c_element):
+            c_element = c_element.parent
+
+    if c_element is not NULL:
+        parent = _instantiateElementFromXPath(c_element, doc, context)
+
+    return _elementStringResultFactory(
+        value, parent, attrname, is_tail)
+
+################################################################################
+# callbacks for XPath/XSLT extension functions
+
+cdef void _extension_function_call(_BaseContext context, function,
+                                   xpath.xmlXPathParserContext* ctxt, int nargs):
+    # Call the Python extension 'function' with 'nargs' arguments taken
+    # from the XPath value stack of 'ctxt' and push its wrapped result.
+    #
+    # Never raises: any exception is stored in the context's exception
+    # holder and reported to libxml2 as XPATH_EXPR_ERROR.
+    cdef _Document doc
+    cdef xpath.xmlXPathObject* obj
+    cdef list args
+    cdef int i
+    doc = context._doc
+    try:
+        args = []
+        for i in range(nargs):
+            obj = xpath.valuePop(ctxt)
+            o = _unwrapXPathObject(obj, doc, context)
+            _freeXPathObject(obj)
+            args.append(o)
+        # the values were popped last-to-first (presumably; stack order),
+        # so restore the call order
+        args.reverse()
+
+        res = function(context, *args)
+        # wrap result for XPath consumption
+        obj = _wrapXPathObject(res, doc, context)
+        # prevent Python from deallocating elements handed to libxml2
+        context._hold(res)
+        xpath.valuePush(ctxt, obj)
+    except:
+        xpath.xmlXPathErr(ctxt, xpath.XPATH_EXPR_ERROR)
+        context._exc._store_raised()
+    finally:
+        return  # swallow any further exceptions
+
+# lookup the function by name and call it
+
+cdef void _xpath_function_call(xpath.xmlXPathParserContext* ctxt,
+                               int nargs) with gil:
+    # Callback that runs with the GIL held: look up the Python function
+    # for the (functionURI, function) pair of the XPath context and call
+    # it.  Unknown functions and unexpected errors are stored in the
+    # context's exception holder and signalled to libxml2 as
+    # XPATH_UNKNOWN_FUNC_ERROR.  Never raises.
+    cdef _BaseContext context
+    cdef xpath.xmlXPathContext* rctxt = ctxt.context
+    # the owning Python context object is stored in the userData slot
+    context = <_BaseContext> rctxt.userData
+    try:
+        function = context._find_cached_function(rctxt.functionURI, rctxt.function)
+        if function is not None:
+            _extension_function_call(context, function, ctxt, nargs)
+        else:
+            xpath.xmlXPathErr(ctxt, xpath.XPATH_UNKNOWN_FUNC_ERROR)
+            context._exc._store_exception(
+                XPathFunctionError(u"XPath function '%s' not found" %
+                _namespacedNameFromNsName(rctxt.functionURI, rctxt.function)))
+    except:
+        # may not be the right error, but we need to tell libxml2 *something*
+        xpath.xmlXPathErr(ctxt, xpath.XPATH_UNKNOWN_FUNC_ERROR)
+        context._exc._store_raised()
+    finally:
+        return  # swallow any further exceptions
diff --git a/lib/lxml/html/ElementSoup.py b/lib/lxml/html/ElementSoup.py
new file mode 100644
index 00000000..8e4fde13
--- /dev/null
+++ b/lib/lxml/html/ElementSoup.py
@@ -0,0 +1,10 @@
+__doc__ = """Legacy interface to the BeautifulSoup HTML parser.
+"""
+
+__all__ = ["parse", "convert_tree"]
+
+from soupparser import convert_tree, parse as _parse
+
+def parse(file, beautifulsoup=None, makeelement=None):
+    root = _parse(file, beautifulsoup=beautifulsoup, makeelement=makeelement)
+    return root.getroot()
diff --git a/lib/lxml/html/__init__.py b/lib/lxml/html/__init__.py
new file mode 100644
index 00000000..fe28c3bb
--- /dev/null
+++ b/lib/lxml/html/__init__.py
@@ -0,0 +1,1697 @@
+# Copyright (c) 2004 Ian Bicking. All rights reserved.
+#
+# Redistribution and use in source and binary forms, with or without
+# modification, are permitted provided that the following conditions are
+# met:
+#
+# 1. Redistributions of source code must retain the above copyright
+# notice, this list of conditions and the following disclaimer.
+#
+# 2. Redistributions in binary form must reproduce the above copyright
+# notice, this list of conditions and the following disclaimer in
+# the documentation and/or other materials provided with the
+# distribution.
+#
+# 3. Neither the name of Ian Bicking nor the names of its contributors may
+# be used to endorse or promote products derived from this software
+# without specific prior written permission.
+#
+# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL IAN BICKING OR
+# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
+# LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
+# NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+# SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+"""The ``lxml.html`` tool set for HTML handling.
+"""
+
+import sys
+import re
+try:
+    from urlparse import urljoin
+except ImportError:
+    # Python 3
+    from urllib.parse import urljoin
+import copy
+from lxml import etree
+from lxml.html import defs
+from lxml.html._setmixin import SetMixin
+try:
+    from collections import MutableMapping as DictMixin
+except ImportError:
+    # Python < 2.6
+    from UserDict import DictMixin
+try:
+    set
+except NameError:
+    # Python 2.3
+    from sets import Set as set
+try:
+    bytes
+except NameError:
+    # Python < 2.6
+    bytes = str
+try:
+    unicode
+except NameError:
+    # Python 3
+    unicode = str
+try:
+    basestring
+except NameError:
+    # Python 3
+    basestring = (str, bytes)
+
+def __fix_docstring(s):
+    if not s:
+        return s
+    import sys
+    if sys.version_info[0] >= 3:
+        sub = re.compile(r"^(\s*)u'", re.M).sub
+    else:
+        sub = re.compile(r"^(\s*)b'", re.M).sub
+    return sub(r"\1'", s)
+
+__all__ = [
+    'document_fromstring', 'fragment_fromstring', 'fragments_fromstring', 'fromstring',
+    'tostring', 'Element', 'defs', 'open_in_browser', 'submit_form',
+    'find_rel_links', 'find_class', 'make_links_absolute',
+    'resolve_base_href', 'iterlinks', 'rewrite_links', 'open_in_browser', 'parse']
+
+# Namespace URI of XHTML.  The XPath helpers below bind it to the prefix
+# 'x' so that they match both plain and XHTML-namespaced elements.
+XHTML_NAMESPACE = "http://www.w3.org/1999/xhtml"
+
+# <a> elements that carry a rel attribute
+_rel_links_xpath = etree.XPath("descendant-or-self::a[@rel]|descendant-or-self::x:a[@rel]",
+                               namespaces={'x':XHTML_NAMESPACE})
+# all <option> elements
+_options_xpath = etree.XPath("descendant-or-self::option|descendant-or-self::x:option",
+                             namespaces={'x':XHTML_NAMESPACE})
+# all <form> elements
+_forms_xpath = etree.XPath("descendant-or-self::form|descendant-or-self::x:form",
+                           namespaces={'x':XHTML_NAMESPACE})
+#_class_xpath = etree.XPath(r"descendant-or-self::*[regexp:match(@class, concat('\b', $class_name, '\b'))]", {'regexp': 'http://exslt.org/regular-expressions'})
+# elements whose whitespace-separated class attribute contains $class_name
+_class_xpath = etree.XPath("descendant-or-self::*[@class and contains(concat(' ', normalize-space(@class), ' '), concat(' ', $class_name, ' '))]")
+# elements whose id attribute equals $id
+_id_xpath = etree.XPath("descendant-or-self::*[@id=$id]")
+# string value of the context node
+_collect_string_content = etree.XPath("string()")
+# url(...) references in CSS (case-insensitive); group 1 is the URL
+# including any surrounding quotes
+_css_url_re = re.compile(r'url\(('+'["][^"]*["]|'+"['][^']*[']|"+r'[^)]*)\)', re.I)
+# @import "..." statements in CSS (double quotes only); group 1 is the URL
+_css_import_re = re.compile(r'@import "(.*?)"')
+# <label> elements whose for attribute equals $id
+_label_xpath = etree.XPath("//label[@for=$id]|//x:label[@for=$id]",
+                           namespaces={'x':XHTML_NAMESPACE})
+# one space-separated entry of an <object archive="..."> value
+_archive_re = re.compile(r'[^ ]+')
+
+def _unquote_match(s, pos):
+    if s[:1] == '"' and s[-1:] == '"' or s[:1] == "'" and s[-1:] == "'":
+        return s[1:-1], pos+1
+    else:
+        return s,pos
+
+def _transform_result(typ, result):
+    """Convert the result back into the input type.
+    """
+    if issubclass(typ, bytes):
+        return tostring(result, encoding='utf-8')
+    elif issubclass(typ, unicode):
+        return tostring(result, encoding='unicode')
+    else:
+        return result
+
+def _nons(tag):
+    if isinstance(tag, basestring):
+        if tag[0] == '{' and tag[1:len(XHTML_NAMESPACE)+1] == XHTML_NAMESPACE:
+            return tag.split('}')[-1]
+    return tag
+
+class HtmlMixin(object):
+
+    def base_url(self):
+        """
+        Returns the base URL, given when the page was parsed.
+
+        Use with ``urlparse.urljoin(el.base_url, href)`` to get
+        absolute URLs.
+        """
+        return self.getroottree().docinfo.URL
+    base_url = property(base_url, doc=base_url.__doc__)
+
+    def forms(self):
+        """
+        Return a list of all the forms
+        """
+        return _forms_xpath(self)
+    forms = property(forms, doc=forms.__doc__)
+
+    def body(self):
+        """
+        Return the <body> element.  Can be called from a child element
+        to get the document's head.
+        """
+        return self.xpath('//body|//x:body', namespaces={'x':XHTML_NAMESPACE})[0]
+    body = property(body, doc=body.__doc__)
+
+    def head(self):
+        """
+        Returns the <head> element.  Can be called from a child
+        element to get the document's head.
+        """
+        return self.xpath('//head|//x:head', namespaces={'x':XHTML_NAMESPACE})[0]
+    head = property(head, doc=head.__doc__)
+
+    def _label__get(self):
+        """
+        Get or set any <label> element associated with this element.
+        """
+        id = self.get('id')
+        if not id:
+            return None
+        result = _label_xpath(self, id=id)
+        if not result:
+            return None
+        else:
+            return result[0]
+    def _label__set(self, label):
+        id = self.get('id')
+        if not id:
+            raise TypeError(
+                "You cannot set a label for an element (%r) that has no id"
+                % self)
+        if _nons(label.tag) != 'label':
+            raise TypeError(
+                "You can only assign label to a label element (not %r)"
+                % label)
+        label.set('for', id)
+    def _label__del(self):
+        label = self.label
+        if label is not None:
+            del label.attrib['for']
+    label = property(_label__get, _label__set, _label__del, doc=_label__get.__doc__)
+
+    def drop_tree(self):
+        """
+        Removes this element from the tree, including its children and
+        text.  The tail text is joined to the previous element or
+        parent.
+        """
+        parent = self.getparent()
+        assert parent is not None
+        if self.tail:
+            previous = self.getprevious()
+            if previous is None:
+                parent.text = (parent.text or '') + self.tail
+            else:
+                previous.tail = (previous.tail or '') + self.tail
+        parent.remove(self)
+
+    def drop_tag(self):
+        """
+        Remove the tag, but not its children or text.  The children and text
+        are merged into the parent.
+
+        Example::
+
+            >>> h = fragment_fromstring('<div>Hello <b>World!</b></div>')
+            >>> h.find('.//b').drop_tag()
+            >>> print(tostring(h, encoding='unicode'))
+            <div>Hello World!</div>
+        """
+        parent = self.getparent()
+        assert parent is not None
+        previous = self.getprevious()
+        if self.text and isinstance(self.tag, basestring):
+            # not a Comment, etc.
+            if previous is None:
+                parent.text = (parent.text or '') + self.text
+            else:
+                previous.tail = (previous.tail or '') + self.text
+        if self.tail:
+            if len(self):
+                last = self[-1]
+                last.tail = (last.tail or '') + self.tail
+            elif previous is None:
+                parent.text = (parent.text or '') + self.tail
+            else:
+                previous.tail = (previous.tail or '') + self.tail
+        index = parent.index(self)
+        parent[index:index+1] = self[:]
+
+    def find_rel_links(self, rel):
+        """
+        Find any links like ``<a rel="{rel}">...</a>``; returns a list of elements.
+        """
+        rel = rel.lower()
+        return [el for el in _rel_links_xpath(self)
+                if el.get('rel').lower() == rel]
+
+    def find_class(self, class_name):
+        """
+        Find any elements with the given class name.
+        """
+        return _class_xpath(self, class_name=class_name)
+
+    def get_element_by_id(self, id, *default):
+        """
+        Get the first element in a document with the given id.  If none is
+        found, return the default argument if provided or raise KeyError
+        otherwise.
+
+        Note that there can be more than one element with the same id,
+        and this isn't uncommon in HTML documents found in the wild.
+        Browsers return only the first match, and this function does
+        the same.
+        """
+        try:
+            # FIXME: should this check for multiple matches?
+            # browsers just return the first one
+            return _id_xpath(self, id=id)[0]
+        except IndexError:
+            if default:
+                return default[0]
+            else:
+                raise KeyError(id)
+
+    def text_content(self):
+        """
+        Return the text content of the tag (and the text in any children).
+        """
+        return _collect_string_content(self)
+
+    def cssselect(self, expr, translator='html'):
+        """
+        Run the CSS expression on this element and its children,
+        returning a list of the results.
+
+        Equivalent to lxml.cssselect.CSSSelect(expr, translator='html')(self)
+        -- note that pre-compiling the expression can provide a substantial
+        speedup.
+        """
+        # Do the import here to make the dependency optional.
+        from lxml.cssselect import CSSSelector
+        return CSSSelector(expr, translator=translator)(self)
+
+    ########################################
+    ## Link functions
+    ########################################
+
+    def make_links_absolute(self, base_url=None, resolve_base_href=True,
+                            handle_failures=None):
+        """
+        Make all links in the document absolute, given the
+        ``base_url`` for the document (the full URL where the document
+        came from), or if no ``base_url`` is given, then the ``.base_url``
+        of the document.
+
+        If ``resolve_base_href`` is true, then any ``<base href>``
+        tags in the document are used *and* removed from the document.
+        If it is false then any such tag is ignored.
+
+        If ``handle_failures`` is None (default), a failure to process
+        a URL will abort the processing.  If set to 'ignore', errors
+        are ignored.  If set to 'discard', failing URLs will be removed.
+        """
+        if base_url is None:
+            base_url = self.base_url
+            if base_url is None:
+                raise TypeError(
+                    "No base_url given, and the document has no base_url")
+        if resolve_base_href:
+            self.resolve_base_href()
+
+        if handle_failures == 'ignore':
+            def link_repl(href):
+                try:
+                    return urljoin(base_url, href)
+                except ValueError:
+                    return href
+        elif handle_failures == 'discard':
+            def link_repl(href):
+                try:
+                    return urljoin(base_url, href)
+                except ValueError:
+                    return None
+        elif handle_failures is None:
+            def link_repl(href):
+                return urljoin(base_url, href)
+        else:
+            raise ValueError(
+                "unexpected value for handle_failures: %r" % handle_failures)
+
+        self.rewrite_links(link_repl)
+
+    def resolve_base_href(self, handle_failures=None):
+        """
+        Find any ``<base href>`` tag in the document, and apply its
+        values to all links found in the document.  Also remove the
+        tag once it has been applied.
+
+        If ``handle_failures`` is None (default), a failure to process
+        a URL will abort the processing.  If set to 'ignore', errors
+        are ignored.  If set to 'discard', failing URLs will be removed.
+        """
+        base_href = None
+        basetags = self.xpath('//base[@href]|//x:base[@href]',
+                              namespaces={'x': XHTML_NAMESPACE})
+        for b in basetags:
+            base_href = b.get('href')
+            b.drop_tree()
+        if not base_href:
+            return
+        self.make_links_absolute(base_href, resolve_base_href=False,
+                                 handle_failures=handle_failures)
+
+    def iterlinks(self):
+        """
+        Yield (element, attribute, link, pos), where attribute may be None
+        (indicating the link is in the text).  ``pos`` is the position
+        where the link occurs; often 0, but sometimes something else in
+        the case of links in stylesheets or style tags.
+
+        Note: <base href> is *not* taken into account in any way.  The
+        link you get is exactly the link in the document.
+
+        Note: multiple links inside of a single text string or
+        attribute value are returned in reversed order.  This makes it
+        possible to replace or delete them from the text string value
+        based on their reported text positions.  Otherwise, a
+        modification at one text position can change the positions of
+        links reported later on.
+        """
+        link_attrs = defs.link_attrs
+        for el in self.iter(etree.Element):
+            attribs = el.attrib
+            tag = _nons(el.tag)
+            if tag != 'object':
+                for attrib in link_attrs:
+                    if attrib in attribs:
+                        yield (el, attrib, attribs[attrib], 0)
+            elif tag == 'object':
+                codebase = None
+                ## <object> tags have attributes that are relative to
+                ## codebase
+                if 'codebase' in attribs:
+                    codebase = el.get('codebase')
+                    yield (el, 'codebase', codebase, 0)
+                for attrib in 'classid', 'data':
+                    if attrib in attribs:
+                        value = el.get(attrib)
+                        if codebase is not None:
+                            value = urljoin(codebase, value)
+                        yield (el, attrib, value, 0)
+                if 'archive' in attribs:
+                    for match in _archive_re.finditer(el.get('archive')):
+                        value = match.group(0)
+                        if codebase is not None:
+                            value = urljoin(codebase, value)
+                        yield (el, 'archive', value, match.start())
+            if tag == 'param':
+                valuetype = el.get('valuetype') or ''
+                if valuetype.lower() == 'ref':
+                    ## FIXME: while it's fine we *find* this link,
+                    ## according to the spec we aren't supposed to
+                    ## actually change the value, including resolving
+                    ## it.  It can also still be a link, even if it
+                    ## doesn't have a valuetype="ref" (which seems to be the norm)
+                    ## http://www.w3.org/TR/html401/struct/objects.html#adef-valuetype
+                    yield (el, 'value', el.get('value'), 0)
+            if tag == 'style' and el.text:
+                urls = [
+                    _unquote_match(match.group(1), match.start(1))
+                    for match in _css_url_re.finditer(el.text)
+                    ] + [
+                    (match.group(1), match.start(1))
+                    for match in _css_import_re.finditer(el.text)
+                    ]
+                if urls:
+                    # sort by start pos to bring both match sets back into order
+                    urls = [ (start, url) for (url, start) in urls ]
+                    urls.sort()
+                    # reverse the list to report correct positions despite
+                    # modifications
+                    urls.reverse()
+                    for start, url in urls:
+                        yield (el, None, url, start)
+            if 'style' in attribs:
+                urls = list(_css_url_re.finditer(attribs['style']))
+                if urls:
+                    # return in reversed order to simplify in-place modifications
+                    for match in urls[::-1]:
+                        url, start = _unquote_match(match.group(1), match.start(1))
+                        yield (el, 'style', url, start)
+
+    def rewrite_links(self, link_repl_func, resolve_base_href=True,
+                      base_href=None):
+        """
+        Rewrite all the links in the document.  For each link
+        ``link_repl_func(link)`` will be called, and the return value
+        will replace the old link.
+
+        Note that links may not be absolute (unless you first called
+        ``make_links_absolute()``), and may be internal (e.g.,
+        ``'#anchor'``).  They can also be values like
+        ``'mailto:email'`` or ``'javascript:expr'``.
+
+        If you give ``base_href`` then all links passed to
+        ``link_repl_func()`` will take that into account.
+
+        If the ``link_repl_func`` returns None, the attribute or
+        tag text will be removed completely.
+        """
+        if base_href is not None:
+            # FIXME: this can be done in one pass with a wrapper
+            # around link_repl_func
+            self.make_links_absolute(
+                base_href, resolve_base_href=resolve_base_href)
+        elif resolve_base_href:
+            self.resolve_base_href()
+
+        for el, attrib, link, pos in self.iterlinks():
+            new_link = link_repl_func(link.strip())
+            if new_link == link:
+                continue
+            if new_link is None:
+                # Remove the attribute or element content
+                if attrib is None:
+                    el.text = ''
+                else:
+                    del el.attrib[attrib]
+                continue
+
+            if attrib is None:
+                new = el.text[:pos] + new_link + el.text[pos+len(link):]
+                el.text = new
+            else:
+                cur = el.get(attrib)
+                if not pos and len(cur) == len(link):
+                    new = new_link  # most common case
+                else:
+                    new = cur[:pos] + new_link + cur[pos+len(link):]
+                el.set(attrib, new)
+
+
+class _MethodFunc(object):
+    """
+    Callable wrapper that exposes an element method as a plain function.
+
+    The function form takes either an element or an HTML string as its
+    first argument; a string is parsed with ``fromstring()`` first.  The
+    method's own return value is handed back, except that a ``None``
+    result (taken to mean the method worked in-place) is replaced by
+    ``_transform_result(type_of_input, doc)``.
+
+    For element inputs the ``copy`` keyword (defaulting to the value given
+    to the constructor) decides whether the method runs on a deep copy.
+    Passing ``copy`` together with a string input raises ``TypeError``.
+    """
+    def __init__(self, name, copy=False, source_class=HtmlMixin):
+        # Re-use the wrapped method's docstring for the function form.
+        self.__doc__ = getattr(source_class, name).__doc__
+        self.name = name
+        self.copy = copy
+    def __call__(self, doc, *args, **kw):
+        input_type = type(doc)
+        if not isinstance(doc, basestring):
+            # Element input: honour an explicit copy=..., else the default.
+            if kw.pop('copy', self.copy):
+                doc = copy.deepcopy(doc)
+        elif 'copy' in kw:
+            raise TypeError(
+                "The keyword 'copy' can only be used with element inputs to %s, not a string input" % self.name)
+        else:
+            doc = fromstring(doc, **kw)
+        outcome = getattr(doc, self.name)(*args, **kw)
+        # FIXME: this None test is a bit sloppy
+        if outcome is not None:
+            return outcome
+        # In-place method: give back the document in the form we got it.
+        return _transform_result(input_type, doc)
+
+# Module-level function forms of the HtmlMixin methods.  Each one accepts
+# either an element or an HTML string as its first argument (see
+# _MethodFunc).  ``copy`` is the default for whether an element argument is
+# deep-copied before the method is invoked on it.
+find_rel_links = _MethodFunc('find_rel_links', copy=False)
+find_class = _MethodFunc('find_class', copy=False)
+make_links_absolute = _MethodFunc('make_links_absolute', copy=True)
+resolve_base_href = _MethodFunc('resolve_base_href', copy=True)
+iterlinks = _MethodFunc('iterlinks', copy=False)
+rewrite_links = _MethodFunc('rewrite_links', copy=True)
+
+class HtmlComment(etree.CommentBase, HtmlMixin):
+    """Comment node class that adds the HtmlMixin methods."""
+    pass
+
+class HtmlElement(etree.ElementBase, HtmlMixin):
+    """Element class that adds the HtmlMixin methods."""
+    pass
+
+class HtmlProcessingInstruction(etree.PIBase, HtmlMixin):
+    """Processing-instruction node class that adds the HtmlMixin methods."""
+    pass
+
+class HtmlEntity(etree.EntityBase, HtmlMixin):
+    """Entity node class that adds the HtmlMixin methods."""
+    pass
+
+
+class HtmlElementClassLookup(etree.CustomElementClassLookup):
+    """A lookup scheme for HTML Element classes.
+
+    To create a lookup instance with different Element classes, pass a tag
+    name mapping of Element classes in the ``classes`` keyword argument and/or
+    a tag name mapping of Mixin classes in the ``mixins`` keyword argument.
+    ``mixins`` may be given either as a mapping or as an iterable of
+    ``(tag_name, mixin_class)`` pairs.
+
+    The special key '*' denotes a Mixin class that should be mixed into all
+    Element classes that have an entry in ``classes``.
+    """
+    # Tag name -> element class; filled in by the element modules below.
+    _default_element_classes = {}
+
+    def __init__(self, classes=None, mixins=None):
+        etree.CustomElementClassLookup.__init__(self)
+        if classes is None:
+            classes = self._default_element_classes.copy()
+        if mixins:
+            # Iterating a mapping directly would yield bare keys and break
+            # the pair unpacking below, so normalise to (name, mixin) pairs.
+            if hasattr(mixins, 'items'):
+                mixins = mixins.items()
+            mixers = {}
+            for name, value in mixins:
+                if name == '*':
+                    for n in classes.keys():
+                        mixers.setdefault(n, []).append(value)
+                else:
+                    mixers.setdefault(name, []).append(value)
+            for name, mix_bases in mixers.items():
+                # Mixins go first in the bases so they override the element
+                # class they are mixed into.
+                cur = classes.get(name, HtmlElement)
+                bases = tuple(mix_bases + [cur])
+                classes[name] = type(cur.__name__, bases, {})
+        self._element_classes = classes
+
+    def lookup(self, node_type, document, namespace, name):
+        """
+        Return the class to use for a node of the given type.
+
+        Elements are looked up by lower-cased tag name, with HtmlElement as
+        the default.  Returning None for an unknown node type defers to
+        the normal lookup.
+        """
+        if node_type == 'element':
+            return self._element_classes.get(name.lower(), HtmlElement)
+        elif node_type == 'comment':
+            return HtmlComment
+        elif node_type == 'PI':
+            return HtmlProcessingInstruction
+        elif node_type == 'entity':
+            return HtmlEntity
+        # Otherwise normal lookup
+        return None
+
+################################################################################
+# parsing
+################################################################################
+
+# Matchers that report whether a string starts (after optional whitespace)
+# with an ``<html`` or ``<!doctype`` tag, ignoring case.  There is one
+# variant for unicode text and one for byte strings.
+_looks_like_full_html_unicode = re.compile(
+    unicode(r'^\s*<(?:html|!doctype)'), re.I).match
+_looks_like_full_html_bytes = re.compile(
+    r'^\s*<(?:html|!doctype)'.encode('ascii'), re.I).match
+
+def document_fromstring(html, parser=None, **kw):
+    """
+    Parse ``html`` as a complete document and return its root element.
+
+    Uses ``html_parser`` unless another ``parser`` is given; extra keyword
+    arguments are passed on to ``etree.fromstring()``.  Raises
+    ``etree.ParserError`` if parsing produces no root element.
+    """
+    chosen_parser = parser
+    if chosen_parser is None:
+        chosen_parser = html_parser
+    root = etree.fromstring(html, chosen_parser, **kw)
+    if root is not None:
+        return root
+    raise etree.ParserError(
+        "Document is empty")
+
+def fragments_fromstring(html, no_leading_text=False, base_url=None,
+                         parser=None, **kw):
+    """
+    Parse a run of HTML elements and return them as a list.
+
+    If the input starts with text that is not just whitespace, that text
+    becomes the first item of the list (as a string).  With
+    ``no_leading_text`` set, such text raises ``etree.ParserError``
+    instead, so the list only ever holds elements.
+
+    base_url will set the document's base_url attribute (and the tree's docinfo.URL)
+    """
+    if parser is None:
+        parser = html_parser
+    # FIXME: check what happens when you give html with a body, head, etc.
+    # Input that does not already look like a full document gets wrapped in
+    # an artificial <html><body> so the parser produces a predictable tree.
+    if isinstance(html, bytes):
+        if not _looks_like_full_html_bytes(html):
+            # can't use %-formatting in early Py3 versions
+            opening = '<html><body>'.encode('ascii')
+            closing = '</body></html>'.encode('ascii')
+            html = opening + html + closing
+    elif not _looks_like_full_html_unicode(html):
+        html = '<html><body>%s</body></html>' % html
+    doc = document_fromstring(html, parser=parser, base_url=base_url, **kw)
+    assert _nons(doc.tag) == 'html'
+    bodies = [e for e in doc if _nons(e.tag) == 'body']
+    assert len(bodies) == 1, ("too many bodies: %r in %r" % (bodies, html))
+    body = bodies[0]
+    elements = []
+    leading = body.text
+    if leading and leading.strip():
+        if no_leading_text:
+            raise etree.ParserError(
+                "There is leading text: %r" % leading)
+        elements.append(leading)
+    elements.extend(body)
+    # FIXME: removing the reference to the parent artificial document
+    # would be nice
+    return elements
+
+def fragment_fromstring(html, create_parent=False, base_url=None,
+                        parser=None, **kw):
+    """
+    Parse exactly one HTML element and return it.
+
+    Without ``create_parent``, ``etree.ParserError`` is raised if no
+    element is found, if more than one is found, or if non-whitespace text
+    comes before or after the element.
+
+    If ``create_parent`` is true, everything parsed is placed inside a new
+    parent element, which is returned; leading and trailing text is then
+    allowed.  A string value is used as the parent's tag name, any other
+    true value means ``'div'``.
+
+    base_url will set the document's base_url attribute (and the tree's docinfo.URL)
+    """
+    if parser is None:
+        parser = html_parser
+
+    # Leading text is only acceptable when there is a parent to hold it.
+    elements = fragments_fromstring(
+        html, parser=parser, no_leading_text=not create_parent,
+        base_url=base_url, **kw)
+
+    if create_parent:
+        parent_tag = create_parent
+        if not isinstance(parent_tag, basestring):
+            parent_tag = 'div'
+        wrapper = Element(parent_tag)
+        if elements:
+            first = elements[0]
+            if isinstance(first, basestring):
+                wrapper.text = first
+                del elements[0]
+            wrapper.extend(elements)
+        return wrapper
+
+    if not elements:
+        raise etree.ParserError('No elements found')
+    if len(elements) > 1:
+        found = ', '.join([_element_name(item) for item in elements])
+        raise etree.ParserError(
+            "Multiple elements found (%s)"
+            % found)
+    only = elements[0]
+    trailing = only.tail
+    if trailing and trailing.strip():
+        raise etree.ParserError(
+            "Element followed by text: %r" % trailing)
+    only.tail = None
+    return only
+
+def fromstring(html, base_url=None, parser=None, **kw):
+    """
+    Parse ``html`` and return a single element or document root.
+
+    The input may be a full document or a fragment.  What is returned:
+
+    * the document root, if the input looks like a full document, if the
+      parsed tree has a ``<head>``, or if it has no ``<body>``;
+    * the single child of ``<body>``, if that is all the body holds apart
+      from whitespace;
+    * otherwise the ``<body>`` itself, renamed to ``div`` (when it contains
+      a block-level tag) or ``span``.
+
+    base_url will set the document's base_url attribute (and the tree's docinfo.URL)
+    """
+    if parser is None:
+        parser = html_parser
+    if isinstance(html, bytes):
+        looks_full = _looks_like_full_html_bytes
+    else:
+        looks_full = _looks_like_full_html_unicode
+    is_full_html = looks_full(html)
+    doc = document_fromstring(html, parser=parser, base_url=base_url, **kw)
+    if is_full_html:
+        return doc
+
+    # otherwise, lets parse it out...
+    bodies = (doc.findall('body')
+              or doc.findall('{%s}body' % XHTML_NAMESPACE))
+    body = None
+    if bodies:
+        body = bodies[0]
+        # Somehow there can be multiple bodies, which is bad, but just
+        # smash them into one body
+        for extra_body in bodies[1:]:
+            extra_text = extra_body.text
+            if extra_text:
+                if len(body):
+                    last_child = body[-1]
+                    last_child.tail = (last_child.tail or '') + extra_text
+                else:
+                    body.text = (body.text or '') + extra_text
+            body.extend(extra_body)
+            # We'll ignore tail
+            # I guess we are ignoring attributes too
+            extra_body.drop_tree()
+
+    heads = (doc.findall('head')
+             or doc.findall('{%s}head' % XHTML_NAMESPACE))
+    if heads:
+        # Well, we have some sort of structure, so lets keep it all
+        head = heads[0]
+        for extra_head in heads[1:]:
+            head.extend(extra_head)
+            # We don't care about text or tail in a head
+            extra_head.drop_tree()
+        return doc
+    if body is None:
+        return doc
+
+    if len(body) == 1:
+        only_child = body[0]
+        has_leading_text = body.text and body.text.strip()
+        has_trailing_text = only_child.tail and only_child.tail.strip()
+        if not has_leading_text and not has_trailing_text:
+            # The body has just one element, so it was probably a single
+            # element passed in
+            return only_child
+
+    # Now we have a body which represents a bunch of tags which have the
+    # content that was passed in.  We will create a fake container, which
+    # is the body tag, except <body> implies too much structure.
+    if _contains_block_level_tag(body):
+        container_tag = 'div'
+    else:
+        container_tag = 'span'
+    body.tag = container_tag
+    return body
+
+def parse(filename_or_url, parser=None, base_url=None, **kw):
+    """
+    Parse a filename, URL, or file-like object into an HTML document
+    tree.  The result is a tree, not an element; call
+    ``parse(...).getroot()`` to obtain the document root.
+
+    The ``base_url`` keyword overrides the base URL, which is mostly
+    useful when parsing from a file-like object.  ``html_parser`` is used
+    unless another ``parser`` is supplied.
+    """
+    chosen_parser = parser
+    if chosen_parser is None:
+        chosen_parser = html_parser
+    return etree.parse(filename_or_url, chosen_parser, base_url=base_url, **kw)
+
+def _contains_block_level_tag(el):
+    """Tell whether any element yielded by ``el.iter()`` is a block-level tag."""
+    # FIXME: I could do this with XPath, but would that just be
+    # unnecessarily slow?
+    return any(
+        _nons(node.tag) in defs.block_tags
+        for node in el.iter(etree.Element))
+
+def _element_name(el):
+    """Return a short label for ``el``, for use in error messages."""
+    if isinstance(el, etree.CommentBase):
+        return 'comment'
+    if isinstance(el, basestring):
+        return 'string'
+    # A regular element: its tag name without the namespace part.
+    return _nons(el.tag)
+
+################################################################################
+# form handling
+################################################################################
+
+class FormElement(HtmlElement):
+    """
+    Represents a <form> element.
+    """
+
+    @property
+    def inputs(self):
+        """
+        Returns an accessor for all the input elements in the form.
+
+        See `InputGetter` for more information about the object.
+        """
+        return InputGetter(self)
+
+    def _fields__get(self):
+        """
+        Dictionary-like object that represents all the fields in this
+        form.  Setting values in this dictionary changes the form.
+        """
+        return FieldsDict(self.inputs)
+    def _fields__set(self, value):
+        # Assign every given field, then reset each previously known field
+        # that was not mentioned.
+        leftover = self.fields.keys()
+        for field_name, field_value in value.items():
+            if field_name in leftover:
+                leftover.remove(field_name)
+            self.fields[field_name] = field_value
+        for field_name in leftover:
+            # Unnamed inputs aren't really expressed in form_values()
+            # anyway, so they are left alone.
+            if field_name is not None:
+                self.fields[field_name] = None
+
+    fields = property(_fields__get, _fields__set, doc=_fields__get.__doc__)
+
+    def _name(self):
+        # Label used in reprs: the name attribute, else '#' plus the id,
+        # else the index of this form among the forms found in the body.
+        name = self.get('name')
+        if name:
+            return name
+        ident = self.get('id')
+        if ident:
+            return '#' + ident
+        forms = list(self.body.iter('form'))
+        if not forms:
+            forms = list(self.body.iter('{%s}form' % XHTML_NAMESPACE))
+        return str(forms.index(self))
+
+    def form_values(self):
+        """
+        Return a list of ``(name, value)`` tuples of the field values
+        for the form.  This is suitable to be passed to
+        ``urllib.urlencode()``.
+        """
+        pairs = []
+        for field in self.inputs:
+            name = field.name
+            if not name:
+                continue
+            tag = _nons(field.tag)
+            if tag == 'textarea':
+                pairs.append((name, field.value))
+                continue
+            if tag == 'select':
+                value = field.value
+                if field.multiple:
+                    # One pair per selected option.
+                    pairs.extend([(name, v) for v in value])
+                elif value is not None:
+                    pairs.append((name, value))
+                continue
+            assert tag == 'input', (
+                "Unexpected tag: %r" % field)
+            if field.checkable and not field.checked:
+                continue
+            if field.type in ('submit', 'image', 'reset'):
+                continue
+            value = field.value
+            if value is not None:
+                pairs.append((name, value))
+        return pairs
+
+    def _action__get(self):
+        """
+        Get/set the form's ``action`` attribute.
+        """
+        base_url = self.base_url
+        action = self.get('action')
+        if not base_url or action is None:
+            return action
+        # Resolve the action against the base URL.
+        return urljoin(base_url, action)
+    def _action__set(self, value):
+        self.set('action', value)
+    def _action__del(self):
+        attributes = self.attrib
+        if 'action' in attributes:
+            del attributes['action']
+    action = property(_action__get, _action__set, _action__del, doc=_action__get.__doc__)
+
+    def _method__get(self):
+        """
+        Get/set the form's method.  Always returns an upper-cased
+        string, and defaults to ``'GET'``
+        """
+        method = self.get('method', 'GET')
+        return method.upper()
+    def _method__set(self, value):
+        self.set('method', value.upper())
+    method = property(_method__get, _method__set, doc=_method__get.__doc__)
+
+HtmlElementClassLookup._default_element_classes['form'] = FormElement
+
+def submit_form(form, extra_values=None, open_http=None):
+    """
+    Helper function to submit a form.  With the default opener this
+    returns the file-like object produced by ``urlopen()``.
+
+    You can use this like::
+
+        form = doc.forms[0]
+        form.inputs['foo'].value = 'bar' # etc
+        response = submit_form(form)
+        doc = parse(response)
+        doc.make_links_absolute(response.geturl())
+
+    ``extra_values`` may be a mapping or a sequence of ``(name, value)``
+    tuples; its entries are appended to the values taken from the form.
+
+    To change the HTTP requester, pass a function as ``open_http`` keyword
+    argument that opens the URL for you.  The function must have the following
+    signature::
+
+        open_http(method, URL, values)
+
+    The method is the form's ``method`` property, the URL is the form's
+    action (or its base URL when the action is empty) and the values are
+    a sequence of ``(name, value)`` tuples with the form data.
+    """
+    values = form.form_values()
+    if extra_values:
+        extras = extra_values
+        if hasattr(extras, 'items'):
+            extras = extras.items()
+        values.extend(extras)
+    opener = open_http
+    if opener is None:
+        opener = open_http_urllib
+    # Fall back to the document's own URL when the form has no action.
+    url = form.action or form.base_url
+    return opener(form.method, url, values)
+
+def open_http_urllib(method, url, values):
+    """
+    Default opener for ``submit_form()``, based on the standard library.
+
+    For ``'GET'`` the url-encoded ``values`` are appended to ``url`` as a
+    query string; for any other method they are sent as the request body.
+    Returns whatever ``urlopen()`` returns.  Raises ``ValueError`` if
+    ``url`` is empty.
+    """
+    if not url:
+        raise ValueError("cannot submit, no URL provided")
+    ## FIXME: should test that it's not a relative URL or something
+    try:
+        from urllib import urlencode, urlopen
+    except ImportError: # Python 3
+        from urllib.request import urlopen
+        from urllib.parse import urlencode
+    if method == 'GET':
+        if '?' in url:
+            url += '&'
+        else:
+            url += '?'
+        url += urlencode(values)
+        data = None
+    else:
+        data = urlencode(values)
+        # Python 3's urlopen() only accepts bytes as the request body,
+        # while urlencode() returns text there.  The encoded form is pure
+        # ASCII, and on Python 2 it is already a byte string.
+        if not isinstance(data, bytes):
+            data = data.encode('ascii')
+    return urlopen(url, data)
+
+class FieldsDict(DictMixin):
+    """
+    Dictionary-style view of a form's field values, backed by the
+    inputs accessor it is given.  Keys cannot be deleted.
+    """
+
+    def __init__(self, inputs):
+        self.inputs = inputs
+    def __getitem__(self, item):
+        field = self.inputs[item]
+        return field.value
+    def __setitem__(self, item, value):
+        field = self.inputs[item]
+        field.value = value
+    def __delitem__(self, item):
+        raise KeyError(
+            "You cannot remove keys from ElementDict")
+    def keys(self):
+        return self.inputs.keys()
+    def __contains__(self, item):
+        return item in self.inputs
+    def __iter__(self):
+        names = self.inputs.keys()
+        return iter(names)
+    def __len__(self):
+        return len(self.inputs)
+
+    def __repr__(self):
+        class_name = self.__class__.__name__
+        form_label = self.inputs.form._name()
+        return '<%s for form %s>' % (class_name, form_label)
+
+class InputGetter(object):
+
+    """
+    An accessor that represents all the input fields in a form.
+
+    Fields are fetched by name with ``form.inputs['field_name']``.
+    Several checkboxes sharing a name come back as a list (a
+    `CheckboxGroup`, which also allows value setting); radio inputs
+    sharing a name are handled the same way with a `RadioGroup`.
+
+    Iterating yields every input element.  That is not the same as
+    looking up every name, since checkboxes and radio elements are
+    yielded individually.
+    """
+
+    _name_xpath = etree.XPath(".//*[@name = $name and (local-name(.) = 'select' or local-name(.) = 'input' or local-name(.) = 'textarea')]")
+    _all_xpath = etree.XPath(".//*[local-name() = 'select' or local-name() = 'input' or local-name() = 'textarea']")
+
+    def __init__(self, form):
+        self.form = form
+
+    def __repr__(self):
+        class_name = self.__class__.__name__
+        return '<%s for form %s>' % (class_name, self.form._name())
+
+    ## FIXME: there should be more methods, and it's unclear if this is
+    ## a dictionary-like object or list-like object
+
+    def __getitem__(self, name):
+        matches = self._name_xpath(self.form, name=name)
+        if not matches:
+            raise KeyError(
+                "No input element with the name %r" % name)
+        first = matches[0]
+        if len(matches) > 1:
+            # The first match's type decides whether the matches are
+            # handed out as a group.
+            input_type = first.get('type')
+            group = None
+            if input_type == 'radio':
+                group = RadioGroup(matches)
+            elif input_type == 'checkbox':
+                group = CheckboxGroup(matches)
+            if group is not None:
+                group.name = name
+                return group
+        # I don't like throwing away elements like this
+        return first
+
+    def __contains__(self, name):
+        return bool(self._name_xpath(self.form, name=name))
+
+    def keys(self):
+        # Distinct names of all inputs; unnamed inputs are left out.
+        names = set([el.name for el in self])
+        names.discard(None)
+        return list(names)
+
+    def __iter__(self):
+        ## FIXME: kind of dumb to turn a list into an iterator, only
+        ## to have it likely turned back into a list again :(
+        every_input = self._all_xpath(self.form)
+        return iter(every_input)
+
+class InputMixin(object):
+
+    """
+    Mix-in for all input elements (input, select, and textarea)
+    """
+
+
+    def _name__get(self):
+        """
+        Get/set the name of the element
+        """
+        return self.get('name')
+    def _name__set(self, value):
+        self.set('name', value)
+    def _name__del(self):
+        # Deleting a name that is not set is silently accepted.
+        attributes = self.attrib
+        if 'name' in attributes:
+            del attributes['name']
+    name = property(_name__get, _name__set, _name__del, doc=_name__get.__doc__)
+
+    def __repr__(self):
+        # Only some input classes define .type; mention it when it is set.
+        input_type = getattr(self, 'type', None)
+        type_part = ''
+        if input_type:
+            type_part = ' type=%r' % input_type
+        class_name = self.__class__.__name__
+        return '<%s %x name=%r%s>' % (
+            class_name, id(self), self.name, type_part)
+
+class TextareaElement(InputMixin, HtmlElement):
+    """
+    ``<textarea>`` element.  The name is available as ``.name`` and the
+    value can be read and written through ``.value``
+    """
+
+    def _value__get(self):
+        """
+        Get/set the value (which is the contents of this element)
+        """
+        # Elements in the XHTML namespace are serialised as XML, all
+        # others as HTML.
+        if self.tag.startswith("{%s}" % XHTML_NAMESPACE):
+            how = 'xml'
+        else:
+            how = 'html'
+        value = self.text or ''
+        # it's rare that there are child elements, so let's not use ''.join()
+        for child in self:
+            value += etree.tostring(child, method=how, encoding='unicode')
+        return value
+    def _value__set(self, value):
+        # Drop any child elements, then store the value as plain text.
+        del self[:]
+        self.text = value
+    def _value__del(self):
+        self.text = ''
+        del self[:]
+    value = property(_value__get, _value__set, _value__del, doc=_value__get.__doc__)
+
+HtmlElementClassLookup._default_element_classes['textarea'] = TextareaElement
+
+class SelectElement(InputMixin, HtmlElement):
+    """
+    ``<select>`` element.  The name is available as ``.name``.
+
+    ``.value`` is the value of the selected option, unless this is a
+    multi-select element (``<select multiple>``), in which case it is a
+    set-like object.  In either case ``.value_options`` gives the
+    possible values.
+
+    The boolean attribute ``.multiple`` shows if this is a
+    multi-select.
+    """
+
+    def _value__get(self):
+        """
+        Get/set the value of this select (the selected option).
+
+        If this is a multi-select, this is a set-like object that
+        represents all the selected options.
+        """
+        if self.multiple:
+            return MultipleSelectOptions(self)
+        for option in _options_xpath(self):
+            if option.get('selected') is None:
+                continue
+            # An option without a value attribute counts with its text.
+            found = option.get('value')
+            if found is None:
+                found = option.text or ''
+            if found:
+                found = found.strip()
+            return found
+        return None
+
+    def _value__set(self, value):
+        if self.multiple:
+            if isinstance(value, basestring):
+                raise TypeError(
+                    "You must pass in a sequence")
+            selection = self.value
+            selection.clear()
+            self.value.update(value)
+            return
+        target = None
+        if value is not None:
+            # Find the option to select before changing anything, so an
+            # unknown value leaves the current selection untouched.
+            value = value.strip()
+            for option in _options_xpath(self):
+                candidate = option.get('value')
+                if candidate is None:
+                    candidate = option.text or ''
+                if candidate:
+                    candidate = candidate.strip()
+                if candidate == value:
+                    target = option
+                    break
+            else:
+                raise ValueError(
+                    "There is no option with the value of %r" % value)
+        for option in _options_xpath(self):
+            attributes = option.attrib
+            if 'selected' in attributes:
+                del attributes['selected']
+        if target is not None:
+            target.set('selected', '')
+
+    def _value__del(self):
+        # FIXME: should del be allowed at all?
+        if not self.multiple:
+            self.value = None
+        else:
+            self.value.clear()
+
+    value = property(_value__get, _value__set, _value__del, doc=_value__get.__doc__)
+
+    @property
+    def value_options(self):
+        """
+        All the possible values this select can have (the ``value``
+        attribute of all the ``<option>`` elements).
+        """
+        possible = []
+        for option in _options_xpath(self):
+            entry = option.get('value')
+            if entry is None:
+                entry = option.text or ''
+            if entry:
+                entry = entry.strip()
+            possible.append(entry)
+        return possible
+
+    def _multiple__get(self):
+        """
+        Boolean attribute: is there a ``multiple`` attribute on this element.
+        """
+        return 'multiple' in self.attrib
+    def _multiple__set(self, value):
+        if value:
+            self.set('multiple', '')
+            return
+        attributes = self.attrib
+        if 'multiple' in attributes:
+            del attributes['multiple']
+    multiple = property(_multiple__get, _multiple__set, doc=_multiple__get.__doc__)
+
+HtmlElementClassLookup._default_element_classes['select'] = SelectElement
+
+class MultipleSelectOptions(SetMixin):
+    """
+    Represents all the selected options in a ``<select multiple>`` element.
+
+    You can add to this set-like object to select an option, or remove
+    to unselect the option.
+    """
+
+    def __init__(self, select):
+        self.select = select
+
+    def options(self):
+        """
+        Iterator of all the ``<option>`` elements.
+        """
+        return iter(_options_xpath(self.select))
+    options = property(options)
+
+    def _option_value(option):
+        # The value an option stands for: its ``value`` attribute, or its
+        # text when that attribute is absent; whitespace is stripped.
+        opt_value = option.get('value')
+        if opt_value is None:
+            opt_value = option.text or ''
+        if opt_value:
+            opt_value = opt_value.strip()
+        return opt_value
+    _option_value = staticmethod(_option_value)
+
+    def __iter__(self):
+        """Yield the value of every currently selected option."""
+        for option in self.options:
+            if 'selected' in option.attrib:
+                yield self._option_value(option)
+
+    def add(self, item):
+        """
+        Select the first option whose value is ``item``.
+
+        Raises ``ValueError`` if there is no such option.
+        """
+        for option in self.options:
+            if self._option_value(option) == item:
+                option.set('selected', '')
+                break
+        else:
+            raise ValueError(
+                "There is no option with the value %r" % item)
+
+    def remove(self, item):
+        """
+        Unselect the first option whose value is ``item``.
+
+        Raises ``ValueError`` if there is no such option or if it is not
+        currently selected.
+        """
+        for option in self.options:
+            if self._option_value(option) == item:
+                if 'selected' in option.attrib:
+                    del option.attrib['selected']
+                else:
+                    raise ValueError(
+                        "The option %r is not currently selected" % item)
+                break
+        else:
+            raise ValueError(
+                "There is no option with the value %r" % item)
+
+    def __repr__(self):
+        return '<%s {%s} for select name=%r>' % (
+            self.__class__.__name__,
+            ', '.join([repr(v) for v in self]),
+            self.select.name)
+
+class RadioGroup(list):
+    """
+    This object represents several ``<input type=radio>`` elements
+    that have the same name.
+
+    It behaves like a list, and in addition the ``.value`` property
+    checks/unchecks inputs while ``.value_options`` lists the possible
+    values.
+    """
+
+    def _value__get(self):
+        """
+        Get/set the value, which checks the radio with that value (and
+        unchecks any other value).
+        """
+        for radio in self:
+            if 'checked' not in radio.attrib:
+                continue
+            return radio.get('value')
+        return None
+
+    def _value__set(self, value):
+        target = None
+        if value is not None:
+            # Find the radio to check before changing anything, so an
+            # unknown value leaves the group untouched.
+            for radio in self:
+                if radio.get('value') == value:
+                    target = radio
+                    break
+            else:
+                raise ValueError(
+                    "There is no radio input with the value %r" % value)
+        for radio in self:
+            attributes = radio.attrib
+            if 'checked' in attributes:
+                del attributes['checked']
+        if target is not None:
+            target.set('checked', '')
+
+    def _value__del(self):
+        self.value = None
+
+    value = property(_value__get, _value__set, _value__del, doc=_value__get.__doc__)
+
+    @property
+    def value_options(self):
+        """
+        Returns a list of all the possible values.
+        """
+        possible = []
+        for radio in self:
+            possible.append(radio.get('value'))
+        return possible
+
+    def __repr__(self):
+        class_name = self.__class__.__name__
+        return '%s(%s)' % (class_name, list.__repr__(self))
+
+class CheckboxGroup(list):
+    """
+    Represents a group of checkboxes (``<input type=checkbox>``) that
+    have the same name.
+
+    In addition to using this like a list, the ``.value`` attribute
+    returns a set-like object that you can add to or remove from to
+    check and uncheck checkboxes.  You can also use ``.value_options``
+    to get the possible values.
+    """
+
+    def _value__get(self):
+        """
+        Return a set-like object that can be modified to check or
+        uncheck individual checkboxes according to their value.
+
+        Assigning replaces the checked set with the values of the given
+        sequence; a string or a non-iterable raises ``ValueError``.
+        """
+        return CheckboxValues(self)
+    def _value__set(self, value):
+        # Validate before touching any checkbox, so that a rejected value
+        # does not leave the whole group unchecked.  Strings are refused
+        # explicitly: they are iterable on Python 3 and would otherwise be
+        # taken apart character by character.
+        if not hasattr(value, '__iter__') or isinstance(value, basestring):
+            raise ValueError(
+                "A CheckboxGroup (name=%r) must be set to a sequence (not %r)"
+                % (self[0].name, value))
+        self.value.clear()
+        self.value.update(value)
+    def _value__del(self):
+        self.value.clear()
+    value = property(_value__get, _value__set, _value__del, doc=_value__get.__doc__)
+
+    def value_options(self):
+        """
+        Returns a list of all the possible values.
+        """
+        return [el.get('value') for el in self]
+    value_options = property(value_options, doc=value_options.__doc__)
+
+    def __repr__(self):
+        return '%s(%s)' % (
+            self.__class__.__name__, list.__repr__(self))
+
+class CheckboxValues(SetMixin):
+
+    """
+    Set-like view of the values of the checked checkboxes in a group
+    of checkboxes with the same name.
+    """
+
+    def __init__(self, group):
+        self.group = group
+
+    def __iter__(self):
+        checked_values = []
+        for box in self.group:
+            if 'checked' in box.attrib:
+                checked_values.append(box.get('value'))
+        return iter(checked_values)
+
+    def add(self, value):
+        # Check the first checkbox carrying this value.
+        for box in self.group:
+            if box.get('value') != value:
+                continue
+            box.set('checked', '')
+            break
+        else:
+            raise KeyError("No checkbox with value %r" % value)
+
+    def remove(self, value):
+        # Uncheck the first checkbox carrying this value; it is an error
+        # if that checkbox is not checked.
+        for box in self.group:
+            if box.get('value') != value:
+                continue
+            if 'checked' not in box.attrib:
+                raise KeyError(
+                    "The checkbox with value %r was already unchecked" % value)
+            del box.attrib['checked']
+            break
+        else:
+            raise KeyError(
+                "No checkbox with value %r" % value)
+
+    def __repr__(self):
+        shown = ', '.join([repr(v) for v in self])
+        return '<%s {%s} for checkboxes name=%r>' % (
+            self.__class__.__name__,
+            shown,
+            self.group.name)
+
+class InputElement(InputMixin, HtmlElement):
+    """
+    Represents an ``<input>`` element.
+
+    The type is available as ``.type`` (lower-cased, defaulting to
+    ``'text'``), and the value can be read and written through
+    ``.value``
+
+    Checkboxes and radios have ``input.checkable == True`` (for all
+    others it is false) and a boolean attribute ``.checked``.
+
+    """
+
+    ## FIXME: I'm a little uncomfortable with the use of .checked
+    def _value__get(self):
+        """
+        Get/set the value of this element, using the ``value`` attribute.
+
+        A checked checkbox or radio without a value reports ``'on'``;
+        one that is not checked reports None.
+        """
+        if not self.checkable:
+            return self.get('value')
+        if self.checked:
+            return self.get('value') or 'on'
+        return None
+    def _value__set(self, value):
+        if not self.checkable:
+            self.set('value', value)
+            return
+        # For checkable inputs the truth of the value drives the checked
+        # state; a non-empty string also becomes the value attribute.
+        if value:
+            self.checked = True
+            if isinstance(value, basestring):
+                self.set('value', value)
+        else:
+            self.checked = False
+    def _value__del(self):
+        if self.checkable:
+            self.checked = False
+            return
+        attributes = self.attrib
+        if 'value' in attributes:
+            del attributes['value']
+    value = property(_value__get, _value__set, _value__del, doc=_value__get.__doc__)
+
+    def _type__get(self):
+        """
+        Return the type of this element (using the type attribute).
+        """
+        declared = self.get('type', 'text')
+        return declared.lower()
+    def _type__set(self, value):
+        self.set('type', value)
+    type = property(_type__get, _type__set, doc=_type__get.__doc__)
+
+    @property
+    def checkable(self):
+        """
+        Boolean: can this element be checked?
+        """
+        return self.type in ('checkbox', 'radio')
+
+    def _checked__get(self):
+        """
+        Boolean attribute to get/set the presence of the ``checked``
+        attribute.
+
+        You can only use this on checkable input types.
+        """
+        if not self.checkable:
+            raise AttributeError('Not a checkable input type')
+        return 'checked' in self.attrib
+    def _checked__set(self, value):
+        if not self.checkable:
+            raise AttributeError('Not a checkable input type')
+        if value:
+            self.set('checked', '')
+            return
+        attributes = self.attrib
+        if 'checked' in attributes:
+            del attributes['checked']
+    checked = property(_checked__get, _checked__set, doc=_checked__get.__doc__)
+
+HtmlElementClassLookup._default_element_classes['input'] = InputElement
+
+class LabelElement(HtmlElement):
+    """
+    Represents a ``<label>`` element.
+
+    Label elements are linked to other elements with their ``for``
+    attribute.  You can access this element with ``label.for_element``.
+    """
+
+    def _for_element__get(self):
+        """
+        Get/set/delete the element this label points to through its
+        ``for`` attribute.
+
+        Getting returns None when the label has no (or an empty)
+        ``for`` attribute; otherwise the id is looked up with
+        ``self.body.get_element_by_id()``.  Setting stores the ``id``
+        of the given element in ``for`` and raises TypeError if that
+        element has no ``id``.  Deleting removes the ``for`` attribute.
+        """
+        target_id = self.get('for')
+        if not target_id:
+            return None
+        # NOTE(review): what happens for an id that matches no element is
+        # decided by get_element_by_id() -- confirm against its definition
+        return self.body.get_element_by_id(target_id)
+
+    def _for_element__set(self, other):
+        target_id = other.get('id')
+        if not target_id:
+            raise TypeError(
+                "Element %r has no id attribute" % other)
+        self.set('for', target_id)
+
+    def _for_element__del(self):
+        # The link is stored in ``for`` (see getter and setter); the
+        # label's own ``id`` attribute must not be touched here.
+        if 'for' in self.attrib:
+            del self.attrib['for']
+
+    for_element = property(_for_element__get, _for_element__set, _for_element__del,
+                           doc=_for_element__get.__doc__)
+
+HtmlElementClassLookup._default_element_classes['label'] = LabelElement
+
+############################################################
+## Serialization
+############################################################
+
+def html_to_xhtml(html):
+    """Convert all tags in an HTML tree to XHTML by moving them to the
+    XHTML namespace.
+
+    ``html`` may be an element or anything with a ``getroot()`` method
+    (in which case the root is used).  The tree is modified in place;
+    tags that already start with ``{`` are left alone.
+    """
+    try:
+        root = html.getroot()
+    except AttributeError:
+        # no getroot(): work on the object that was passed in
+        root = html
+    namespace_prefix = "{%s}" % XHTML_NAMESPACE
+    for node in root.iter(etree.Element):
+        if node.tag[0] != '{':
+            node.tag = namespace_prefix + node.tag
+
+def xhtml_to_html(xhtml):
+    """Convert all tags in an XHTML tree to HTML by removing their
+    XHTML namespace.
+
+    ``xhtml`` may be an element or anything with a ``getroot()``
+    method (in which case the root is used).  The tree is modified in
+    place; only tags in the XHTML namespace are visited.
+    """
+    try:
+        root = xhtml.getroot()
+    except AttributeError:
+        # no getroot(): work on the object that was passed in
+        root = xhtml
+    namespace_prefix = "{%s}" % XHTML_NAMESPACE
+    strip_count = len(namespace_prefix)
+    for node in root.iter(namespace_prefix + "*"):
+        node.tag = node.tag[strip_count:]
+
+# This isn't a general match, but it's a match for what libxml2
+# specifically serialises.
+# Both names are the bound ``sub`` methods of a compiled pattern, called
+# as ``name(replacement, text)``: one pattern is built from a text
+# string, the other from the same pattern encoded to ASCII bytes, so
+# tostring() can strip the tag from either kind of serialised output.
+__str_replace_meta_content_type = re.compile(
+    r'<meta http-equiv="Content-Type"[^>]*>').sub
+__bytes_replace_meta_content_type = re.compile(
+    r'<meta http-equiv="Content-Type"[^>]*>'.encode('ASCII')).sub
+
+def tostring(doc, pretty_print=False, include_meta_content_type=False,
+             encoding=None, method="html", with_tail=True, doctype=None):
+    """Return an HTML string representation of the document.
+
+    Note: if include_meta_content_type is true this will create a
+    ``<meta http-equiv="Content-Type" ...>`` tag in the head;
+    regardless of the value of include_meta_content_type any existing
+    ``<meta http-equiv="Content-Type" ...>`` tag will be removed
+
+    The ``encoding`` argument controls the output encoding (defaults to
+    ASCII, with &#...; character references for any characters outside
+    of ASCII).  Note that you can pass the name ``'unicode'`` as
+    ``encoding`` argument to serialise to a Unicode string.
+
+    The ``method`` argument defines the output method.  It defaults to
+    'html', but can also be 'xml' for xhtml output, or 'text' to
+    serialise to plain text without markup.
+
+    To leave out the tail text of the top-level element that is being
+    serialised, pass ``with_tail=False``.
+
+    The ``doctype`` option allows passing in a plain string that will
+    be serialised before the XML tree.  Note that passing in non
+    well-formed content here will make the XML output non well-formed.
+    Also, an existing doctype in the document tree will not be removed
+    when serialising an ElementTree instance.
+
+    Example::
+
+        >>> from lxml import html
+        >>> root = html.fragment_fromstring('<p>Hello<br>world!</p>')
+
+        >>> html.tostring(root)
+        b'<p>Hello<br>world!</p>'
+        >>> html.tostring(root, method='html')
+        b'<p>Hello<br>world!</p>'
+
+        >>> html.tostring(root, method='xml')
+        b'<p>Hello<br/>world!</p>'
+
+        >>> html.tostring(root, method='text')
+        b'Helloworld!'
+
+        >>> html.tostring(root, method='text', encoding='unicode')
+        u'Helloworld!'
+
+        >>> root = html.fragment_fromstring('<div><p>Hello<br>world!</p>TAIL</div>')
+        >>> html.tostring(root[0], method='text', encoding='unicode')
+        u'Helloworld!TAIL'
+
+        >>> html.tostring(root[0], method='text', encoding='unicode', with_tail=False)
+        u'Helloworld!'
+
+        >>> doc = html.document_fromstring('<p>Hello<br>world!</p>')
+        >>> html.tostring(doc, method='html', encoding='unicode')
+        u'<html><body><p>Hello<br>world!</p></body></html>'
+
+        >>> print(html.tostring(doc, method='html', encoding='unicode',
+        ...          doctype='<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN"'
+        ...                  ' "http://www.w3.org/TR/html4/strict.dtd">'))
+        <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN" "http://www.w3.org/TR/html4/strict.dtd">
+        <html><body><p>Hello<br>world!</p></body></html>
+    """
+    serialised = etree.tostring(doc, method=method, pretty_print=pretty_print,
+                                encoding=encoding, with_tail=with_tail,
+                                doctype=doctype)
+    if method != 'html' or include_meta_content_type:
+        return serialised
+    # HTML output without a requested Content-Type tag: strip the tag,
+    # using the helper that matches the type of the serialised result.
+    if isinstance(serialised, str):
+        return __str_replace_meta_content_type('', serialised)
+    return __bytes_replace_meta_content_type(bytes(), serialised)
+
+tostring.__doc__ = __fix_docstring(tostring.__doc__)
+
+def open_in_browser(doc, encoding=None):
+    """
+    Write the HTML document to a temporary ``.html`` file and open
+    that file in a web browser.  The temporary file is not deleted
+    afterwards.  This is mainly meant for debugging.
+
+    The file is written with ``encoding`` if given, else with the
+    document's own encoding, else as UTF-8.  The ``file://`` URL is
+    also printed.
+    """
+    import os
+    import tempfile
+    import webbrowser
+    if isinstance(doc, etree._ElementTree):
+        tree = doc
+    else:
+        tree = etree.ElementTree(doc)
+    descriptor, path = tempfile.mkstemp(suffix='.html')
+    out = os.fdopen(descriptor, 'wb')
+    try:
+        tree.write(out, method="html", encoding=encoding or tree.docinfo.encoding or "UTF-8")
+    finally:
+        # we leak the file itself here, but we should at least close it
+        out.close()
+    url = 'file://' + path.replace(os.path.sep, '/')
+    print(url)
+    webbrowser.open(url)
+
+################################################################################
+# configure Element class lookup
+################################################################################
+
+class HTMLParser(etree.HTMLParser):
+    """An HTML parser that is configured to return lxml.html Element
+    objects.
+
+    Keyword arguments are passed on unchanged to ``etree.HTMLParser``.
+    """
+    def __init__(self, **kwargs):
+        super(HTMLParser, self).__init__(**kwargs)
+        # each parser instance gets a lookup object of its own
+        lookup = HtmlElementClassLookup()
+        self.set_element_class_lookup(lookup)
+
+class XHTMLParser(etree.XMLParser):
+    """An XML parser that is configured to return lxml.html Element
+    objects.
+
+    Keyword arguments are passed on unchanged to ``etree.XMLParser``.
+
+    Note that this parser is not really XHTML aware unless you let it
+    load a DTD that declares the HTML entities.  To do this, make sure
+    you have the XHTML DTDs installed in your catalogs, and create the
+    parser like this::
+
+        >>> parser = XHTMLParser(load_dtd=True)
+
+    If you additionally want to validate the document, use this::
+
+        >>> parser = XHTMLParser(dtd_validation=True)
+
+    For catalog support, see http://www.xmlsoft.org/catalog.html.
+    """
+    def __init__(self, **kwargs):
+        super(XHTMLParser, self).__init__(**kwargs)
+        # each parser instance gets a lookup object of its own
+        lookup = HtmlElementClassLookup()
+        self.set_element_class_lookup(lookup)
+
+def Element(*args, **kw):
+    """Create a new HTML Element.
+
+    This can also be used for XHTML documents.
+
+    All arguments are forwarded to ``html_parser.makeelement()``.
+    """
+    return html_parser.makeelement(*args, **kw)
+
+# Module-level default parser instances; Element() above uses html_parser.
+html_parser = HTMLParser()
+xhtml_parser = XHTMLParser()
diff --git a/lib/lxml/html/_diffcommand.py b/lib/lxml/html/_diffcommand.py
new file mode 100644
index 00000000..bcf5a4b0
--- /dev/null
+++ b/lib/lxml/html/_diffcommand.py
@@ -0,0 +1,87 @@
+import optparse
+import sys
+import re
+import os
+from lxml.html.diff import htmldiff
+
+description = """\
+"""
+
+# Command line definition for the HTML diff tool.  The usage text names
+# the annotation switch exactly as it is registered below
+# (``--annotation``); ``--annotate`` is not a prefix of it, so optparse
+# would reject that spelling.
+parser = optparse.OptionParser(
+    usage="%prog [OPTIONS] FILE1 FILE2\n"
+    "%prog --annotation [OPTIONS] INFO1 FILE1 INFO2 FILE2 ...",
+    description=description,
+    )
+
+# Where the result goes; the default "-" makes main() write to stdout.
+parser.add_option(
+    '-o', '--output',
+    metavar="FILE",
+    dest="output",
+    default="-",
+    help="File to write the difference to",
+    )
+
+# Switches main() over to annotate().
+parser.add_option(
+    '-a', '--annotation',
+    action="store_true",
+    dest="annotation",
+    help="Do an annotation")
+
+def main(args=None):
+    """
+    Command line entry point: diff the bodies of two HTML files.
+
+    ``args`` defaults to ``sys.argv[1:]``.  With the annotation option
+    set, the work is handed to ``annotate()``.  Otherwise exactly two
+    file names are required (a message and the help text are printed
+    and the process exits with status 1 if not).
+
+    Only the body parts of both inputs are compared with ``htmldiff``;
+    the text before and after the body is taken from the second file
+    and wrapped around the result.  The result is written to stdout
+    (with a trailing newline added if missing) when the output option
+    is ``-``, else to the named file opened in binary mode.
+    """
+    if args is None:
+        args = sys.argv[1:]
+    options, args = parser.parse_args(args)
+    if options.annotation:
+        return annotate(options, args)
+    if len(args) != 2:
+        print('Error: you must give two files')
+        parser.print_help()
+        sys.exit(1)
+    file1, file2 = args
+    input1 = read_file(file1)
+    input2 = read_file(file2)
+    body1 = split_body(input1)[1]
+    pre, body2, post = split_body(input2)
+    result = htmldiff(body1, body2)
+    result = pre + result + post
+    if options.output == '-':
+        if not result.endswith('\n'):
+            result += '\n'
+        sys.stdout.write(result)
+    else:
+        f = open(options.output, 'wb')
+        try:
+            f.write(result)
+        finally:
+            # release the handle even when writing fails
+            f.close()
+
+def read_file(filename):
+    """
+    Return the complete content of ``filename``.
+
+    The name ``-`` reads from ``sys.stdin``; any other name is opened
+    in binary mode.  Raises OSError if the named file does not exist.
+    """
+    if filename == '-':
+        return sys.stdin.read()
+    if not os.path.exists(filename):
+        raise OSError(
+            "Input file %s does not exist" % filename)
+    f = open(filename, 'rb')
+    try:
+        return f.read()
+    finally:
+        # release the handle even when reading fails
+        f.close()
+
+# Opening and closing body tags, matched case-insensitively; re.S lets
+# the lazy ``.*?`` run across line breaks inside the tag.
+body_start_re = re.compile(
+    r"<body.*?>", re.I|re.S)
+body_end_re = re.compile(
+    r"</body.*?>", re.I|re.S)
+
+def split_body(html):
+    """
+    Split ``html`` into ``(pre, body, post)``.
+
+    ``pre`` is everything up to and including the first opening body
+    tag, ``post`` is everything from the first closing body tag that
+    follows, and ``body`` is what lies between.  When a tag is missing
+    the corresponding part is empty, so a bare fragment comes back as
+    ``('', fragment, '')``.
+    """
+    # html[:0] is an empty value of the same type as the input
+    pre = post = html[:0]
+    match = body_start_re.search(html)
+    if match:
+        pre = html[:match.end()]
+        html = html[match.end():]
+    match = body_end_re.search(html)
+    if match:
+        post = html[match.start():]
+        html = html[:match.start()]
+    return pre, html, post
+
+def annotate(options, args):
+    """
+    Placeholder for the annotation mode: prints a notice and exits
+    with status 1.  Both arguments are ignored.
+    """
+    print("Not yet implemented")
+    raise SystemExit(1)
+    
diff --git a/lib/lxml/html/_html5builder.py b/lib/lxml/html/_html5builder.py
new file mode 100644
index 00000000..3405c201
--- /dev/null
+++ b/lib/lxml/html/_html5builder.py
@@ -0,0 +1,100 @@
+"""
+Legacy module - don't use in new code!
+
+html5lib now has its own proper implementation.
+
+This module implements a tree builder for html5lib that generates lxml
+html element trees.  This module uses camelCase as it follows the
+html5lib style guide.
+"""
+
+from html5lib.treebuilders import _base, etree as etree_builders
+from lxml import html, etree
+
+
+class DocumentType(object):
+    """
+    Plain record of a doctype: its name, public id and system id.
+    """
+
+    def __init__(self, name, publicId, systemId):
+        self.name, self.publicId, self.systemId = name, publicId, systemId
+
+class Document(object):
+    """
+    Document wrapper used by the tree builder: holds the element tree
+    (``_elementTree``, initially None) and a ``childNodes`` list.
+    """
+
+    def __init__(self):
+        self.childNodes = []
+        self._elementTree = None
+
+    def appendChild(self, element):
+        # The new node becomes a following sibling of the tree's root.
+        root = self._elementTree.getroot()
+        root.addnext(element._element)
+
+
+class TreeBuilder(_base.TreeBuilder):
+    """
+    html5lib tree builder that creates lxml.html element trees.
+
+    The doctype and any comments seen before the root element are
+    only buffered; ``insertRoot()`` turns them into the real document.
+    """
+    documentClass = Document
+    doctypeClass = DocumentType
+    elementClass = None
+    commentClass = None
+    fragmentClass = Document
+
+    def __init__(self, *args, **kwargs):
+        # Per-instance element/comment classes replace the None
+        # placeholders declared on the class.
+        html_builder = etree_builders.getETreeModule(html, fullTree=False)
+        etree_builder = etree_builders.getETreeModule(etree, fullTree=False)
+        self.elementClass = html_builder.Element
+        self.commentClass = etree_builder.Comment
+        _base.TreeBuilder.__init__(self, *args, **kwargs)
+
+    def reset(self):
+        """Reset the base builder and clear the pre-root buffers."""
+        _base.TreeBuilder.reset(self)
+        self.rootInserted = False
+        self.initialComments = []
+        self.doctype = None
+
+    def getDocument(self):
+        """Return the element tree stored on the document by insertRoot()."""
+        return self.document._elementTree
+
+    def getFragment(self):
+        """
+        Return the content of the first open element as a list: its
+        text (if any), its child elements, then its tail (if any).
+        """
+        fragment = []
+        element = self.openElements[0]._element
+        if element.text:
+            fragment.append(element.text)
+        # list(element) gives the children; getchildren() is deprecated
+        fragment.extend(list(element))
+        if element.tail:
+            fragment.append(element.tail)
+        return fragment
+
+    def insertDoctype(self, name, publicId, systemId):
+        """Remember the doctype; insertRoot() serialises it later."""
+        doctype = self.doctypeClass(name, publicId, systemId)
+        self.doctype = doctype
+
+    def insertComment(self, data, parent=None):
+        """
+        Buffer comments that arrive before the root element; once the
+        root exists, defer to the base class.
+        """
+        if not self.rootInserted:
+            self.initialComments.append(data)
+        else:
+            _base.TreeBuilder.insertComment(self, data, parent)
+
+    def insertRoot(self, name):
+        """
+        Create the document: parse an ``<html></html>`` stub (preceded
+        by the buffered doctype, if it has a name), put the buffered
+        comments in front of the root, and register the root element
+        as the first child and first open element.
+        """
+        buf = []
+        if self.doctype and self.doctype.name:
+            buf.append('<!DOCTYPE %s' % self.doctype.name)
+            if self.doctype.publicId is not None or self.doctype.systemId is not None:
+                # A missing id is written as an empty string, never as
+                # the literal text "None".
+                buf.append(' PUBLIC "%s" "%s"' % (self.doctype.publicId or '',
+                                                  self.doctype.systemId or ''))
+            buf.append('>')
+        buf.append('<html></html>')
+        root = html.fromstring(''.join(buf))
+
+        # Append the initial comments:
+        for comment in self.initialComments:
+            root.addprevious(etree.Comment(comment))
+
+        # Create the root document and add the ElementTree to it
+        self.document = self.documentClass()
+        self.document._elementTree = root.getroottree()
+
+        # Add the root element to the internal child/open data structures
+        root_element = self.elementClass(name)
+        root_element._element = root
+        self.document.childNodes.append(root_element)
+        self.openElements.append(root_element)
+
+        self.rootInserted = True
diff --git a/lib/lxml/html/_setmixin.py b/lib/lxml/html/_setmixin.py
new file mode 100644
index 00000000..81310ff6
--- /dev/null
+++ b/lib/lxml/html/_setmixin.py
@@ -0,0 +1,115 @@
+class SetMixin(object):
+
+    """
+    Mix-in for sets.  You must define __iter__, add, remove
+
+    Everything else is built on those three.  Methods that return a
+    new collection (``union``, ``|``, ``copy`` ...) return a builtin
+    ``set``; the ``*_update`` methods and in-place operators modify
+    this object through ``add``/``remove``.  The other operand may be
+    any iterable; for the subset/superset tests it must also support
+    ``in``.
+    """
+
+    def __len__(self):
+        return sum(1 for _ in self)
+
+    def __contains__(self, item):
+        for has_item in self:
+            if item == has_item:
+                return True
+        return False
+
+    def issubset(self, other):
+        """True if every item of this set is also in ``other``."""
+        for item in self:
+            if item not in other:
+                return False
+        return True
+
+    __le__ = issubset
+
+    def issuperset(self, other):
+        """True if every item of ``other`` is also in this set."""
+        for item in other:
+            if item not in self:
+                return False
+        return True
+
+    __ge__ = issuperset
+
+    def union(self, other):
+        return self | other
+
+    def __or__(self, other):
+        # The copy's methods accept any iterable, whereas the ``|=``
+        # operator of a builtin set rejects everything but real sets
+        # (including other SetMixin objects).  Same for &, - and ^.
+        new = self.copy()
+        new.update(other)
+        return new
+
+    def intersection(self, other):
+        return self & other
+
+    def __and__(self, other):
+        new = self.copy()
+        new.intersection_update(other)
+        return new
+
+    def difference(self, other):
+        return self - other
+
+    def __sub__(self, other):
+        new = self.copy()
+        new.difference_update(other)
+        return new
+
+    def symmetric_difference(self, other):
+        return self ^ other
+
+    def __xor__(self, other):
+        new = self.copy()
+        new.symmetric_difference_update(other)
+        return new
+
+    def copy(self):
+        """Return the current items as a builtin ``set``."""
+        return set(self)
+
+    def update(self, other):
+        for item in other:
+            self.add(item)
+
+    def __ior__(self, other):
+        self.update(other)
+        return self
+
+    def intersection_update(self, other):
+        # Iterate over a snapshot: remove() changes the collection
+        # that a live iterator would be walking.
+        for item in list(self):
+            if item not in other:
+                self.remove(item)
+
+    def __iand__(self, other):
+        self.intersection_update(other)
+        return self
+
+    def difference_update(self, other):
+        for item in other:
+            if item in self:
+                self.remove(item)
+
+    def __isub__(self, other):
+        self.difference_update(other)
+        return self
+
+    def symmetric_difference_update(self, other):
+        for item in other:
+            if item in self:
+                self.remove(item)
+            else:
+                self.add(item)
+
+    def __ixor__(self, other):
+        self.symmetric_difference_update(other)
+        return self
+
+    def discard(self, item):
+        """Remove ``item`` if present; a KeyError from remove() is ignored."""
+        try:
+            self.remove(item)
+        except KeyError:
+            pass
+
+    def clear(self):
+        for item in list(self):
+            self.remove(item)
diff --git a/lib/lxml/html/builder.py b/lib/lxml/html/builder.py
new file mode 100644
index 00000000..2230ccef
--- /dev/null
+++ b/lib/lxml/html/builder.py
@@ -0,0 +1,133 @@
+# --------------------------------------------------------------------
+# The ElementTree toolkit is
+# Copyright (c) 1999-2004 by Fredrik Lundh
+# --------------------------------------------------------------------
+
+"""
+A set of HTML generator tags for building HTML documents.
+
+Usage::
+
+    >>> from lxml.html.builder import *
+    >>> html = HTML(
+    ...            HEAD( TITLE("Hello World") ),
+    ...            BODY( CLASS("main"),
+    ...                  H1("Hello World !")
+    ...            )
+    ...        )
+
+    >>> import lxml.etree
+    >>> print lxml.etree.tostring(html, pretty_print=True)
+    <html>
+      <head>
+        <title>Hello World</title>
+      </head>
+      <body class="main">
+        <h1>Hello World !</h1>
+      </body>
+    </html>
+
+"""
+
+from lxml.builder import ElementMaker
+from lxml.html import html_parser
+
+# Element factory bound to the lxml.html parser's makeelement().
+E = ElementMaker(makeelement=html_parser.makeelement)
+
+# elements
+# One upper-case alias per tag, each taken from E by attribute access.
+A = E.a # anchor
+ABBR = E.abbr # abbreviated form (e.g., WWW, HTTP, etc.)
+ACRONYM = E.acronym # acronym
+ADDRESS = E.address # information on author
+APPLET = E.applet # Java applet (DEPRECATED)
+AREA = E.area # client-side image map area
+B = E.b # bold text style
+BASE = E.base # document base URI
+BASEFONT = E.basefont # base font size (DEPRECATED)
+BDO = E.bdo # I18N BiDi over-ride
+BIG = E.big # large text style
+BLOCKQUOTE = E.blockquote # long quotation
+BODY = E.body # document body
+BR = E.br # forced line break
+BUTTON = E.button # push button
+CAPTION = E.caption # table caption
+CENTER = E.center # shorthand for DIV align=center (DEPRECATED)
+CITE = E.cite # citation
+CODE = E.code # computer code fragment
+COL = E.col # table column
+COLGROUP = E.colgroup # table column group
+DD = E.dd # definition description
+DEL = getattr(E, 'del') # deleted text ("del" is a Python keyword, hence getattr)
+DFN = E.dfn # instance definition
+DIR = E.dir # directory list (DEPRECATED)
+DIV = E.div # generic language/style container
+DL = E.dl # definition list
+DT = E.dt # definition term
+EM = E.em # emphasis
+FIELDSET = E.fieldset # form control group
+FONT = E.font # local change to font (DEPRECATED)
+FORM = E.form # interactive form
+FRAME = E.frame # subwindow
+FRAMESET = E.frameset # window subdivision
+H1 = E.h1 # heading
+H2 = E.h2 # heading
+H3 = E.h3 # heading
+H4 = E.h4 # heading
+H5 = E.h5 # heading
+H6 = E.h6 # heading
+HEAD = E.head # document head
+HR = E.hr # horizontal rule
+HTML = E.html # document root element
+I = E.i # italic text style
+IFRAME = E.iframe # inline subwindow
+IMG = E.img # Embedded image
+INPUT = E.input # form control
+INS = E.ins # inserted text
+ISINDEX = E.isindex # single line prompt (DEPRECATED)
+KBD = E.kbd # text to be entered by the user
+LABEL = E.label # form field label text
+LEGEND = E.legend # fieldset legend
+LI = E.li # list item
+LINK = E.link # a media-independent link
+MAP = E.map # client-side image map
+MENU = E.menu # menu list (DEPRECATED)
+META = E.meta # generic metainformation
+NOFRAMES = E.noframes # alternate content container for non frame-based rendering
+NOSCRIPT = E.noscript # alternate content container for non script-based rendering
+OBJECT = E.object # generic embedded object
+OL = E.ol # ordered list
+OPTGROUP = E.optgroup # option group
+OPTION = E.option # selectable choice
+P = E.p # paragraph
+PARAM = E.param # named property value
+PRE = E.pre # preformatted text
+Q = E.q # short inline quotation
+S = E.s # strike-through text style (DEPRECATED)
+SAMP = E.samp # sample program output, scripts, etc.
+SCRIPT = E.script # script statements
+SELECT = E.select # option selector
+SMALL = E.small # small text style
+SPAN = E.span # generic language/style container
+STRIKE = E.strike # strike-through text (DEPRECATED)
+STRONG = E.strong # strong emphasis
+STYLE = E.style # style info
+SUB = E.sub # subscript
+SUP = E.sup # superscript
+TABLE = E.table # table
+TBODY = E.tbody # table body
+TD = E.td # table data cell
+TEXTAREA = E.textarea # multi-line text field
+TFOOT = E.tfoot # table footer
+TH = E.th # table header cell
+THEAD = E.thead # table header
+TITLE = E.title # document title
+TR = E.tr # table row
+TT = E.tt # teletype or monospaced text style
+U = E.u # underlined text style (DEPRECATED)
+UL = E.ul # unordered list
+VAR = E.var # instance of a variable or program argument
+
+# attributes (only reserved words are included here)
+ATTR = dict
+
+
+def CLASS(v):
+    """Return a one-entry attribute dict mapping ``'class'`` to ``v``."""
+    attributes = {}
+    attributes['class'] = v
+    return attributes
+
+
+def FOR(v):
+    """Return a one-entry attribute dict mapping ``'for'`` to ``v``."""
+    attributes = {}
+    attributes['for'] = v
+    return attributes
diff --git a/lib/lxml/html/clean.py b/lib/lxml/html/clean.py
new file mode 100644
index 00000000..605ea86a
--- /dev/null
+++ b/lib/lxml/html/clean.py
@@ -0,0 +1,724 @@
+"""A cleanup tool for HTML.
+
+Removes unwanted tags and content.  See the `Cleaner` class for
+details.
+"""
+
+import re
+import copy
+try:
+    from urlparse import urlsplit
+except ImportError:
+    # Python 3
+    from urllib.parse import urlsplit
+from lxml import etree
+from lxml.html import defs
+from lxml.html import fromstring, tostring, XHTML_NAMESPACE
+from lxml.html import xhtml_to_html, _transform_result
+
+try:
+    unichr
+except NameError:
+    # Python 3
+    unichr = chr
+try:
+    unicode
+except NameError:
+    # Python 3
+    unicode = str
+try:
+    bytes
+except NameError:
+    # Python < 2.6
+    bytes = str
+try:
+    basestring
+except NameError:
+    basestring = (str, bytes)
+
+
+__all__ = ['clean_html', 'clean', 'Cleaner', 'autolink', 'autolink_html',
+           'word_break', 'word_break_html']
+
+# Look at http://code.sixapart.com/trac/livejournal/browser/trunk/cgi-bin/cleanhtml.pl
+#   Particularly the CSS cleaning; most of the tag cleaning is integrated now
+# I have multiple kinds of schemes searched; but should schemes be
+#   whitelisted instead?
+# max height?
+# remove images?  Also in CSS?  background attribute?
+# Some way to whitelist object, iframe, etc (e.g., if you want to
+#   allow *just* embedded YouTube movies)
+# Log what was deleted and why?
+# style="behavior: ..." might be bad in IE?
+# Should we have something for just <meta http-equiv>?  That's the worst of the
+#   metas.
+# UTF-7 detections?  Example:
+#     <HEAD><META HTTP-EQUIV="CONTENT-TYPE" CONTENT="text/html; charset=UTF-7"> </HEAD>+ADw-SCRIPT+AD4-alert('XSS');+ADw-/SCRIPT+AD4-
+#   you don't always have to have the charset set, if the page has no charset
+#   and there's UTF7-like code in it.
+# Look at these tests: http://htmlpurifier.org/live/smoketests/xssAttacks.php
+
+
+# This is an IE-specific construct you can have in a stylesheet to
+# run some Javascript.  The match is lazy and stops at the first
+# closing parenthesis; re.S lets it run across line breaks:
+_css_javascript_re = re.compile(
+    r'expression\s*\(.*?\)', re.S|re.I)
+
+# Do I have to worry about @\nimport?
+# (``\s*`` already allows whitespace, including newlines, between the
+# ``@`` and ``import``.)
+_css_import_re = re.compile(
+    r'@\s*import', re.I)
+
+# All kinds of schemes besides just javascript: that can cause
+# execution (leading whitespace before the scheme is tolerated):
+_javascript_scheme_re = re.compile(
+    r'\s*(?:javascript|jscript|livescript|vbscript|data|about|mocha):', re.I)
+# Bound ``sub`` of a whitespace pattern: call as (replacement, text).
+_substitute_whitespace = re.compile(r'\s+').sub
+# FIXME: should data: be blocked?
+
+# Matches text of the form ``[if ...]>``, ignoring case.
+# FIXME: check against: http://msdn2.microsoft.com/en-us/library/ms537512.aspx
+_conditional_comment_re = re.compile(
+    r'\[if[\s\n\r]+.*?][\s\n\r]*>', re.I|re.S)
+
+# Every element (the context node included) that has a style attribute.
+_find_styled_elements = etree.XPath(
+    "descendant-or-self::*[@style]")
+
+# <a> elements, with or without the XHTML namespace, whose href is
+# non-empty after whitespace normalisation and does not start with '#'.
+_find_external_links = etree.XPath(
+    ("descendant-or-self::a  [normalize-space(@href) and substring(normalize-space(@href),1,1) != '#'] |"
+     "descendant-or-self::x:a[normalize-space(@href) and substring(normalize-space(@href),1,1) != '#']"),
+    namespaces={'x':XHTML_NAMESPACE})
+
+class Cleaner(object):
+    """
+    Instances clean the document of each of the possible offending
+    elements.  The cleaning is controlled by attributes; you can
+    override attributes in a subclass, or set them in the constructor.
+
+    ``scripts``:
+        Removes any ``<script>`` tags.
+
+    ``javascript``:
+        Removes any Javascript, like an ``onclick`` attribute. Also removes stylesheets
+        as they could contain Javascript.
+
+    ``comments``:
+        Removes any comments.
+
+    ``style``:
+        Removes any style tags or attributes.
+
+    ``links``:
+        Removes any ``<link>`` tags
+
+    ``meta``:
+        Removes any ``<meta>`` tags
+
+    ``page_structure``:
+        Structural parts of a page: ``<head>``, ``<html>``, ``<title>``.
+
+    ``processing_instructions``:
+        Removes any processing instructions.
+
+    ``embedded``:
+        Removes any embedded objects (flash, iframes)
+
+    ``frames``:
+        Removes any frame-related tags
+
+    ``forms``:
+        Removes any form tags
+
+    ``annoying_tags``:
+        Tags that aren't *wrong*, but are annoying.  ``<blink>`` and ``<marquee>``
+
+    ``remove_tags``:
+        A list of tags to remove.  Only the tags will be removed,
+        their content will get pulled up into the parent tag.
+
+    ``kill_tags``:
+        A list of tags to kill.  Killing also removes the tag's content,
+        i.e. the whole subtree, not just the tag itself.
+
+    ``allow_tags``:
+        A list of tags to include (default include all).
+
+    ``remove_unknown_tags``:
+        Remove any tags that aren't standard parts of HTML.
+
+    ``safe_attrs_only``:
+        If true, only include 'safe' attributes (specifically the list
+        from the feedparser HTML sanitisation web site).
+
+    ``safe_attrs``:
+        A set of attribute names to override the default list of attributes
+        considered 'safe' (when safe_attrs_only=True).
+
+    ``add_nofollow``:
+        If true, then any <a> tags will have ``rel="nofollow"`` added to them.
+
+    ``host_whitelist``:
+        A list or set of hosts that you can use for embedded content
+        (for content like ``<object>``, ``<link rel="stylesheet">``, etc).
+        You can also implement/override the method
+        ``allow_embedded_url(el, url)`` or ``allow_element(el)`` to
+        implement more complex rules for what can be embedded.
+        Anything that passes this test will be shown, regardless of
+        the value of (for instance) ``embedded``.
+
+        Note that this parameter might not work as intended if you do not
+        make the links absolute before doing the cleaning.
+
+        Note that you may also need to set ``whitelist_tags``.
+
+    ``whitelist_tags``:
+        A set of tags that can be included with ``host_whitelist``.
+        The default is ``iframe`` and ``embed``; you may wish to
+        include other tags like ``script``, or you may want to
+        implement ``allow_embedded_url`` for more control.  Set to None to
+        include all tags.
+
+    This modifies the document *in place*.
+    """
+
+    scripts = True
+    javascript = True
+    comments = True
+    style = False
+    links = True
+    meta = True
+    page_structure = True
+    processing_instructions = True
+    embedded = True
+    frames = True
+    forms = True
+    annoying_tags = True
+    remove_tags = None
+    allow_tags = None
+    kill_tags = None
+    remove_unknown_tags = True
+    safe_attrs_only = True
+    safe_attrs = defs.safe_attrs
+    add_nofollow = False
+    host_whitelist = ()
+    whitelist_tags = set(['iframe', 'embed'])
+
+    def __init__(self, **kw):
+        """
+        Override cleaning options by keyword.
+
+        Each keyword must name an attribute that already exists on the
+        instance (i.e. one of the class-level defaults); anything else
+        raises TypeError.
+        """
+        for option, setting in kw.items():
+            if hasattr(self, option):
+                setattr(self, option, setting)
+                continue
+            raise TypeError(
+                "Unknown parameter: %s=%r" % (option, setting))
+
+    # Used to lookup the primary URL for a given tag that is up for
+    # removal:
+    _tag_link_attrs = dict(
+        script='src',
+        link='href',
+        # From: http://java.sun.com/j2se/1.4.2/docs/guide/misc/applet.html
+        # From what I can tell, both attributes can contain a link:
+        applet=['code', 'object'],
+        iframe='src',
+        embed='src',
+        layer='src',
+        # FIXME: there doesn't really seem like a general way to figure out what
+        # links an <object> tag uses; links often go in <param> tags with values
+        # that we don't really know.  You'd have to have knowledge about specific
+        # kinds of plugins (probably keyed off classid), and match against those.
+        ##object=?,
+        # FIXME: not looking at the action currently, because it is more complex
+        # than that -- if you keep the form, you should keep the form controls.
+        ##form='action',
+        a='href',
+        )
+
+    def __call__(self, doc):
+        """
+        Cleans the document.
+        """
+        if hasattr(doc, 'getroot'):
+            # ElementTree instance, instead of an element
+            doc = doc.getroot()
+        # convert XHTML to HTML
+        xhtml_to_html(doc)
+        # Normalize a case that IE treats <image> like <img>, and that
+        # can confuse either this step or later steps.
+        for el in doc.iter('image'):
+            el.tag = 'img'
+        if not self.comments:
+            # Of course, if we were going to kill comments anyway, we don't
+            # need to worry about this
+            self.kill_conditional_comments(doc)
+
+        kill_tags = set(self.kill_tags or ())
+        remove_tags = set(self.remove_tags or ())
+        allow_tags = set(self.allow_tags or ())
+
+        if self.scripts:
+            kill_tags.add('script')
+        if self.safe_attrs_only:
+            safe_attrs = set(self.safe_attrs)
+            for el in doc.iter():
+                attrib = el.attrib
+                for aname in attrib.keys():
+                    if aname not in safe_attrs:
+                        del attrib[aname]
+        if self.javascript:
+            if not (self.safe_attrs_only and
+                    self.safe_attrs == defs.safe_attrs):
+                # safe_attrs handles events attributes itself
+                for el in doc.iter():
+                    attrib = el.attrib
+                    for aname in attrib.keys():
+                        if aname.startswith('on'):
+                            del attrib[aname]
+            doc.rewrite_links(self._remove_javascript_link,
+                              resolve_base_href=False)
+            if not self.style:
+                # If we're deleting style then we don't have to remove JS links
+                # from styles, otherwise...
+                for el in _find_styled_elements(doc):
+                    old = el.get('style')
+                    new = _css_javascript_re.sub('', old)
+                    new = _css_import_re.sub('', new)
+                    if self._has_sneaky_javascript(new):
+                        # Something tricky is going on...
+                        del el.attrib['style']
+                    elif new != old:
+                        el.set('style', new)
+                for el in list(doc.iter('style')):
+                    if el.get('type', '').lower().strip() == 'text/javascript':
+                        el.drop_tree()
+                        continue
+                    old = el.text or ''
+                    new = _css_javascript_re.sub('', old)
+                    # The imported CSS can do anything; we just can't allow:
+                    new = _css_import_re.sub('', old)
+                    if self._has_sneaky_javascript(new):
+                        # Something tricky is going on...
+                        el.text = '/* deleted */'
+                    elif new != old:
+                        el.text = new
+        if self.comments or self.processing_instructions:
+            # FIXME: why either?  I feel like there's some obscure reason
+            # because you can put PIs in comments...?  But I've already
+            # forgotten it
+            kill_tags.add(etree.Comment)
+        if self.processing_instructions:
+            kill_tags.add(etree.ProcessingInstruction)
+        if self.style:
+            kill_tags.add('style')
+            etree.strip_attributes(doc, 'style')
+        if self.links:
+            kill_tags.add('link')
+        elif self.style or self.javascript:
+            # We must get rid of included stylesheets if Javascript is not
+            # allowed, as you can put Javascript in them
+            for el in list(doc.iter('link')):
+                if 'stylesheet' in el.get('rel', '').lower():
+                    # Note this kills alternate stylesheets as well
+                    if not self.allow_element(el):
+                        el.drop_tree()
+        if self.meta:
+            kill_tags.add('meta')
+        if self.page_structure:
+            remove_tags.update(('head', 'html', 'title'))
+        if self.embedded:
+            # FIXME: is <layer> really embedded?
+            # We should get rid of any <param> tags not inside <applet>;
+            # These are not really valid anyway.
+            for el in list(doc.iter('param')):
+                found_parent = False
+                parent = el.getparent()
+                while parent is not None and parent.tag not in ('applet', 'object'):
+                    parent = parent.getparent()
+                if parent is None:
+                    el.drop_tree()
+            kill_tags.update(('applet',))
+            # The alternate contents that are in an iframe are a good fallback:
+            remove_tags.update(('iframe', 'embed', 'layer', 'object', 'param'))
+        if self.frames:
+            # FIXME: ideally we should look at the frame links, but
+            # generally frames don't mix properly with an HTML
+            # fragment anyway.
+            kill_tags.update(defs.frame_tags)
+        if self.forms:
+            remove_tags.add('form')
+            kill_tags.update(('button', 'input', 'select', 'textarea'))
+        if self.annoying_tags:
+            remove_tags.update(('blink', 'marquee'))
+
+        _remove = []
+        _kill = []
+        for el in doc.iter():
+            if el.tag in kill_tags:
+                if self.allow_element(el):
+                    continue
+                _kill.append(el)
+            elif el.tag in remove_tags:
+                if self.allow_element(el):
+                    continue
+                _remove.append(el)
+
+        if _remove and _remove[0] == doc:
+            # We have to drop the parent-most tag, which we can't
+            # do.  Instead we'll rewrite it:
+            el = _remove.pop(0)
+            el.tag = 'div'
+            el.attrib.clear()
+        elif _kill and _kill[0] == doc:
+            # We have to drop the parent-most element, which we can't
+            # do.  Instead we'll clear it:
+            el = _kill.pop(0)
+            if el.tag != 'html':
+                el.tag = 'div'
+            el.clear()
+
+        _kill.reverse() # start with innermost tags
+        for el in _kill:
+            el.drop_tree()
+        for el in _remove:
+            el.drop_tag()
+
+        if self.remove_unknown_tags:
+            if allow_tags:
+                raise ValueError(
+                    "It does not make sense to pass in both allow_tags and remove_unknown_tags")
+            allow_tags = set(defs.tags)
+        if allow_tags:
+            bad = []
+            for el in doc.iter():
+                if el.tag not in allow_tags:
+                    bad.append(el)
+            if bad:
+                if bad[0] is doc:
+                    el = bad.pop(0)
+                    el.tag = 'div'
+                    el.attrib.clear()
+                for el in bad:
+                    el.drop_tag()
+        if self.add_nofollow:
+            for el in _find_external_links(doc):
+                if not self.allow_follow(el):
+                    rel = el.get('rel')
+                    if rel:
+                        if ('nofollow' in rel
+                                and ' nofollow ' in (' %s ' % rel)):
+                            continue
+                        rel = '%s nofollow' % rel
+                    else:
+                        rel = 'nofollow'
+                    el.set('rel', rel)
+
+    def allow_follow(self, anchor):
+        """
+        Override to suppress rel="nofollow" on some anchors.
+
+        Called by ``__call__`` for each external link when
+        ``add_nofollow`` is set; a true return value leaves the link's
+        ``rel`` untouched.  This default returns False for every anchor.
+        """
+        return False
+
+    def allow_element(self, el):
+        if el.tag not in self._tag_link_attrs:
+            return False
+        attr = self._tag_link_attrs[el.tag]
+        if isinstance(attr, (list, tuple)):
+            for one_attr in attr:
+                url = el.get(one_attr)
+                if not url:
+                    return False
+                if not self.allow_embedded_url(el, url):
+                    return False
+            return True
+        else:
+            url = el.get(attr)
+            if not url:
+                return False
+            return self.allow_embedded_url(el, url)
+
+    def allow_embedded_url(self, el, url):
+        if (self.whitelist_tags is not None
+            and el.tag not in self.whitelist_tags):
+            return False
+        scheme, netloc, path, query, fragment = urlsplit(url)
+        netloc = netloc.lower().split(':', 1)[0]
+        if scheme not in ('http', 'https'):
+            return False
+        if netloc in self.host_whitelist:
+            return True
+        return False
+
+    def kill_conditional_comments(self, doc):
+        """
+        IE conditional comments basically embed HTML that the parser
+        doesn't normally see.  We can't allow anything like that, so
+        we'll kill any comments that could be conditional.
+        """
+        bad = []
+        self._kill_elements(
+            doc, lambda el: _conditional_comment_re.search(el.text),
+            etree.Comment)                
+
+    def _kill_elements(self, doc, condition, iterate=None):
+        bad = []
+        for el in doc.iter(iterate):
+            if condition(el):
+                bad.append(el)
+        for el in bad:
+            el.drop_tree()
+
+    def _remove_javascript_link(self, link):
+        # links like "j a v a s c r i p t:" might be interpreted in IE
+        new = _substitute_whitespace('', link)
+        if _javascript_scheme_re.search(new):
+            # FIXME: should this be None to delete?
+            return ''
+        return link
+
+    # Substitution function over CSS-style /* ... */ comments (non-greedy,
+    # may span lines); used by _has_sneaky_javascript() to strip them.
+    _substitute_comments = re.compile(r'/\*.*?\*/', re.S).sub
+
+    def _has_sneaky_javascript(self, style):
+        """
+        Depending on the browser, stuff like ``e x p r e s s i o n(...)``
+        can get interpreted, or ``expre/* stuff */ssion(...)``.  This
+        checks for attempt to do stuff like this.
+
+        Typically the response will be to kill the entire style; if you
+        have just a bit of Javascript in the style another rule will catch
+        that and remove only the Javascript from the style; this catches
+        more sneaky attempts.
+        """
+        style = self._substitute_comments('', style)
+        style = style.replace('\\', '')
+        style = _substitute_whitespace('', style)
+        style = style.lower()
+        if 'javascript:' in style:
+            return True
+        if 'expression(' in style:
+            return True
+        return False
+
+    def clean_html(self, html):
+        result_type = type(html)
+        if isinstance(html, basestring):
+            doc = fromstring(html)
+        else:
+            doc = copy.deepcopy(html)
+        self(doc)
+        return _transform_result(result_type, doc)
+
+# Module-level cleaner created with no arguments, and a shortcut to its
+# clean_html() method:
+clean = Cleaner()
+clean_html = clean.clean_html
+
+############################################################
+## Autolinking
+############################################################
+
+# Default patterns autolink() searches for.  _link_text() reads two named
+# groups from every match: ``host`` (tested against the avoid_hosts
+# patterns) and ``body`` (used as the text of the generated link).
+_link_regexes = [
+    re.compile(r'(?P<body>https?://(?P<host>[a-z0-9._-]+)(?:/[/\-_.,a-z0-9%&?;=~]*)?(?:\([/\-_.,a-z0-9%&?;=~]*\))?)', re.I),
+    # This is conservative, but autolinking can be a bit conservative:
+    re.compile(r'mailto:(?P<body>[a-z0-9._-]+@(?P<host>[a-z0-9_._]+[a-z]))', re.I),
+    ]
+
+# Default tags whose content autolink() leaves alone:
+_avoid_elements = ['textarea', 'pre', 'code', 'head', 'select', 'a']
+
+# Default host patterns autolink() never links to:
+_avoid_hosts = [
+    re.compile(r'^localhost', re.I),
+    re.compile(r'\bexample\.(?:com|org|net)$', re.I),
+    re.compile(r'^127\.0\.0\.1$'),
+    ]
+
+# Default class names that switch autolinking off for an element:
+_avoid_classes = ['nolink']
+
+def autolink(el, link_regexes=_link_regexes,
+             avoid_elements=_avoid_elements,
+             avoid_hosts=_avoid_hosts,
+             avoid_classes=_avoid_classes):
+    """
+    Turn any URLs into links.
+
+    It will search for links identified by the given regular
+    expressions (by default mailto and http(s) links).
+
+    It won't link text in an element in avoid_elements, or an element
+    with a class in avoid_classes.  It won't link to anything with a
+    host that matches one of the regular expressions in avoid_hosts
+    (default localhost and 127.0.0.1).
+
+    If you pass in an element, the element's tail will not be
+    substituted, only the contents of the element.
+    """
+    if el.tag in avoid_elements:
+        return
+    class_name = el.get('class')
+    if class_name:
+        class_name = class_name.split()
+        for match_class in avoid_classes:
+            if match_class in class_name:
+                return
+    for child in list(el):
+        autolink(child, link_regexes=link_regexes,
+                 avoid_elements=avoid_elements,
+                 avoid_hosts=avoid_hosts,
+                 avoid_classes=avoid_classes)
+        if child.tail:
+            text, tail_children = _link_text(
+                child.tail, link_regexes, avoid_hosts, factory=el.makeelement)
+            if tail_children:
+                child.tail = text
+                index = el.index(child)
+                el[index+1:index+1] = tail_children
+    if el.text:
+        text, pre_children = _link_text(
+            el.text, link_regexes, avoid_hosts, factory=el.makeelement)
+        if pre_children:
+            el.text = text
+            el[:0] = pre_children
+
+def _link_text(text, link_regexes, avoid_hosts, factory):
+    leading_text = ''
+    links = []
+    last_pos = 0
+    while 1:
+        best_match, best_pos = None, None
+        for regex in link_regexes:
+            regex_pos = last_pos
+            while 1:
+                match = regex.search(text, pos=regex_pos)
+                if match is None:
+                    break
+                host = match.group('host')
+                for host_regex in avoid_hosts:
+                    if host_regex.search(host):
+                        regex_pos = match.end()
+                        break
+                else:
+                    break
+            if match is None:
+                continue
+            if best_pos is None or match.start() < best_pos:
+                best_match = match
+                best_pos = match.start()
+        if best_match is None:
+            # No more matches
+            if links:
+                assert not links[-1].tail
+                links[-1].tail = text
+            else:
+                assert not leading_text
+                leading_text = text
+            break
+        link = best_match.group(0)
+        end = best_match.end()
+        if link.endswith('.') or link.endswith(','):
+            # These punctuation marks shouldn't end a link
+            end -= 1
+            link = link[:-1]
+        prev_text = text[:best_match.start()]
+        if links:
+            assert not links[-1].tail
+            links[-1].tail = prev_text
+        else:
+            assert not leading_text
+            leading_text = prev_text
+        anchor = factory('a')
+        anchor.set('href', link)
+        body = best_match.group('body')
+        if not body:
+            body = link
+        if body.endswith('.') or body.endswith(','):
+            body = body[:-1]
+        anchor.text = body
+        links.append(anchor)
+        text = text[end:]
+    return leading_text, links
+                
+def autolink_html(html, *args, **kw):
+    result_type = type(html)
+    if isinstance(html, basestring):
+        doc = fromstring(html)
+    else:
+        doc = copy.deepcopy(html)
+    autolink(doc, *args, **kw)
+    return _transform_result(result_type, doc)
+
+autolink_html.__doc__ = autolink.__doc__
+
+############################################################
+## Word wrapping
+############################################################
+
+# Defaults for word_break(): tags and class names that are left unbroken.
+_avoid_word_break_elements = ['pre', 'textarea', 'code']
+_avoid_word_break_classes = ['nobreak']
+
+def word_break(el, max_width=40,
+               avoid_elements=_avoid_word_break_elements,
+               avoid_classes=_avoid_word_break_classes,
+               break_character=unichr(0x200b)):
+    """
+    Breaks any long words found in the body of the text (not attributes).
+
+    Doesn't effect any of the tags in avoid_elements, by default
+    ``<textarea>`` and ``<pre>``
+
+    Breaks words by inserting &#8203;, which is a unicode character
+    for Zero Width Space character.  This generally takes up no space
+    in rendering, but does copy as a space, and in monospace contexts
+    usually takes up space.
+
+    See http://www.cs.tut.fi/~jkorpela/html/nobr.html for a discussion
+    """
+    # Character suggestion of &#8203 comes from:
+    #   http://www.cs.tut.fi/~jkorpela/html/nobr.html
+    if el.tag in _avoid_word_break_elements:
+        return
+    class_name = el.get('class')
+    if class_name:
+        dont_break = False
+        class_name = class_name.split()
+        for avoid in avoid_classes:
+            if avoid in class_name:
+                dont_break = True
+                break
+        if dont_break:
+            return
+    if el.text:
+        el.text = _break_text(el.text, max_width, break_character)
+    for child in el:
+        word_break(child, max_width=max_width,
+                   avoid_elements=avoid_elements,
+                   avoid_classes=avoid_classes,
+                   break_character=break_character)
+        if child.tail:
+            child.tail = _break_text(child.tail, max_width, break_character)
+
+def word_break_html(html, *args, **kw):
+    result_type = type(html)
+    doc = fromstring(html)
+    word_break(doc, *args, **kw)
+    return _transform_result(result_type, doc)
+
+def _break_text(text, max_width, break_character):
+    words = text.split()
+    for word in words:
+        if len(word) > max_width:
+            replacement = _insert_break(word, max_width, break_character)
+            text = text.replace(word, replacement)
+    return text
+
+# Matches any character that is not an ASCII letter; _insert_break()
+# prefers to put a break right after such a character.
+_break_prefer_re = re.compile(r'[^a-z]', re.I)
+
+def _insert_break(word, width, break_character):
+    orig_word = word
+    result = ''
+    while len(word) > width:
+        start = word[:width]
+        breaks = list(_break_prefer_re.finditer(start))
+        if breaks:
+            last_break = breaks[-1]
+            # Only walk back up to 10 characters to find a nice break:
+            if last_break.end() > width-10:
+                # FIXME: should the break character be at the end of the
+                # chunk, or the beginning of the next chunk?
+                start = word[:last_break.end()]
+        result += start + break_character
+        word = word[len(start):]
+    result += word
+    return result
+    
diff --git a/lib/lxml/html/defs.py b/lib/lxml/html/defs.py
new file mode 100644
index 00000000..e6ca5882
--- /dev/null
+++ b/lib/lxml/html/defs.py
@@ -0,0 +1,137 @@
+# FIXME: this should all be confirmed against what a DTD says
+# (probably in a test; this may not match the DTD exactly, but we
+# should document just how it differs).
+
+# Data taken from http://www.w3.org/TR/html401/index/elements.html
+# and http://www.w3.org/community/webed/wiki/HTML/New_HTML5_Elements
+# for html5_tags.
+
+# Fall back to sets.Set (a mutable set) on Python versions that have no
+# builtin frozenset:
+try:
+    frozenset
+except NameError:
+    from sets import Set as frozenset
+
+
+# Presumably the elements the HTML 4.01 element index lists as empty --
+# verify against the DTD (see the FIXME at the top of this file).
+empty_tags = frozenset([
+    'area', 'base', 'basefont', 'br', 'col', 'frame', 'hr',
+    'img', 'input', 'isindex', 'link', 'meta', 'param'])
+
+# Presumably the elements the HTML 4.01 element index marks as deprecated.
+deprecated_tags = frozenset([
+    'applet', 'basefont', 'center', 'dir', 'font', 'isindex',
+    'menu', 's', 'strike', 'u'])
+
+# Attributes whose value is a link.
+# archive actually takes a space-separated list of URIs
+link_attrs = frozenset([
+    'action', 'archive', 'background', 'cite', 'classid',
+    'codebase', 'data', 'href', 'longdesc', 'profile', 'src',
+    'usemap',
+    # Not standard:
+    'dynsrc', 'lowsrc',
+    ])
+
+# Event handler attributes.
+# Not in the HTML 4 spec:
+# onerror, onresize
+event_attrs = frozenset([
+    'onblur', 'onchange', 'onclick', 'ondblclick', 'onerror',
+    'onfocus', 'onkeydown', 'onkeypress', 'onkeyup', 'onload',
+    'onmousedown', 'onmousemove', 'onmouseout', 'onmouseover',
+    'onmouseup', 'onreset', 'onresize', 'onselect', 'onsubmit',
+    'onunload',
+    ])
+
+# Attributes treated as safe to keep.  Note that neither ``style`` nor
+# any of the event_attrs above is listed here.
+safe_attrs = frozenset([
+    'abbr', 'accept', 'accept-charset', 'accesskey', 'action', 'align',
+    'alt', 'axis', 'border', 'cellpadding', 'cellspacing', 'char', 'charoff',
+    'charset', 'checked', 'cite', 'class', 'clear', 'cols', 'colspan',
+    'color', 'compact', 'coords', 'datetime', 'dir', 'disabled', 'enctype',
+    'for', 'frame', 'headers', 'height', 'href', 'hreflang', 'hspace', 'id',
+    'ismap', 'label', 'lang', 'longdesc', 'maxlength', 'media', 'method',
+    'multiple', 'name', 'nohref', 'noshade', 'nowrap', 'prompt', 'readonly',
+    'rel', 'rev', 'rows', 'rowspan', 'rules', 'scope', 'selected', 'shape',
+    'size', 'span', 'src', 'start', 'summary', 'tabindex', 'target', 'title',
+    'type', 'usemap', 'valign', 'value', 'vspace', 'width'])
+
+# The groups below classify tag names; ``tags`` at the end of this file
+# is the union of most of them.
+
+# From http://htmlhelp.com/reference/html40/olist.html
+top_level_tags = frozenset([
+    'html', 'head', 'body', 'frameset',
+    ])
+
+head_tags = frozenset([
+    'base', 'isindex', 'link', 'meta', 'script', 'style', 'title',
+    ])
+
+general_block_tags = frozenset([
+    'address',
+    'blockquote',
+    'center',
+    'del',
+    'div',
+    'h1',
+    'h2',
+    'h3',
+    'h4',
+    'h5',
+    'h6',
+    'hr',
+    'ins',
+    'isindex',
+    'noscript',
+    'p',
+    'pre',
+    ])
+
+list_tags = frozenset([
+    'dir', 'dl', 'dt', 'dd', 'li', 'menu', 'ol', 'ul',
+    ])
+
+table_tags = frozenset([
+    'table', 'caption', 'colgroup', 'col',
+    'thead', 'tfoot', 'tbody', 'tr', 'td', 'th',
+    ])
+
+# All block-level tags: the general, list and table groups above plus
+# some of the form tags.
+# just this one from
+# http://www.georgehernandez.com/h/XComputers/HTML/2BlockLevel.htm
+block_tags = general_block_tags | list_tags | table_tags | frozenset([
+    # Partial form tags
+    'fieldset', 'form', 'legend', 'optgroup', 'option',
+    ])
+
+form_tags = frozenset([
+    'form', 'button', 'fieldset', 'legend', 'input', 'label',
+    'select', 'optgroup', 'option', 'textarea',
+    ])
+
+special_inline_tags = frozenset([
+    'a', 'applet', 'basefont', 'bdo', 'br', 'embed', 'font', 'iframe',
+    'img', 'map', 'area', 'object', 'param', 'q', 'script',
+    'span', 'sub', 'sup',
+    ])
+
+phrase_tags = frozenset([
+    'abbr', 'acronym', 'cite', 'code', 'del', 'dfn', 'em',
+    'ins', 'kbd', 'samp', 'strong', 'var',
+    ])
+
+font_style_tags = frozenset([
+    'b', 'big', 'i', 's', 'small', 'strike', 'tt', 'u',
+    ])
+
+frame_tags = frozenset([
+    'frameset', 'frame', 'noframes',
+    ])
+    
+# Elements new in HTML5 (see the source URL at the top of this file).
+html5_tags = frozenset([
+    'article', 'aside', 'audio', 'canvas', 'command', 'datalist',
+    'details', 'embed', 'figcaption', 'figure', 'footer', 'header',
+    'hgroup', 'keygen', 'mark', 'math', 'meter', 'nav', 'output',
+    'progress', 'rp', 'rt', 'ruby', 'section', 'source', 'summary',
+    'svg', 'time', 'track', 'video', 'wbr'
+    ])
+
+# These tags aren't standard
+nonstandard_tags = frozenset(['blink', 'marquee'])
+
+
+# Every tag name known to this module.  block_tags, frame_tags,
+# empty_tags and deprecated_tags are not part of the union as such;
+# NOTE(review): 'frame' and 'noframes' appear in no group that is
+# included here -- confirm that this is intended.
+tags = (top_level_tags | head_tags | general_block_tags | list_tags
+        | table_tags | form_tags | special_inline_tags | phrase_tags
+        | font_style_tags | nonstandard_tags | html5_tags)
diff --git a/lib/lxml/html/diff.py b/lib/lxml/html/diff.py
new file mode 100644
index 00000000..c6a62c67
--- /dev/null
+++ b/lib/lxml/html/diff.py
@@ -0,0 +1,881 @@
+import difflib
+from lxml import etree
+from lxml.html import fragment_fromstring
+import re
+
+__all__ = ['html_annotate', 'htmldiff']
+
+try:
+    from html import escape as html_escape
+except ImportError:
+    from cgi import escape as html_escape
+try:
+    _unicode = unicode
+except NameError:
+    # Python 3
+    _unicode = str
+try:
+    basestring
+except NameError:
+    # Python 3
+    basestring = str
+
+############################################################
+## Annotation
+############################################################
+
+def default_markup(text, version):
+    return '<span title="%s">%s</span>' % (
+        html_escape(_unicode(version), 1), text)
+
+def html_annotate(doclist, markup=default_markup):
+    """
+    doclist should be ordered from oldest to newest, like::
+
+        >>> version1 = 'Hello World'
+        >>> version2 = 'Goodbye World'
+        >>> print(html_annotate([(version1, 'version 1'),
+        ...                      (version2, 'version 2')]))
+        <span title="version 2">Goodbye</span> <span title="version 1">World</span>
+
+    The documents must be *fragments* (str/UTF8 or unicode), not
+    complete documents
+
+    The markup argument is a function to markup the spans of words.
+    This function is called like markup('Hello', 'version 2'), and
+    returns HTML.  The first argument is text and never includes any
+    markup.  The default uses a span with a title:
+
+        >>> print(default_markup('Some Text', 'by Joe'))
+        <span title="by Joe">Some Text</span>
+    """
+    # The basic strategy we have is to split the documents up into
+    # logical tokens (which are words with attached markup).  We then
+    # do diffs of each of the versions to track when a token first
+    # appeared in the document; the annotation attached to the token
+    # is the version where it first appeared.
+    tokenlist = [tokenize_annotated(doc, version)
+                 for doc, version in doclist]
+    cur_tokens = tokenlist[0]
+    for tokens in tokenlist[1:]:
+        html_annotate_merge_annotations(cur_tokens, tokens)
+        cur_tokens = tokens
+
+    # After we've tracked all the tokens, we can combine spans of text
+    # that are adjacent and have the same annotation
+    cur_tokens = compress_tokens(cur_tokens)
+    # And finally add markup
+    result = markup_serialize_tokens(cur_tokens, markup)
+    return ''.join(result).strip()
+
+def tokenize_annotated(doc, annotation): 
+    """Tokenize a document and add an annotation attribute to each token
+    """
+    tokens = tokenize(doc, include_hrefs=False)
+    for tok in tokens: 
+        tok.annotation = annotation
+    return tokens
+
+def html_annotate_merge_annotations(tokens_old, tokens_new): 
+    """Merge the annotations from tokens_old into tokens_new, when the
+    tokens in the new document already existed in the old document.
+    """
+    s = InsensitiveSequenceMatcher(a=tokens_old, b=tokens_new)
+    commands = s.get_opcodes()
+
+    for command, i1, i2, j1, j2 in commands:
+        if command == 'equal': 
+            eq_old = tokens_old[i1:i2]
+            eq_new = tokens_new[j1:j2]
+            copy_annotations(eq_old, eq_new)
+
+def copy_annotations(src, dest): 
+    """
+    Copy annotations from the tokens listed in src to the tokens in dest
+    """
+    assert len(src) == len(dest)
+    for src_tok, dest_tok in zip(src, dest): 
+        dest_tok.annotation = src_tok.annotation
+
+def compress_tokens(tokens):
+    """
+    Combine adjacent tokens when there is no HTML between the tokens, 
+    and they share an annotation
+    """
+    result = [tokens[0]] 
+    for tok in tokens[1:]: 
+        if (not result[-1].post_tags and 
+            not tok.pre_tags and 
+            result[-1].annotation == tok.annotation): 
+            compress_merge_back(result, tok)
+        else: 
+            result.append(tok)
+    return result
+
+def compress_merge_back(tokens, tok): 
+    """ Merge tok into the last element of tokens (modifying the list of
+    tokens in-place).  """
+    last = tokens[-1]
+    if type(last) is not token or type(tok) is not token: 
+        tokens.append(tok)
+    else:
+        text = _unicode(last)
+        if last.trailing_whitespace:
+            text += last.trailing_whitespace
+        text += tok
+        merged = token(text,
+                       pre_tags=last.pre_tags,
+                       post_tags=tok.post_tags,
+                       trailing_whitespace=tok.trailing_whitespace)
+        merged.annotation = last.annotation
+        tokens[-1] = merged
+    
+def markup_serialize_tokens(tokens, markup_func):
+    """
+    Serialize the list of tokens into a list of text chunks, calling
+    markup_func around text to add annotations.
+    """
+    for token in tokens:
+        for pre in token.pre_tags:
+            yield pre
+        html = token.html()
+        html = markup_func(html, token.annotation)
+        if token.trailing_whitespace:
+            html += token.trailing_whitespace
+        yield html
+        for post in token.post_tags:
+            yield post
+
+
+############################################################
+## HTML Diffs
+############################################################
+
+def htmldiff(old_html, new_html):
+    ## FIXME: this should take parsed documents too, and use their body
+    ## or other content.
+    """ Do a diff of the old and new document.  The documents are HTML
+    *fragments* (str/UTF8 or unicode), they are not complete documents
+    (i.e., no <html> tag).
+
+    Returns HTML with <ins> and <del> tags added around the
+    appropriate text.  
+
+    Markup is generally ignored, with the markup from new_html
+    preserved, and possibly some markup from old_html (though it is
+    considered acceptable to lose some of the old markup).  Only the
+    words in the HTML are diffed.  The exception is <img> tags, which
+    are treated like words, and the href attribute of <a> tags, which
+    are noted inside the tag itself when there are changes.
+    """ 
+    old_html_tokens = tokenize(old_html)
+    new_html_tokens = tokenize(new_html)
+    result = htmldiff_tokens(old_html_tokens, new_html_tokens)
+    result = ''.join(result).strip()
+    return fixup_ins_del_tags(result)
+
+def htmldiff_tokens(html1_tokens, html2_tokens):
+    """ Does a diff on the tokens themselves, returning a list of text
+    chunks (not tokens).
+    """
+    # There are several passes as we do the differences.  The tokens
+    # isolate the portion of the content we care to diff; difflib does
+    # all the actual hard work at that point.  
+    #
+    # Then we must create a valid document from pieces of both the old
+    # document and the new document.  We generally prefer to take
+    # markup from the new document, and only do a best effort attempt
+    # to keep markup from the old document; anything that we can't
+    # resolve we throw away.  Also we try to put the deletes as close
+    # to the location where we think they would have been -- because
+    # we are only keeping the markup from the new document, it can be
+    # fuzzy where in the new document the old text would have gone.
+    # Again we just do a best effort attempt.
+    s = InsensitiveSequenceMatcher(a=html1_tokens, b=html2_tokens)
+    commands = s.get_opcodes()
+    result = []
+    for command, i1, i2, j1, j2 in commands:
+        if command == 'equal':
+            result.extend(expand_tokens(html2_tokens[j1:j2], equal=True))
+            continue
+        if command == 'insert' or command == 'replace':
+            ins_tokens = expand_tokens(html2_tokens[j1:j2])
+            merge_insert(ins_tokens, result)
+        if command == 'delete' or command == 'replace':
+            del_tokens = expand_tokens(html1_tokens[i1:i2])
+            merge_delete(del_tokens, result)
+    # If deletes were inserted directly as <del> then we'd have an
+    # invalid document at this point.  Instead we put in special
+    # markers, and when the complete diffed document has been created
+    # we try to move the deletes around and resolve any problems.
+    result = cleanup_delete(result)
+
+    return result
+
+def expand_tokens(tokens, equal=False):
+    """Given a list of tokens, return a generator of the chunks of
+    text for the data in the tokens.
+    """
+    for token in tokens:
+        for pre in token.pre_tags:
+            yield pre
+        if not equal or not token.hide_when_equal:
+            if token.trailing_whitespace:
+                yield token.html() + token.trailing_whitespace
+            else:
+                yield token.html()
+        for post in token.post_tags:
+            yield post
+
+def merge_insert(ins_chunks, doc):
+    """ Appends ins_chunks to doc (the already-handled document, as a
+    list of text chunks), wrapping the balanced part in <ins></ins>. """
+    # Unbalanced start/end tags are not thrown away (we assume their
+    # counterparts appear earlier or later in the document), but only
+    # the balanced portion ends up inside the <ins>.
+    open_only, inner, close_only = split_unbalanced(ins_chunks)
+    doc.extend(open_only)
+    if doc and not doc[-1].endswith(' '):
+        # The chunk before the insert has no trailing space, so add
+        # one to keep the words apart
+        doc[-1] = doc[-1] + ' '
+    doc.append('<ins>')
+    if inner and inner[-1].endswith(' '):
+        # The trailing space is emitted after </ins> instead
+        inner[-1] = inner[-1][:-1]
+    doc.extend(inner)
+    doc.append('</ins> ')
+    doc.extend(close_only)
+
+# These are sentinels to represent the start and end of a <del>
+# segment, until we do the cleanup phase to turn them into proper
+# markup:
+class DEL_START:
+    pass  # the class object itself is what merge_delete puts in the chunk list
+class DEL_END:
+    pass  # closing counterpart of DEL_START
+
+class NoDeletes(Exception):
+    """ Raised by split_delete when the document contains no more
+    pending deletes (no DEL_START marker is left) """
+
+def merge_delete(del_chunks, doc):
+    """ Appends DEL_START, the chunks of del_chunks and DEL_END to doc
+    (a list of text chunks); cleanup_delete resolves the markers."""
+    doc.append(DEL_START)
+    for chunk in del_chunks:
+        doc.append(chunk)
+    doc.append(DEL_END)
+
+def cleanup_delete(chunks):
+    """ Resolves every DEL_START/DEL_END marker pair in chunks into a
+    <del>...</del> span and returns the resulting list of chunks.
+
+    To keep the document valid only the balanced part of the deleted
+    markup is wrapped; dangling start or end tags between the markers
+    are dropped.  The span may also be moved into adjacent tags so it
+    sits close to its original location (e.g., into a preceding <div>
+    when the delete looks like (DEL_START, 'Text</div>', DEL_END))."""
+    while True:
+        # Carve the document into the part before the first DEL_START,
+        # the part between the markers, and the part after DEL_END
+        # (which may hold further deletes for later passes).
+        try:
+            before, deleted, after = split_delete(chunks)
+        except NoDeletes:
+            # No markers left: the whole document has been cleaned up
+            break
+        # What sits between the markers need not be well balanced
+        # markup; separate out the dangling start and end tags:
+        dangling_open, inner, dangling_close = split_unbalanced(deleted)
+        # Shift the split point forward and/or backward so that those
+        # dangling tags line up with tags of the surrounding document:
+        locate_unbalanced_start(dangling_open, before, after)
+        locate_unbalanced_end(dangling_close, before, after)
+        if before and not before[-1].endswith(' '):
+            # The preceding word lacks a trailing space; supply one
+            before[-1] += ' '
+        before.append('<del>')
+        if inner and inner[-1].endswith(' '):
+            # The trailing space goes after </del> rather than inside
+            inner[-1] = inner[-1][:-1]
+        before.extend(inner)
+        before.append('</del> ')
+        before.extend(after)
+        # Go round again: the appended tail may still contain markers
+        chunks = before
+    return chunks
+
+def split_unbalanced(chunks):
+    """Return (unbalanced_start, balanced, unbalanced_end), where each is
+    a list of text and tag chunks.
+
+    unbalanced_start is a list of all the tags that are opened, but
+    not closed in this span.  Similarly, unbalanced_end is a list of
+    tags that are closed but were not opened.  Extracting these might
+    mean some reordering of the chunks."""
+    start = []
+    end = []
+    tag_stack = []  # (name, position in balanced, start tag) of open tags
+    balanced = []
+    for chunk in chunks:
+        if not chunk.startswith('<'):
+            balanced.append(chunk)  # plain text always stays in balanced
+            continue
+        endtag = chunk[1] == '/'
+        name = chunk.split()[0].strip('<>/')
+        if name in empty_tags:
+            balanced.append(chunk)  # tags without end tag need no partner
+            continue
+        if endtag:
+            if tag_stack and tag_stack[-1][0] == name:
+                balanced.append(chunk)
+                name, pos, tag = tag_stack.pop()
+                balanced[pos] = tag  # fill the placeholder of the start tag
+            elif tag_stack:
+                start.extend([tag for name, pos, tag in tag_stack])  # mismatch: flush open tags
+                tag_stack = []
+                end.append(chunk)
+            else:
+                end.append(chunk)  # closes a tag that was never opened here
+        else:
+            tag_stack.append((name, len(balanced), chunk))
+            balanced.append(None)  # placeholder, filled in if the tag is closed
+    start.extend(
+        [chunk for name, pos, chunk in tag_stack])  # tags still open at the end
+    balanced = [chunk for chunk in balanced if chunk is not None]
+    return start, balanced, end
+
+def split_delete(chunks):
+    """ Splits chunks around the first DEL_START/DEL_END pair and returns
+    (chunks_before_DEL_START, chunks_between_the_markers,
+    chunks_after_DEL_END); the last part may hold further DEL_STARTs.
+    Raises NoDeletes if chunks contains no DEL_START. """
+    if DEL_START not in chunks:
+        raise NoDeletes
+    start = chunks.index(DEL_START)
+    end = chunks.index(DEL_END)
+    before, inside, after = chunks[:start], chunks[start+1:end], chunks[end+1:]
+    return before, inside, after
+
+def locate_unbalanced_start(unbalanced_start, pre_delete, post_delete):
+    """ pre_delete and post_delete together mark a position in the
+    document (the place where it was split in two).  This function
+    moves that position forward, popping chunks off the front of
+    post_delete and appending them to pre_delete, for as long as the
+    next chunk matches the first remaining tag of unbalanced_start.
+
+    As an example::
+
+        >>> unbalanced_start = ['<div>']
+        >>> doc = ['<p>', 'Text', '</p>', '<div>', 'More Text', '</div>']
+        >>> pre, post = doc[:3], doc[3:]
+        >>> pre, post
+        (['<p>', 'Text', '</p>'], ['<div>', 'More Text', '</div>'])
+        >>> locate_unbalanced_start(unbalanced_start, pre, post)
+        >>> pre, post
+        (['<p>', 'Text', '</p>', '<div>'], ['More Text', '</div>'])
+
+    The dangling <div> is thereby replaced by the <div> that is already
+    in the document.  All three lists are modified in place; tags that
+    cannot be placed are simply left in unbalanced_start.
+    """
+    # Each pass consumes one dangling start tag and one chunk of
+    # post_delete; the loop ends as soon as either runs out or the
+    # next chunk cannot be matched.
+    while unbalanced_start and post_delete:
+        # Name of the first dangling start tag we try to place
+        wanted = unbalanced_start[0].split()[0].strip('<>')
+        candidate = post_delete[0]
+        if candidate is DEL_START or not candidate.startswith('<'):
+            # Reached a pending delete or a word, we can't move the
+            # delete text forward past it
+            return
+        if candidate[1] == '/':
+            # Reached a closing tag; we do not try to go further
+            return
+        tag_name = candidate.split()[0].strip('<>')
+        if tag_name == 'ins':
+            # Can't move into an insert
+            return
+        assert tag_name != 'del', (
+            "Unexpected delete tag: %r" % candidate)
+        if tag_name != wanted:
+            # Found a start tag that doesn't match
+            return
+        # The document opens the same tag right here: let that tag
+        # stand in for the dangling one and step the split point past it
+        unbalanced_start.pop(0)
+        pre_delete.append(post_delete.pop(0))
+
+def locate_unbalanced_end(unbalanced_end, pre_delete, post_delete):
+    """ Counterpart of locate_unbalanced_start for dangling end tags:
+    matching end tags are moved from the tail of pre_delete to the
+    front of post_delete, shifting the split point earlier.  """
+    # Mirror image of locate_unbalanced_start: we walk backwards from
+    # the split point, pairing the last dangling end tag with the
+    # chunk that immediately precedes the delete.
+    while unbalanced_end and pre_delete:
+        # Name of the last dangling end tag we try to place
+        wanted = unbalanced_end[-1].split()[0].strip('<>/')
+        candidate = pre_delete[-1]
+        if candidate is DEL_END or not candidate.startswith('</'):
+            # A pending delete, a word or a start tag: nothing to pair
+            # with here
+            return
+        tag_name = candidate.split()[0].strip('<>/')
+        if tag_name == 'ins' or tag_name == 'del':
+            # Can't move into an insert or delete
+            return
+        if tag_name != wanted:
+            # Found an end tag that doesn't match
+            return
+        # Same end tag right before the split point: consume both
+        unbalanced_end.pop()
+        post_delete.insert(0, pre_delete.pop())
+
+class token(_unicode):
+    """ Represents a diffable token, generally a word that is displayed to
+    the user.  Adjacent opening tags are attached to the token as
+    pre_tags, and the closing tags that follow the word as post_tags.
+    Some exceptions occur when there are empty tags adjacent to a
+    word, so there may be close tags in pre_tags, or open tags in
+    post_tags.
+
+    The whitespace that originally followed the word is kept apart in
+    trailing_whitespace, so that it does not take part in comparing
+    the word with a similar word that has no (or other) trailing
+    whitespace."""
+
+    # When this is true, the token will be eliminated from the
+    # displayed diff if no change has occurred:
+    hide_when_equal = False
+
+    def __new__(cls, text, pre_tags=None, post_tags=None, trailing_whitespace=""):
+        # Everything is set up in __new__ because the base class
+        # (_unicode) takes the text when the object is created.
+        if pre_tags is None:
+            pre_tags = []
+        if post_tags is None:
+            post_tags = []
+
+        inst = _unicode.__new__(cls, text)
+        inst.pre_tags = pre_tags
+        inst.post_tags = post_tags
+        inst.trailing_whitespace = trailing_whitespace
+        return inst
+
+    def __repr__(self):
+        # Shows the text followed by pre_tags, post_tags and whitespace
+        fields = (_unicode.__repr__(self), self.pre_tags,
+                  self.post_tags, self.trailing_whitespace)
+        return 'token(%s, %r, %r, %r)' % fields
+
+    def html(self):
+        # The text of the token converted back to a plain _unicode
+        return _unicode(self)
+
+class tag_token(token):
+
+    """ Represents a token that is actually a tag.  Currently this is just
+    the <img> tag, which takes up visible space just like a word but
+    is only represented in a document by a tag.  """
+
+    def __new__(cls, tag, data, html_repr, pre_tags=None,
+                post_tags=None, trailing_whitespace=""):
+        # The token text is "<tag>: <data>" (fixup_chunks passes 'img' and the src)
+        obj = token.__new__(cls, "%s: %s" % (tag, data),
+                            pre_tags=pre_tags, post_tags=post_tags,
+                            trailing_whitespace=trailing_whitespace)
+        obj.tag = tag
+        obj.data = data
+        obj.html_repr = html_repr
+        return obj
+
+    def __repr__(self):
+        return 'tag_token(%s, %s, html_repr=%s, post_tags=%r, pre_tags=%r, trailing_whitespace=%r)' % (
+            self.tag,
+            self.data,
+            self.html_repr,
+            self.pre_tags,
+            self.post_tags,
+            self.trailing_whitespace)
+    def html(self):
+        return self.html_repr
+
+class href_token(token):
+
+    """ Represents the href in an anchor tag.  Unlike other words, we only
+    show the href when it changes.  """
+
+    hide_when_equal = True  # expand_tokens(equal=True) skips html() for these
+
+    def html(self):
+        return ' Link: %s' % self  # the href text with a ' Link: ' prefix
+
+def tokenize(html, include_hrefs=True):
+    """
+    Parse the given HTML and return a list of token objects (words with
+    their adjacent tags attached).
+
+    html is either a string or an lxml element.  A string goes through
+    parse_html with cleanup: anything in the head is ignored (the
+    <head> and <body> elements are themselves optional) and <ins> and
+    <del> tags are eliminated, as they get confusing in a diff.  The
+    content is then parsed by lxml, which may make incorrect guesses
+    when the markup is particularly bad.  An element is used as it is.
+
+    If include_hrefs is true, then the href attribute of <a> tags is
+    included as a special kind of diffable token.
+    """
+    body_el = html
+    if not etree.iselement(body_el):
+        body_el = parse_html(html, cleanup=True)
+    # Flatten the tree into one chunk per start tag, word and end tag
+    # (the outermost tag itself is skipped):
+    chunks = flatten_el(body_el, skip_tag=True, include_hrefs=include_hrefs)
+    # Then group those chunks into token objects:
+    return fixup_chunks(chunks)
+
+def parse_html(html, cleanup=True):
+    """
+    Parses an HTML fragment and returns it as an lxml element.  The
+    fragment is wrapped in a parent element that was not part of the
+    original document (fragment_fromstring(..., create_parent=True)).
+
+    If cleanup is true, the HTML is first run through cleanup_html
+    (dropping everything outside <body>, and <ins>/<del> tags).
+    """
+    if not cleanup:
+        return fragment_fromstring(html, create_parent=True)
+    return fragment_fromstring(cleanup_html(html), create_parent=True)
+
+_body_re = re.compile(r'<body.*?>', re.IGNORECASE | re.DOTALL)
+_end_body_re = re.compile(r'</body.*?>', re.IGNORECASE | re.DOTALL)
+_ins_del_re = re.compile(r'</?(ins|del).*?>', re.IGNORECASE | re.DOTALL)
+
+def cleanup_html(html):
+    """ 'Cleans' the HTML by removing page structure: when there is a
+    <body> tag only what follows it is kept, and anything from </body>
+    on is cut off.  All <ins> and <del> tags are removed as well.  """
+    body_start = _body_re.search(html)
+    if body_start is not None:
+        html = html[body_start.end():]
+    body_end = _end_body_re.search(html)
+    if body_end is not None:
+        html = html[:body_end.start()]
+    # Only the tags are stripped; the text inside them stays
+    return _ins_del_re.sub('', html)
+    
+
+end_whitespace_re = re.compile(r'[ \t\n\r]$')
+
+def split_trailing_whitespace(word):
+    """
+    Split word into (text, trailing whitespace): 'test\n\n' -> ('test','\n\n')
+    """
+    text = word.rstrip()
+    return text, word[len(text):]
+
+
+def fixup_chunks(chunks):
+    """
+    Turns the chunks (tag/word strings plus 'img'/'href' tuples) into a list of tokens.
+    """
+    tag_accum = []  # tags seen since the last token; they become the next token's pre_tags
+    cur_word = None  # most recent token, receives end tags that follow it
+    result = []
+    for chunk in chunks:
+        if isinstance(chunk, tuple):
+            if chunk[0] == 'img':
+                src = chunk[1]
+                tag, trailing_whitespace = split_trailing_whitespace(chunk[2])
+                cur_word = tag_token('img', src, html_repr=tag,
+                                     pre_tags=tag_accum,
+                                     trailing_whitespace=trailing_whitespace)
+                tag_accum = []  # a fresh list: the old one now belongs to the token
+                result.append(cur_word)
+
+            elif chunk[0] == 'href':
+                href = chunk[1]
+                cur_word = href_token(href, pre_tags=tag_accum, trailing_whitespace=" ")
+                tag_accum = []
+                result.append(cur_word)
+            continue  # tuples of any other kind are ignored
+
+        if is_word(chunk):
+            chunk, trailing_whitespace = split_trailing_whitespace(chunk)
+            cur_word = token(chunk, pre_tags=tag_accum, trailing_whitespace=trailing_whitespace)
+            tag_accum = []
+            result.append(cur_word)
+
+        elif is_start_tag(chunk):
+            tag_accum.append(chunk)
+
+        elif is_end_tag(chunk):
+            if tag_accum:
+                tag_accum.append(chunk)  # closes a pending start tag: stays with the pre_tags
+            else:
+                assert cur_word, (
+                    "Weird state, cur_word=%r, result=%r, chunks=%r of %r"
+                    % (cur_word, result, chunk, chunks))
+                cur_word.post_tags.append(chunk)
+        else:
+            assert(0)
+
+    if not result:
+        return [token('', pre_tags=tag_accum)]  # tags only: carry them on one empty token
+    else:
+        result[-1].post_tags.extend(tag_accum)  # leftover tags go after the last token
+
+    return result
+
+
+# All the tags in HTML that don't require end tags:
+empty_tags = (
+    'param', 'img', 'area', 'br', 'basefont', 'input',
+    'base', 'meta', 'link', 'col')
+
+block_level_tags = (  # tested by _contains_block_level_tag
+    'address',
+    'blockquote',
+    'center',
+    'dir',
+    'div',
+    'dl',
+    'fieldset',
+    'form',
+    'h1',
+    'h2',
+    'h3',
+    'h4',
+    'h5',
+    'h6',
+    'hr',
+    'isindex',
+    'menu',
+    'noframes',
+    'noscript',
+    'ol',
+    'p',
+    'pre',
+    'table',
+    'ul',
+    )
+
+block_level_container_tags = (  # also counted as block-level by _contains_block_level_tag
+    'dd',
+    'dt',
+    'frameset',
+    'li',
+    'tbody',
+    'td',
+    'tfoot',
+    'th',
+    'thead',
+    'tr',
+    )
+
+
+def flatten_el(el, include_hrefs, skip_tag=False):
+    """ Generates the chunks for the lxml element el and everything
+    below it: one chunk per start tag, per word and per end tag.  An
+    <img> start tag is yielded as an ('img', src, tag) tuple and, when
+    include_hrefs is true, an <a href> adds an ('href', href) tuple.
+
+    If skip_tag is true, el's own tags and tail are left out."""
+    emit_tag = not skip_tag
+    if emit_tag:
+        if el.tag != 'img':
+            yield start_tag(el)
+        else:
+            yield ('img', el.get('src'), start_tag(el))
+    if el.tag in empty_tags:
+        if not (el.text or len(el) or el.tail):
+            return
+    for word in split_words(el.text):
+        yield html_escape(word)
+    for child in el:
+        for item in flatten_el(child, include_hrefs=include_hrefs):
+            yield item
+    if include_hrefs and el.tag == 'a' and el.get('href'):
+        yield ('href', el.get('href'))
+    if emit_tag:
+        yield end_tag(el)
+        for word in split_words(el.tail):
+            yield html_escape(word)
+
+split_words_re = re.compile(r'\S+(?:\s+|$)', re.UNICODE)
+
+def split_words(text):
+    """ Splits text into a list of words, each one keeping the
+    whitespace that follows it.  Empty, None or whitespace-only
+    text gives an empty list.  """
+    if text and text.strip():
+        return split_words_re.findall(text)
+
+    return []
+
+start_whitespace_re = re.compile(r'^[ \t\n\r]')
+
+def start_tag(el):
+    """ The text of the start tag for el, with each of its attributes
+    rendered as name="value" (values passed through html_escape).  """
+    attrs = []
+    for name, value in el.attrib.items():
+        attrs.append(' %s="%s"' % (name, html_escape(value, True)))
+    return '<%s%s>' % (el.tag, ''.join(attrs))
+
+def end_tag(el):
+    """ The text of the end tag for el.  A single space is appended
+    when el's tail starts with whitespace (space, tab, newline, CR).  """
+    extra = ''
+    tail = el.tail
+    if tail and start_whitespace_re.search(tail):
+        extra = ' '
+    return '</%s>%s' % (el.tag, extra)
+
+def is_word(tok):  # anything that does not begin with '<' counts as a word
+    return tok[:1] != '<'
+
+def is_end_tag(tok):  # end tags begin with '</'
+    return tok[:2] == '</'
+
+def is_start_tag(tok):  # begins with '<' but not with '</'
+    return tok[:1] == '<' and tok[:2] != '</'
+
+def fixup_ins_del_tags(html):
+    """ Takes an html string and returns it with <ins> and <del> tags
+    that wrap block-level elements moved inside those elements, e.g.
+    <ins><p>word</p></ins> becomes <p><ins>word</ins></p>.  The string
+    is parsed without cleanup and re-serialized. """
+    tree = parse_html(html, cleanup=False)
+    _fixup_ins_del_tags(tree)
+    return serialize_html_fragment(tree, skip_outer=True)
+
+def serialize_html_fragment(el, skip_outer=False):
+    """ Serializes a single lxml element as HTML; the serialized form
+    includes the element's tail.
+
+    If skip_outer is true, the outermost start and end tags are cut
+    off and the remaining text is stripped of surrounding whitespace."""
+    assert not isinstance(el, basestring), (
+        "You should pass in an element, not a string like %r" % el)
+    html = etree.tostring(el, method="html", encoding=_unicode)
+    if not skip_outer:
+        return html
+    # Drop everything up to and including the first '>' (the outer
+    # start tag) ...
+    html = html[html.find('>')+1:]
+    # ... and everything from the last '<' on (the outer end tag)
+    html = html[:html.rfind('<')]
+    return html.strip()
+
+def _fixup_ins_del_tags(doc):
+    """In-place version of fixup_ins_del_tags for an lxml document: every
+    <ins>/<del> that contains a block-level tag is pushed inside the
+    blocks and the original wrapper tag is then dropped."""
+    for tag in ('ins', 'del'):
+        matches = doc.xpath('descendant-or-self::%s' % tag)
+        for el in matches:
+            if _contains_block_level_tag(el):
+                _move_el_inside_block(el, tag=tag)
+                el.drop_tag()
+
+def _contains_block_level_tag(el):
+    """True if el, or anything below it, is a block-level tag like <p> or <td>."""
+    for tags in (block_level_tags, block_level_container_tags):
+        if el.tag in tags:
+            return True
+    for child in el:
+        if _contains_block_level_tag(child):
+            return True
+    return False
+
+def _move_el_inside_block(el, tag):
+    """ helper for _fixup_ins_del_tags; wraps the content of el in new
+    <tag> elements placed inside any block-level tags.  Modifies el in place. """
+    for child in el:
+        if _contains_block_level_tag(child):
+            break
+    else:
+        # No block-level tags in any child: wrap the whole content
+        # (text and children) in a single new <tag> element
+        children_tag = etree.Element(tag)
+        children_tag.text = el.text
+        el.text = None
+        children_tag.extend(list(el))
+        el[:] = [children_tag]
+        return
+    for child in list(el):  # iterate over a copy: el is modified in the loop
+        if _contains_block_level_tag(child):
+            _move_el_inside_block(child, tag)
+            if child.tail:
+                # Text following the block child gets its own wrapper
+                tail_tag = etree.Element(tag)
+                tail_tag.text = child.tail
+                child.tail = None
+                el.insert(el.index(child)+1, tail_tag)
+        else:
+            child_tag = etree.Element(tag)
+            el.replace(child, child_tag)
+            child_tag.append(child)
+    if el.text:
+        text_tag = etree.Element(tag)
+        text_tag.text = el.text
+        el.text = None
+        el.insert(0, text_tag)
+            
+def _merge_element_contents(el):
+    """
+    Removes an element, but merges its contents into its place, e.g.,
+    given <p>Hi <i>there!</i></p>, if you remove the <i> element you get
+    <p>Hi there!</p>
+    """
+    parent = el.getparent()
+    text = el.text or ''
+    if el.tail:
+        if not len(el):
+            text += el.tail  # no children: the tail simply follows el's text
+        else:
+            if el[-1].tail:  # otherwise the tail goes after el's last child
+                el[-1].tail += el.tail
+            else:
+                el[-1].tail = el.tail
+    index = parent.index(el)
+    if text:
+        if index == 0:
+            previous = None
+        else:
+            previous = parent[index-1]
+        if previous is None:
+            if parent.text:  # el is the first child: text joins the parent's text
+                parent.text += text
+            else:
+                parent.text = text
+        else:
+            if previous.tail:  # else it joins the tail of the preceding sibling
+                previous.tail += text
+            else:
+                previous.tail = text
+    parent[index:index+1] = el.getchildren()  # el's children take el's place
+
+class InsensitiveSequenceMatcher(difflib.SequenceMatcher):
+    """
+    Acts like SequenceMatcher, but tries not to find very small equal
+    blocks amidst large spans of changes
+    """
+
+    threshold = 2  # equal blocks of at most this many items are dropped
+
+    def get_matching_blocks(self):
+        # The threshold is scaled down for short inputs (shorter of a and b)
+        size = min(len(self.a), len(self.b))
+        threshold = min(self.threshold, size / 4)
+        actual = difflib.SequenceMatcher.get_matching_blocks(self)
+        # Zero-length blocks are kept: difflib ends the list with one
+        return [item for item in actual if item[2] > threshold or not item[2]]
+
+if __name__ == '__main__':
+    from lxml.html import _diffcommand  # imported only when run as a script
+    _diffcommand.main()
+    
diff --git a/lib/lxml/html/formfill.py b/lib/lxml/html/formfill.py
new file mode 100644
index 00000000..61f0f076
--- /dev/null
+++ b/lib/lxml/html/formfill.py
@@ -0,0 +1,299 @@
+from lxml.etree import XPath, ElementBase
+from lxml.html import fromstring, tostring, XHTML_NAMESPACE
+from lxml.html import _forms_xpath, _options_xpath, _nons, _transform_result
+from lxml.html import defs
+import copy
+
+try:
+    basestring
+except NameError:
+    # Python 3
+    basestring = str
+
+__all__ = ['FormNotFound', 'fill_form', 'fill_form_html',
+           'insert_errors', 'insert_errors_html',
+           'DefaultErrorCreator']
+
+class FormNotFound(LookupError):
+    """
+    Raised by _find_form when no form matches the given id, name or index
+    """
+
+_form_name_xpath = XPath('descendant-or-self::form[@name=$name]|descendant-or-self::x:form[@name=$name]', namespaces={'x':XHTML_NAMESPACE})  # forms whose name attribute is $name
+_input_xpath = XPath('|'.join(['descendant-or-self::'+_tag for _tag in ('input','select','textarea','x:input','x:select','x:textarea')]),
+                               namespaces={'x':XHTML_NAMESPACE})  # form controls, plain or XHTML-namespaced
+_label_for_xpath = XPath('//label[@for=$for_id]|//x:label[@for=$for_id]',
+                               namespaces={'x':XHTML_NAMESPACE})  # labels whose for attribute is $for_id
+_name_xpath = XPath('descendant-or-self::*[@name=$name]')  # any element with that name attribute
+
+def fill_form(el, values, form_id=None, form_index=None):
+    """
+    Locate a form under el (by form_id, by form_index, or the first
+    form when neither is given) and fill its inputs from values.
+    The element tree is modified in place.
+    """
+    form = _find_form(el, form_id=form_id, form_index=form_index)
+    _fill_form(form, values)
+
+def fill_form_html(html, values, form_id=None, form_index=None):
+    # Fill a parsed copy and hand it back via _transform_result
+    if not isinstance(html, basestring):
+        doc = copy.deepcopy(html)
+    else:
+        doc = fromstring(html)
+    fill_form(doc, values, form_id=form_id, form_index=form_index)
+    return _transform_result(type(html), doc)
+
+def _fill_form(el, values):
+    # seen[name]: how many single-valued inputs of that name came before
+    seen = {}
+    if hasattr(values, 'mixed'):
+        # For Paste request parameters
+        values = values.mixed()
+    for field in _input_xpath(el):
+        name = field.get('name')
+        if not name:
+            continue
+        if _takes_multiple(field):
+            selected = values.get(name, [])
+            if not isinstance(selected, (list, tuple)):
+                selected = [selected]
+            _fill_multiple(field, selected)
+            continue
+        if name not in values:
+            continue
+        position = seen.get(name, 0)
+        seen[name] = position + 1
+        value = values[name]
+        if isinstance(value, (list, tuple)):
+            try:
+                value = value[position]
+            except IndexError:
+                continue
+        elif position > 0:
+            continue
+        _fill_single(field, value)
+
+def _takes_multiple(input):
+    # True for <select> elements with a 'multiple' attribute and for
+    # radio/checkbox inputs, which are all filled by _fill_multiple
+    if _nons(input.tag) == 'select' and input.get('multiple'):
+        # FIXME: multiple="0"?
+        return True
+    input_type = input.get('type', '').lower()
+    return input_type in ('radio', 'checkbox')
+
+def _fill_multiple(input, value):
+    # Checks/selects input according to value, the list (or tuple) of
+    # values that _fill_form found for the input's name.
+    input_type = input.get('type', '').lower()
+    if input_type == 'checkbox':
+        v = input.get('value')
+        if v is None:
+            result = False
+            if value:
+                result = value[0]
+                if isinstance(result, basestring):
+                    # The only valid "on" value for an unnamed checkbox is 'on'
+                    result = result == 'on'
+            _check(input, result)
+        else:
+            _check(input, v in value)
+    elif input_type == 'radio':
+        v = input.get('value')
+        _check(input, v in value)
+    else:
+        assert _nons(input.tag) == 'select'
+        for option in _options_xpath(input):
+            v = option.get('value')
+            if v is None:
+                # This seems to be the default, at least on IE (FIXME: not sure)
+                v = option.text_content()
+            _select(option, v in value)
+
+def _check(el, check):
+    # Sets the 'checked' attribute when check is true, removes it otherwise
+    if check:
+        el.set('checked', '')
+    elif 'checked' in el.attrib:
+        del el.attrib['checked']
+
+def _select(el, select):
+    # Sets the 'selected' attribute when select is true, removes it otherwise
+    if select:
+        el.set('selected', '')
+    elif 'selected' in el.attrib:
+        del el.attrib['selected']
+
+def _fill_single(input, value):
+    if _nons(input.tag) != 'textarea':
+        input.set('value', value)
+    else:
+        input.text = value
+
+def _find_form(el, form_id=None, form_index=None):
+    # Returns the form chosen by form_id (id, then name), form_index, or the first form
+    if form_id is None and form_index is None:
+        forms = _forms_xpath(el)
+        for form in forms:
+            return form
+        raise FormNotFound("No forms in page")
+    if form_id is not None:
+        # None default: otherwise an unknown id raises KeyError before the name lookup
+        form = el.get_element_by_id(form_id, None)
+        if form is not None:
+            return form
+        forms = _form_name_xpath(el, name=form_id)
+        if forms:
+            return forms[0]
+        raise FormNotFound(
+            "No form with the name or id of %r (forms: %s)"
+            % (form_id, ', '.join(_find_form_ids(el))))
+    if form_index is not None:
+        forms = _forms_xpath(el)
+        try:
+            return forms[form_index]
+        except IndexError:
+            raise FormNotFound(
+                "There is no form with the index %r (%i forms found)"
+                % (form_index, len(forms)))
+
+def _find_form_ids(el):
+    # Yields one label per form in el (used in _find_form's error message)
+    forms = _forms_xpath(el)
+    if not forms:
+        yield '(no forms)'
+        return
+    for index, form in enumerate(forms):
+        form_id, form_name = form.get('id'), form.get('name')
+        if form_id and form_name:
+            yield '%s or %s' % (form_id, form_name)
+        elif form_id:
+            yield form_id
+        elif form_name:
+            yield form_name
+        else:
+            yield '(unnamed form %s)' % index
+
+############################################################
+## Error filling
+############################################################
+
+class DefaultErrorCreator(object):
+    insert_before = True  # put the error before (True) or after (False) the element/content
+    block_inside = True  # for block elements, insert the error inside the element
+    error_container_tag = 'div'  # tag of the element created for the message
+    error_message_class = 'error-message'  # class set on every error element
+    error_block_class = 'error-block'  # extra class when is_block is true
+    default_message = "Invalid"  # used when the message is None or ''
+
+    def __init__(self, **kw):
+        for name, value in kw.items():
+            if not hasattr(self, name):  # only the class-level options may be overridden
+                raise TypeError(
+                    "Unexpected keyword argument: %s" % name)
+            setattr(self, name, value)
+
+    def __call__(self, el, is_block, message):
+        error_el = el.makeelement(self.error_container_tag)
+        if self.error_message_class:
+            error_el.set('class', self.error_message_class)
+        if is_block and self.error_block_class:
+            error_el.set('class', error_el.get('class', '')+' '+self.error_block_class)
+        if message is None or message == '':
+            message = self.default_message
+        if isinstance(message, ElementBase):
+            error_el.append(message)  # an element is inserted as a child
+        else:
+            assert isinstance(message, basestring), (
+                "Bad message; should be a string or element: %r" % message)
+            error_el.text = message or self.default_message
+        if is_block and self.block_inside:
+            if self.insert_before:
+                error_el.tail = el.text  # el's leading text now follows the error
+                el.text = None
+                el.insert(0, error_el)
+            else:
+                el.append(error_el)
+        else:
+            parent = el.getparent()
+            pos = parent.index(el)
+            if self.insert_before:
+                parent.insert(pos, error_el)
+            else:
+                error_el.tail = el.tail  # keep el's tail text after the error
+                el.tail = None
+                parent.insert(pos+1, error_el)
+
+default_error_creator = DefaultErrorCreator()  # default error_creator of insert_errors
+    
+
+def insert_errors(el, errors, form_id=None, form_index=None,
+                  error_class="error", error_creator=default_error_creator):
+    """
+    Inserts error messages into the form found in el (see _find_form).
+
+    errors maps a field name (or '#id', or None for the whole form) to a
+    message or a list of messages; entries whose error is None are
+    skipped.  Each message is placed by error_creator.
+    """
+    form = _find_form(el, form_id=form_id, form_index=form_index)
+    for name, error in errors.items():
+        if error is not None:
+            for error_el, message in _find_elements_for_name(form, name, error):
+                assert isinstance(message, (basestring, type(None), ElementBase)), (
+                    "Bad message: %r" % message)
+                _insert_error(error_el, message, error_class, error_creator)
+
+def insert_errors_html(html, values, **kw):
+    # Same as insert_errors, but on a parsed copy of html
+    if not isinstance(html, basestring):
+        doc = copy.deepcopy(html)
+    else:
+        doc = fromstring(html)
+    insert_errors(doc, values, **kw)
+    return _transform_result(type(html), doc)
+
+def _insert_error(el, error, error_class, error_creator):
+    # Marks el (and any <label for=...> pointing at it) with error_class,
+    # then lets error_creator insert the message itself
+    tag = _nons(el.tag)
+    is_block = not (tag in defs.empty_tags or tag == 'textarea')
+    if tag != 'form' and error_class:
+        _add_class(el, error_class)
+    el_id = el.get('id')
+    if el_id:
+        # An empty result simply means there is no label to mark
+        for label in _label_for_xpath(el, for_id=el_id):
+            _add_class(label, error_class)
+    error_creator(el, is_block, error)
+
+def _add_class(el, class_name):
+    existing = el.get('class')
+    if existing:
+        class_name = existing + ' ' + class_name
+    el.set('class', class_name)
+
+def _find_elements_for_name(form, name, error):
+    # Yields (element, message) pairs for the error(s) registered under name
+    if name is None:
+        # An error for the entire form
+        yield form, error
+        return
+    if name.startswith('#'):
+        # By id; the None default avoids a KeyError for an unknown id
+        el = form.get_element_by_id(name[1:], None)
+        if el is not None:
+            yield el, error
+        return
+    els = _name_xpath(form, name=name)
+    if not els:
+        # FIXME: should this raise an exception?
+        return
+    if not isinstance(error, (list, tuple)):
+        yield els[0], error
+        return
+    # FIXME: if error is longer than els, should it raise an error?
+    for el, err in zip(els, error):
+        if err is not None:
+            yield el, err
diff --git a/lib/lxml/html/html5parser.py b/lib/lxml/html/html5parser.py
new file mode 100644
index 00000000..7188c7ea
--- /dev/null
+++ b/lib/lxml/html/html5parser.py
@@ -0,0 +1,207 @@
+"""
+An interface to html5lib that mimics the lxml.html interface.
+"""
+
+import sys
+import string
+
+from html5lib import HTMLParser as _HTMLParser
+from html5lib.treebuilders.etree_lxml import TreeBuilder
+
+from lxml import etree
+from lxml.html import _contains_block_level_tag, XHTML_NAMESPACE, Element
+
+# python3 compatibility
+try:
+    _strings = basestring
+except NameError:
+    _strings = (bytes, str)
+try:
+    from urllib2 import urlopen
+except ImportError:
+    from urllib.request import urlopen
+try:
+    from urlparse import urlparse
+except ImportError:
+    from urllib.parse import urlparse
+
+class HTMLParser(_HTMLParser):
+    """An html5lib HTML parser using the ``etree_lxml`` TreeBuilder as tree."""
+
+    def __init__(self, strict=False, **kwargs):
+        _HTMLParser.__init__(self, strict=strict, tree=TreeBuilder, **kwargs)
+
+
+try:
+    from html5lib import XHTMLParser as _XHTMLParser
+except ImportError:
+    pass  # this html5lib has no XHTMLParser: the XHTML names stay undefined
+else:
+    class XHTMLParser(_XHTMLParser):
+        """An html5lib XHTML Parser with lxml as tree."""
+
+        def __init__(self, strict=False, **kwargs):
+            _XHTMLParser.__init__(self, strict=strict, tree=TreeBuilder, **kwargs)
+
+    xhtml_parser = XHTMLParser()  # module-level instance, built at import time
+
+
+def _find_tag(tree, tag):
+    """Find ``tag`` under ``tree``, plain first, then in the XHTML namespace."""
+    plain = tree.find(tag)
+    # Only fall back to the namespaced lookup when the plain one found nothing.
+    return plain if plain is not None else tree.find('{%s}%s' % (XHTML_NAMESPACE, tag))
+
+
+def document_fromstring(html, guess_charset=True, parser=None):
+    """Parse a whole document from a string and return its root element."""
+    if not isinstance(html, _strings):
+        raise TypeError('string required')
+
+    # Fall back to the module-level html5lib parser when none is given.
+    active_parser = html_parser if parser is None else parser
+    tree = active_parser.parse(html, useChardet=guess_charset)
+    return tree.getroot()
+
+
+def fragments_fromstring(html, no_leading_text=False,
+                         guess_charset=False, parser=None):
+    """Parse a string holding several HTML elements into a list.
+
+    The fragment is parsed in the context of a ``div``.  The first list
+    item may be a string of leading text.  With ``no_leading_text`` set,
+    non-whitespace leading text raises ``etree.ParserError`` and a
+    whitespace-only string is dropped, so only elements are returned.
+
+    ``guess_charset`` is handed to html5lib as ``useChardet``; ``parser``
+    defaults to the module-level ``html_parser``.
+    """
+    if not isinstance(html, _strings):
+        raise TypeError('string required')
+
+    fragment_parser = html_parser if parser is None else parser
+    nodes = fragment_parser.parseFragment(
+        html, 'div', useChardet=guess_charset)
+
+    has_leading_text = bool(nodes) and isinstance(nodes[0], _strings)
+    if has_leading_text and no_leading_text:
+        leading = nodes[0]
+        if leading.strip():
+            raise etree.ParserError('There is leading text: %r' % leading)
+        del nodes[0]
+    return nodes
+
+
+def fragment_fromstring(html, create_parent=False,
+                        guess_charset=False, parser=None):
+    """Parse a string that holds exactly one HTML element.
+
+    Without ``create_parent`` it is an error (``etree.ParserError``) if
+    there is no element, more than one element, or non-whitespace text
+    before or after the element; the element's tail is cleared.
+
+    If ``create_parent`` is true, or is a tag name, the parsed content is
+    wrapped in a new parent element (a ``div`` unless a name is given);
+    leading and trailing text is allowed in that case.
+    """
+    if not isinstance(html, _strings):
+        raise TypeError('string required')
+
+    wrap = bool(create_parent)
+    parsed = fragments_fromstring(
+        html, guess_charset=guess_charset, parser=parser,
+        no_leading_text=not wrap)
+
+    if not wrap:
+        if not parsed:
+            raise etree.ParserError('No elements found')
+        if len(parsed) > 1:
+            raise etree.ParserError('Multiple elements found')
+        only = parsed[0]
+        trailing = only.tail
+        if trailing and trailing.strip():
+            raise etree.ParserError('Element followed by text: %r' % trailing)
+        only.tail = None
+        return only
+
+    # Anything that is not a string (e.g. ``True``) selects the default tag.
+    parent_tag = create_parent if isinstance(create_parent, _strings) else 'div'
+    container = Element(parent_tag)
+    if parsed and isinstance(parsed[0], _strings):
+        container.text = parsed.pop(0)  # leading text goes on the new parent
+    container.extend(parsed)
+    return container
+
+
+def fromstring(html, guess_charset=True, parser=None):
+    """Parse the html, returning a single element/document.
+
+    This tries to minimally parse the chunk of text, without knowing if it
+    is a fragment or a document.  Byte strings are accepted as well as
+    text; ``guess_charset`` and ``parser`` are passed on to
+    ``document_fromstring``.
+    """
+    if not isinstance(html, _strings):
+        raise TypeError('string required')
+    doc = document_fromstring(html, parser=parser,
+                              guess_charset=guess_charset)
+
+    # document starts with doctype or <html>, full document!
+    start = html[:50]
+    if isinstance(start, bytes):
+        # bytes.startswith() rejects text prefixes on Python 3; the markers
+        # tested below are plain ASCII, so a lossy decode is good enough.
+        start = start.decode('ascii', 'replace')
+    if start.lstrip().lower().startswith(('<html', '<!doctype')):
+        return doc
+
+    head = _find_tag(doc, 'head')
+    # if the head is not empty we have a full document
+    if len(head):
+        return doc
+
+    body = _find_tag(doc, 'body')
+
+    # The body has just one element, so it was probably a single
+    # element passed in
+    if (len(body) == 1 and (not body.text or not body.text.strip())
+        and (not body[-1].tail or not body[-1].tail.strip())):
+        return body[0]
+
+    # Now we have a body which represents a bunch of tags which have the
+    # content that was passed in.  We will create a fake container, which
+    # is the body tag, except <body> implies too much structure.
+    body.tag = 'div' if _contains_block_level_tag(body) else 'span'
+    return body
+
+
+def parse(filename_url_or_file, guess_charset=True, parser=None):
+    """Parse a filename, URL, or file-like object into an HTML document
+    tree.  Note: this returns a tree, not an element.  Use
+    ``parse(...).getroot()`` to get the document root.  A file or URL opened
+    here is closed again; a file object passed in is left open."""
+    parser = html_parser if parser is None else parser
+    if not isinstance(filename_url_or_file, _strings):
+        return parser.parse(filename_url_or_file, useChardet=guess_charset)
+    is_url = _looks_like_url(filename_url_or_file)
+    fp = urlopen(filename_url_or_file) if is_url else open(filename_url_or_file, 'rb')
+    try:
+        return parser.parse(fp, useChardet=guess_charset)
+    finally:
+        fp.close()
+
+
+def _looks_like_url(str):
+    """Tell whether ``str`` should be fetched as a URL instead of opened
+    as a local file, judging by the scheme ``urlparse`` finds in it."""
+    scheme = urlparse(str)[0]
+    # On Windows a single-letter "scheme" is treated as the drive of a
+    # 'normal' absolute path, not as a URL scheme.
+    is_drive_letter = (sys.platform == 'win32' and
+            scheme in string.ascii_letters
+            and len(scheme) == 1)
+    # An empty scheme never counts as a URL.
+    return bool(scheme) and not is_drive_letter
+
+
+html_parser = HTMLParser()  # default parser, used whenever ``parser`` is None
diff --git a/lib/lxml/html/soupparser.py b/lib/lxml/html/soupparser.py
new file mode 100644
index 00000000..bfb9fdfc
--- /dev/null
+++ b/lib/lxml/html/soupparser.py
@@ -0,0 +1,125 @@
+__doc__ = """External interface to the BeautifulSoup HTML parser.
+"""
+
+__all__ = ["fromstring", "parse", "convert_tree"]
+
+from lxml import etree, html
+from BeautifulSoup import \
+     BeautifulSoup, Tag, Comment, ProcessingInstruction, NavigableString
+
+
+def fromstring(data, beautifulsoup=None, makeelement=None, **bsargs):
+    """Parse a string of HTML data into an Element tree using the
+    BeautifulSoup parser.
+
+    Returns the root ``<html>`` Element of the tree.
+
+    You can pass a different BeautifulSoup parser through the
+    `beautifulsoup` keyword, and a different Element factory function
+    through the `makeelement` keyword.  By default, the standard
+    ``BeautifulSoup`` class and the default factory of `lxml.html` are
+    used.  Remaining keyword arguments go to the BeautifulSoup parser.
+    """
+    return _parse(data, beautifulsoup, makeelement, **bsargs)
+
+def parse(file, beautifulsoup=None, makeelement=None, **bsargs):
+    """Parse a file into an ElementTree using the BeautifulSoup parser.
+
+    ``file`` is a file-like object or a file name (opened and closed here);
+    `beautifulsoup` and `makeelement` override the parser class and factory.
+    """
+    if hasattr(file, 'read'):
+        return etree.ElementTree(_parse(file, beautifulsoup, makeelement, **bsargs))
+    stream = open(file)
+    try:
+        return etree.ElementTree(_parse(stream, beautifulsoup, makeelement, **bsargs))
+    finally:
+        stream.close()
+
+def convert_tree(beautiful_soup_tree, makeelement=None):
+    """Convert a BeautifulSoup tree to a list of Element trees.
+
+    A list is returned rather than a single root Element so that
+    HTML-like soup with more than one root element is supported.
+
+    A different Element factory can be passed through the `makeelement`
+    keyword; the default is the factory of `lxml.html`.
+    """
+    factory = html.html_parser.makeelement if makeelement is None else makeelement
+    container = _convert_tree(beautiful_soup_tree, factory)
+    top_level = container.getchildren()
+    # Detach every child from the temporary root before handing them back.
+    for element in top_level:
+        container.remove(element)
+    return top_level
+
+
+# helpers
+
+def _parse(source, beautifulsoup, makeelement, **bsargs):
+    """Parse ``source`` with BeautifulSoup and return an ``html`` root Element."""
+    soup_class = BeautifulSoup if beautifulsoup is None else beautifulsoup
+    factory = html.html_parser.makeelement if makeelement is None else makeelement
+    # Default ``convertEntities`` to 'html' unless the caller passed a value.
+    bsargs.setdefault('convertEntities', 'html')
+    converted = _convert_tree(soup_class(source, **bsargs), factory)
+    # from ET: wrap the document in a html root element, if necessary
+    only_child_is_html = len(converted) == 1 and converted[0].tag == "html"
+    if only_child_is_html:
+        return converted[0]
+    # Otherwise the converted top-level element itself becomes the root.
+    converted.tag = "html"
+    return converted
+
+def _convert_tree(beautiful_soup_tree, makeelement):
+    """Build the root Element for a soup tree, then convert its children."""
+    top = makeelement(beautiful_soup_tree.name, attrib=dict(beautiful_soup_tree.attrs))
+    _convert_children(top, beautiful_soup_tree, makeelement)
+    return top
+
+def _convert_children(parent, beautiful_soup_tree, makeelement):
+    """Append converted children of a soup node to ``parent``, text in order."""
+    et_child = None  # node appended last; text that follows becomes its tail
+    for child in beautiful_soup_tree:
+        if isinstance(child, Tag):
+            et_child = etree.SubElement(parent, child.name, attrib=dict(
+                [(k, unescape(v)) for (k, v) in child.attrs]))
+            _convert_children(et_child, child, makeelement)
+        elif isinstance(child, (Comment, ProcessingInstruction)):
+            # Remember these nodes as well: otherwise the text after a comment
+            # or PI would be attached in front of it.
+            if isinstance(child, Comment):
+                et_child = etree.Comment(child)
+            else:
+                et_child = etree.ProcessingInstruction(*child.split(' ', 1))
+            parent.append(et_child)
+        else:  # plain NavigableString, CData, ...
+            _append_text(parent, et_child, unescape(child))
+
+def _append_text(parent, element, text):
+    """Add ``text`` to ``element``'s tail, or to ``parent``'s text if None."""
+    target, slot = (parent, 'text') if element is None else (element, 'tail')
+    # A missing (None) value counts as '' so repeated calls accumulate.
+    setattr(target, slot, (getattr(target, slot) or '') + text)
+
+
+# copied from ET's ElementSoup
+
+try:
+    from html.entities import name2codepoint # Python 3
+except ImportError:
+    from htmlentitydefs import name2codepoint
+import re
+
+handle_entities = re.compile(r"&(\w+);").sub
+
+def unescape(string):
+    """Resolve named entities in ``string`` (works around BeautifulSoup oddities)."""
+    if not string:
+        return ''
+    # unichr() only exists on Python 2; Python 3's chr() takes any code point.
+    to_char = unichr if str is bytes else chr
+    def unescape_entity(m):
+        code = name2codepoint.get(m.group(1))
+        return m.group(0) if code is None else to_char(code)  # unknown: as is
+    return handle_entities(unescape_entity, string)
diff --git a/lib/lxml/html/tests/__init__.py b/lib/lxml/html/tests/__init__.py
new file mode 100644
index 00000000..792d6005
--- /dev/null
+++ b/lib/lxml/html/tests/__init__.py
@@ -0,0 +1 @@
+#
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_applet.data b/lib/lxml/html/tests/feedparser-data/entry_content_applet.data
new file mode 100644
index 00000000..91e7f6ce
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_applet.data
@@ -0,0 +1,7 @@
+Description: entry content contains applet
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe <b>description</b>'
+Options: 
+
+<div>safe<applet code="foo.class" codebase="http://example.com/"></applet> <b>description</b></div>
+----------
+<div>safe <b>description</b></div>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_blink.data b/lib/lxml/html/tests/feedparser-data/entry_content_blink.data
new file mode 100644
index 00000000..de84a8d6
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_blink.data
@@ -0,0 +1,8 @@
+Description: entry content contains blink
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe description'
+Options: 
+Notes: <div> wrapper
+
+<div><blink>safe</blink> description</div>
+----------
+<div>safe description</div>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_crazy.data b/lib/lxml/html/tests/feedparser-data/entry_content_crazy.data
new file mode 100644
index 00000000..9ca77259
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_crazy.data
@@ -0,0 +1,84 @@
+Description: entry content is crazy
+Expect: not bozo and entries[0]['content'][0]['value'] == u'Crazy HTML -' + u'- Can Your Regex Parse This?\n\n\n\n<!-' + u'- <script> -' + u'->\n\n<!-' + u'- \n\t<script> \n-' + u'->\n\n\n\nfunction executeMe()\n{\n\n\n\n\n/* \n<h1>Did The Javascript Execute?</h1>\n<div>\nI will execute here, too, if you mouse over me\n</div>'
+Options: -page_structure
+Notes: for some reason the comments in the expected field are acting weird
+
+
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head>
+<title>Crazy HTML -- Can Your Regex Parse This?</title>
+
+</head>
+<body    notRealAttribute="value"onload="executeMe();"foo="bar"
+
+>
+<!-- <script> -->
+
+<!-- 
+	<script> 
+-->
+
+</script>
+
+
+<script
+
+
+>
+
+function executeMe()
+{
+
+
+
+
+/* <script> 
+function am_i_javascript()
+{
+	var str = "Some innocuously commented out stuff";
+}
+< /script>
+*/
+
+	
+	
+	
+	
+	
+	
+	
+	
+	alert("Executed");
+}
+
+                                   </script
+
+
+
+>
+<h1>Did The Javascript Execute?</h1>
+<div notRealAttribute="value
+"onmouseover="
+executeMe();
+"foo="bar">
+I will execute here, too, if you mouse over me
+</div>
+
+</body>
+
+</html>
+
+----------
+<html>
+ <head>
+  <title>Crazy HTML -- Can Your Regex Parse This?</title>
+ </head>
+ <body>
+<h1>Did The Javascript Execute?</h1>
+<div>
+I will execute here, too, if you mouse over me
+</div>
+ </body>
+</html>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_embed.data b/lib/lxml/html/tests/feedparser-data/entry_content_embed.data
new file mode 100644
index 00000000..94e1e34a
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_embed.data
@@ -0,0 +1,8 @@
+Description: entry content contains embed
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe <b>description</b>'
+Options: 
+Notes: <div> wrapper, close <embed> tag (not closing it lost the <b> tag)
+
+<div>safe<embed src="http://example.com/"></embed> <b>description</b></div>
+----------
+<div>safe <b>description</b></div>
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_frame.data b/lib/lxml/html/tests/feedparser-data/entry_content_frame.data
new file mode 100644
index 00000000..e87b9c40
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_frame.data
@@ -0,0 +1,7 @@
+Description: entry content contains frameset
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe <b>description</b>'
+Options: 
+
+<div>safe<frameset rows="*"><frame src="http://example.com/"></frameset> <b>description</b></div>
+----------
+<div>safe <b>description</b></div>
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_iframe.data b/lib/lxml/html/tests/feedparser-data/entry_content_iframe.data
new file mode 100644
index 00000000..41f26709
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_iframe.data
@@ -0,0 +1,8 @@
+Description: entry content contains iframe
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe <b>description</b>'
+Options: 
+Notes: div wrapper, close <iframe>
+
+<div>safe<iframe src="http://example.com/"></iframe> <b>description</b></iframe></div>
+----------
+<div>safe <b>description</b></div>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_link.data b/lib/lxml/html/tests/feedparser-data/entry_content_link.data
new file mode 100644
index 00000000..2e793120
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_link.data
@@ -0,0 +1,7 @@
+Description: entry content contains link
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe <b>description</b>'
+Options:
+
+<div>safe<link rel="stylesheet" type="text/css" href="http://example.com/evil.css"> <b>description</b></div>
+----------
+<div>safe <b>description</b></div>
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_meta.data b/lib/lxml/html/tests/feedparser-data/entry_content_meta.data
new file mode 100644
index 00000000..1dbaa93b
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_meta.data
@@ -0,0 +1,7 @@
+Description: entry content contains meta
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe <b>description</b>'
+Options: 
+
+<div>safe<meta http-equiv="Refresh" content="0; URL=http://example.com/"> <b>description</b></div>
+----------
+<div>safe <b>description</b></div>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_object.data b/lib/lxml/html/tests/feedparser-data/entry_content_object.data
new file mode 100644
index 00000000..a4e4db19
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_object.data
@@ -0,0 +1,8 @@
+Description: entry content contains object
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe <b>description</b>'
+Options: 
+Notes: div wrapper, close <object>
+
+<div>safe<object classid="clsid:C932BA85-4374-101B-A56C-00AA003668DC"></object> <b>description</b></div>
+----------
+<div>safe <b>description</b></div>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onabort.data b/lib/lxml/html/tests/feedparser-data/entry_content_onabort.data
new file mode 100644
index 00000000..5bb69258
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onabort.data
@@ -0,0 +1,7 @@
+Description: entry content contains onabort
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onabort="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onblur.data b/lib/lxml/html/tests/feedparser-data/entry_content_onblur.data
new file mode 100644
index 00000000..05b2bf73
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onblur.data
@@ -0,0 +1,7 @@
+Description: entry content contains onblur
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onblur="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onchange.data b/lib/lxml/html/tests/feedparser-data/entry_content_onchange.data
new file mode 100644
index 00000000..51f56e24
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onchange.data
@@ -0,0 +1,7 @@
+Description: entry content contains onchange
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onchange="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onclick.data b/lib/lxml/html/tests/feedparser-data/entry_content_onclick.data
new file mode 100644
index 00000000..e9362f6f
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onclick.data
@@ -0,0 +1,7 @@
+Description: entry content contains onclick
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onclick="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_ondblclick.data b/lib/lxml/html/tests/feedparser-data/entry_content_ondblclick.data
new file mode 100644
index 00000000..9ac5e9be
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_ondblclick.data
@@ -0,0 +1,7 @@
+Description: entry content contains ondblclick
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: javascript
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" ondblclick="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onerror.data b/lib/lxml/html/tests/feedparser-data/entry_content_onerror.data
new file mode 100644
index 00000000..0068273a
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onerror.data
@@ -0,0 +1,7 @@
+Description: entry content contains onerror
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onerror="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onfocus.data b/lib/lxml/html/tests/feedparser-data/entry_content_onfocus.data
new file mode 100644
index 00000000..50ff3040
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onfocus.data
@@ -0,0 +1,7 @@
+Description: entry content contains onfocus
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onfocus="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onkeydown.data b/lib/lxml/html/tests/feedparser-data/entry_content_onkeydown.data
new file mode 100644
index 00000000..9802fc79
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onkeydown.data
@@ -0,0 +1,7 @@
+Description: entry content contains onkeydown
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onkeydown="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onkeypress.data b/lib/lxml/html/tests/feedparser-data/entry_content_onkeypress.data
new file mode 100644
index 00000000..9fc20010
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onkeypress.data
@@ -0,0 +1,7 @@
+Description: entry content contains onkeypress
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onkeypress="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onkeyup.data b/lib/lxml/html/tests/feedparser-data/entry_content_onkeyup.data
new file mode 100644
index 00000000..bd2b89ac
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onkeyup.data
@@ -0,0 +1,7 @@
+Description: entry content contains onkeyup
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onkeyup="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onload.data b/lib/lxml/html/tests/feedparser-data/entry_content_onload.data
new file mode 100644
index 00000000..ba999a03
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onload.data
@@ -0,0 +1,7 @@
+Description: entry content contains onload
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onload="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onmousedown.data b/lib/lxml/html/tests/feedparser-data/entry_content_onmousedown.data
new file mode 100644
index 00000000..2cfaa089
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onmousedown.data
@@ -0,0 +1,7 @@
+Description: entry content contains onmousedown
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onmousedown="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onmouseout.data b/lib/lxml/html/tests/feedparser-data/entry_content_onmouseout.data
new file mode 100644
index 00000000..0a9daf94
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onmouseout.data
@@ -0,0 +1,7 @@
+Description: entry content contains onmouseout
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onmouseout="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onmouseover.data b/lib/lxml/html/tests/feedparser-data/entry_content_onmouseover.data
new file mode 100644
index 00000000..91f3b6de
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onmouseover.data
@@ -0,0 +1,7 @@
+Description: entry content contains onmouseover
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onmouseover="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onmouseup.data b/lib/lxml/html/tests/feedparser-data/entry_content_onmouseup.data
new file mode 100644
index 00000000..3c2d61a4
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onmouseup.data
@@ -0,0 +1,7 @@
+Description: entry content contains onmouseup
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onmouseup="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onreset.data b/lib/lxml/html/tests/feedparser-data/entry_content_onreset.data
new file mode 100644
index 00000000..6f6a1e5e
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onreset.data
@@ -0,0 +1,7 @@
+Description: entry content contains onreset
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onreset="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onresize.data b/lib/lxml/html/tests/feedparser-data/entry_content_onresize.data
new file mode 100644
index 00000000..5953fb09
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onresize.data
@@ -0,0 +1,7 @@
+Description: entry content contains onresize
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onresize="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onsubmit.data b/lib/lxml/html/tests/feedparser-data/entry_content_onsubmit.data
new file mode 100644
index 00000000..41f356e0
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onsubmit.data
@@ -0,0 +1,7 @@
+Description: entry content contains onsubmit
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onsubmit="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_onunload.data b/lib/lxml/html/tests/feedparser-data/entry_content_onunload.data
new file mode 100644
index 00000000..4191a3e4
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_onunload.data
@@ -0,0 +1,7 @@
+Description: entry content contains onunload
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />'
+Options: 
+
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" onunload="location.href='http://www.ragingplatypus.com/';" />
+----------
+<img src="http://www.ragingplatypus.com/i/cam-full.jpg" />
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_script.data b/lib/lxml/html/tests/feedparser-data/entry_content_script.data
new file mode 100644
index 00000000..9c2f1434
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_script.data
@@ -0,0 +1,7 @@
+Description: entry content contains script
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe description'
+Options: 
+
+<div>safe<script type="text/javascript">location.href='http:/'+'/example.com/';</script> description</div>
+----------
+<div>safe description</div>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_script_cdata.data b/lib/lxml/html/tests/feedparser-data/entry_content_script_cdata.data
new file mode 100644
index 00000000..e701eac4
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_script_cdata.data
@@ -0,0 +1,13 @@
+Description: entry content contains script (cdata)
+Expect: not bozo and entries[0]['content'][0]['value'] == u'safe description'
+Options: 
+Notes: div wrapper.  Currently not working because of how HTML() is parsing the CDATA (not in a useful way)
+       The resulting code is safe, it just includes crap from the <script> tag (but not the script tag
+       itself).
+Ignore: true
+
+<div>
+  <![CDATA[safe<script type="text/javascript">location.href='http:/'+'/example.com/';</script> description]]>
+</div>
+----------
+<div>safe description</div>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_script_inline.data b/lib/lxml/html/tests/feedparser-data/entry_content_script_inline.data
new file mode 100644
index 00000000..5ade5a40
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_script_inline.data
@@ -0,0 +1,7 @@
+Description: entry content contains script (inline)
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<div>safe description</div>'
+Options: 
+
+<div xmlns="http://www.w3.org/1999/xhtml">safe<script type="text/javascript">location.href='http:/'+'/example.com/';</script> description</div>
+----------
+<div>safe description</div>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/feedparser-data/entry_content_style.data b/lib/lxml/html/tests/feedparser-data/entry_content_style.data
new file mode 100644
index 00000000..ca7a41c0
--- /dev/null
+++ b/lib/lxml/html/tests/feedparser-data/entry_content_style.data
@@ -0,0 +1,7 @@
+Description: entry content contains style
+Expect: not bozo and entries[0]['content'][0]['value'] == u'<a href="http://www.ragingplatypus.com/">never trust your upstream platypus</a>'
+Options: style
+
+<a href="http://www.ragingplatypus.com/" style="display:block; position:absolute; left:0; top:0; width:100%; height:100%; z-index:1; background-color:black; background-image:url(http://www.ragingplatypus.com/i/cam-full.jpg); background-x:center; background-y:center; background-repeat:repeat;">never trust your upstream platypus</a>
+----------
+<a href="http://www.ragingplatypus.com/">never trust your upstream platypus</a>
\ No newline at end of file
diff --git a/lib/lxml/html/tests/hackers-org-data/background-image-plus.data b/lib/lxml/html/tests/hackers-org-data/background-image-plus.data
new file mode 100644
index 00000000..c32a1356
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/background-image-plus.data
@@ -0,0 +1,8 @@
+Description: I built a quick XSS fuzzer to detect any erroneous characters that are allowed after the open parenthesis but before the JavaScript directive in IE and Netscape 8.1 in secure site mode. These are in decimal but you can include hex and add padding of course. (Any of the following chars can be used: 1-32, 34, 39, 160, 8192-8.13, 12288, 65279)
+    http://ha.ckers.org/xss.html#XSS_DIV_background-image_plus
+Options: -safe_attrs_only
+Notes: As you see, the CSS gets corrupted, but I don't really care that much.
+
+<DIV STYLE="background-image: url(javascript:alert('XSS'))">text</div>
+----------
+<div style="background-image: url(">text</div>
diff --git a/lib/lxml/html/tests/hackers-org-data/background-image-with-unicoded.data b/lib/lxml/html/tests/hackers-org-data/background-image-with-unicoded.data
new file mode 100644
index 00000000..3ec45f91
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/background-image-with-unicoded.data
@@ -0,0 +1,10 @@
+Description: exploit (this has been modified slightly to obfuscate the url parameter). The original vulnerability was found by Renaud Lifchitz as a vulnerability in Hotmail.
+    http://ha.ckers.org/xss.html#XSS_DIV_background_image_unicode
+Options: -safe_attrs_only
+Ignore: true
+Notes: I don't understand how this exploit works.  It seems like the description actually refers to
+       the unicode you'd import, but why that matters I don't know.
+
+<DIV STYLE="background-image:\0075\0072\006C\0028'\006a\0061\0076\0061\0073\0063\0072\0069\0070\0074\003a\0061\006c\0065\0072\0074\0028.1027\0058.1053\0053\0027\0029'\0029">text</div>
+----------
+<div style="background-image: ">text</div>
diff --git a/lib/lxml/html/tests/hackers-org-data/downlevel-hidden.data b/lib/lxml/html/tests/hackers-org-data/downlevel-hidden.data
new file mode 100644
index 00000000..fc6e849c
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/downlevel-hidden.data
@@ -0,0 +1,9 @@
+Description: Downlevel-Hidden-Hidden block (only works in IE5.0 and later and Netscape 8.1 in IE rendering engine mode). Some websites consider anything inside a comment block to be safe and therefore does not need to be removed, which allows our Cross Site Scripting vector. Or the system could add comment tags around something to attempt to render it harmless. As we can see, that probably wouldn't do the job
+    http://ha.ckers.org/xss.html#XSS_Downlevel-Hidden
+Options: -comments, -processing_instructions
+
+<div><!--[if gte IE 4]>
+<SCRIPT>alert('XSS');</SCRIPT>
+<![endif]--></div>
+----------
+<div></div>
diff --git a/lib/lxml/html/tests/hackers-org-data/html-plus-time.data b/lib/lxml/html/tests/hackers-org-data/html-plus-time.data
new file mode 100644
index 00000000..77ccfdb7
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/html-plus-time.data
@@ -0,0 +1,12 @@
+Description: HTML+TIME in XML. This is how Grey Magic hacked Hotmail and Yahoo!. This only works in Internet Explorer and Netscape 8.1 in IE rendering engine mode and remember that you need to be between HTML and BODY tags for this to work
+    http://ha.ckers.org/xss.html#XSS_HTML_plus_time
+Ignore: true
+Notes: I don't understand the vector here, or how this is supposed to work.
+
+<div>
+<t:set attributeName="innerHTML" to="XSS&lt;SCRIPT DEFER&gt;alert(&quot;XSS&quot;)&lt;/SCRIPT&gt;">
+</BODY></HTML></div>
+----------
+<div>
+<t:set attributeName="innerHTML" to="XSS&lt;SCRIPT DEFER&gt;alert(&quot;XSS&quot;)&lt;/SCRIPT&gt;">
+</BODY></HTML>x</div>
diff --git a/lib/lxml/html/tests/hackers-org-data/javascript-link.data b/lib/lxml/html/tests/hackers-org-data/javascript-link.data
new file mode 100644
index 00000000..1eefa1f3
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/javascript-link.data
@@ -0,0 +1,15 @@
+Description: javascript: in many forms
+
+<div>
+ <a href="java
+script:alert()">x</a>
+ <a href="j a v a s c r i p t:alert()">x</a>
+ <a href="jscript
+:alert()">x</a>
+</div>
+----------
+<div>
+ <a href="">x</a>
+ <a href="">x</a>
+ <a href="">x</a>
+</div>
diff --git a/lib/lxml/html/tests/hackers-org-data/style-comment.data b/lib/lxml/html/tests/hackers-org-data/style-comment.data
new file mode 100644
index 00000000..f084e689
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/style-comment.data
@@ -0,0 +1,8 @@
+Description: to break up expression (Thanks to Roman Ivanov for this one)
+    http://ha.ckers.org/xss.html#XSS_STYLE_comment
+Options: -safe_attrs_only
+Notes: Because of the suspicious stuff in there, the style is removed entirely
+
+<IMG STYLE="xss:expr/*XSS*/ession(alert('XSS'))">
+----------
+<img>
diff --git a/lib/lxml/html/tests/hackers-org-data/style-expression.data b/lib/lxml/html/tests/hackers-org-data/style-expression.data
new file mode 100644
index 00000000..610eefea
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/style-expression.data
@@ -0,0 +1,10 @@
+Description: (this is really a hybrid of the above XSS vectors, but it really does show how hard STYLE tags can be to parse apart, like above this can send IE into a loop)
+    http://ha.ckers.org/xss.html#XSS_IMG_STYLE_expression
+Options: -safe_attrs_only
+Notes: Modified to avoid a parsing in libxml2 that ruins the XSS (the " marks).  
+       Also there seemed to be an extra "p" in exppression
+
+<div><img style="xss: ex/*<A STYLE='no\xss:noxss(*//*);
+xss:&#101;x&#x2F;*XSS*//*/*/pression(alert('XSS'))"></div>
+----------
+<div><img></div>
diff --git a/lib/lxml/html/tests/hackers-org-data/style-import.data b/lib/lxml/html/tests/hackers-org-data/style-import.data
new file mode 100644
index 00000000..d1aac0aa
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/style-import.data
@@ -0,0 +1,8 @@
+Description: tags with broken up JavaScript for XSS (this XSS at times sends IE into an infinite loop of alerts)
+    http://ha.ckers.org/xss.html#XSS_STYLE
+Options: -safe_attrs_only
+
+<div><STYLE>@im\port'\ja\vasc\ript:alert("XSS")';</STYLE></div>
+----------
+<div><style>/* deleted */</style></div>
+
diff --git a/lib/lxml/html/tests/hackers-org-data/style-js-tag.data b/lib/lxml/html/tests/hackers-org-data/style-js-tag.data
new file mode 100644
index 00000000..358adc87
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/style-js-tag.data
@@ -0,0 +1,7 @@
+Description: (Older versions of Netscape only)
+    http://ha.ckers.org/xss.html#XSS_STYLE_tag
+Options: -safe_attrs_only
+
+<div><STYLE TYPE="text/javascript">alert('XSS');</STYLE></div>
+----------
+<div></div>
diff --git a/lib/lxml/html/tests/hackers-org-data/style-url-js.data b/lib/lxml/html/tests/hackers-org-data/style-url-js.data
new file mode 100644
index 00000000..c96aea10
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/style-url-js.data
@@ -0,0 +1,8 @@
+Description: http://ha.ckers.org/xss.html#XSS_STYLE_background-image
+Options: -style, -safe_attrs_only
+Notes: The CSS is messed up here, but so it goes
+
+<div><STYLE>.XSS{background-image:url("javascript:alert('XSS')");}</STYLE><A CLASS=XSS></A></div>
+----------
+<div><style>.XSS{background-image:url("");}</style><a class="XSS"></a></div>
+
diff --git a/lib/lxml/html/tests/hackers-org-data/xml-data-island.data b/lib/lxml/html/tests/hackers-org-data/xml-data-island.data
new file mode 100644
index 00000000..a17df9ec
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/xml-data-island.data
@@ -0,0 +1,10 @@
+Description: XML data island with comment obfuscation (this is another take on the same exploit that doesn't use CDATA fields, but rather uses comments to break up the javascript directive)
+    http://ha.ckers.org/xss.html#XSS_XML_data_island_comment
+Ignore: true
+Notes: I don't understand the vector here.  Maybe datasrc should be filtered?
+
+<div><XML ID="xss"><I><B>&lt;IMG SRC="javas<!-- -->cript:alert('XSS')"&gt;</B></I></XML>
+<SPAN DATASRC="#xss" DATAFLD="B" DATAFORMATAS="HTML"></SPAN></div>
+----------
+<div><XML ID="xss"><I><B>&lt;IMG SRC="javas<!-- -->cript:alert('XSS')"&gt;</B></I></XML>
+<SPAN DATASRC="#xss" DATAFLD="B" DATAFORMATAS="HTML"></SPAN>x</div>
diff --git a/lib/lxml/html/tests/hackers-org-data/xml-embedded-js.data b/lib/lxml/html/tests/hackers-org-data/xml-embedded-js.data
new file mode 100644
index 00000000..b5196d68
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/xml-embedded-js.data
@@ -0,0 +1,9 @@
+Description: Locally hosted XML with embedded JavaScript#XSS_Local_XML that is generated using an XML data island. This is the same as above but instead refers to a locally hosted (must be on the same server) XML file that contains your cross site scripting vector. You can see the result here <http://ha.ckers.org/xssxmltest.html>
+    http://ha.ckers.org/xss.html#XSS_Local_XML
+
+<div><XML SRC="xsstest.xml" ID=I></XML>
+<SPAN DATASRC=#I DATAFLD=C DATAFORMATAS=HTML></SPAN></div>
+----------
+<div>
+ <span></span>
+</div>
diff --git a/lib/lxml/html/tests/hackers-org-data/xml-namespace.data.BROKEN b/lib/lxml/html/tests/hackers-org-data/xml-namespace.data.BROKEN
new file mode 100644
index 00000000..2bc999f0
--- /dev/null
+++ b/lib/lxml/html/tests/hackers-org-data/xml-namespace.data.BROKEN
@@ -0,0 +1,16 @@
+Description: XML namespace. The htc file must be located on the same server as your XSS vector
+    http://ha.ckers.org/xss.html#XSS_XML_namespace
+Note: I don't completely understand the vector here.  page_structure is what does this.
+
+<HTML xmlns:xss>
+  <body>
+    <?import namespace="xss" implementation="http://ha.ckers.org/xss.htc">
+    <xss:xss>XSS</xss:xss>
+  </body>
+</HTML>
+----------
+<HTML>
+  <body>
+    <div>XSS</div>
+  </body>
+</HTML>
diff --git a/lib/lxml/html/tests/test_autolink.py b/lib/lxml/html/tests/test_autolink.py
new file mode 100644
index 00000000..61b474ce
--- /dev/null
+++ b/lib/lxml/html/tests/test_autolink.py
@@ -0,0 +1,11 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest
+
+def test_suite():
+    suite = unittest.TestSuite()
+    if sys.version_info >= (2,4):
+        suite.addTests([make_doctest('test_autolink.txt')])
+    return suite
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/lib/lxml/html/tests/test_autolink.txt b/lib/lxml/html/tests/test_autolink.txt
new file mode 100644
index 00000000..cafc6204
--- /dev/null
+++ b/lib/lxml/html/tests/test_autolink.txt
@@ -0,0 +1,79 @@
+This tests autolink::
+
+    >>> from lxml.html import usedoctest
+    >>> from lxml.html.clean import autolink_html
+    >>> print(autolink_html('''
+    ... <div>Link here: http://test.com/foo.html.</div>
+    ... '''))
+    <div>Link here: <a href="http://test.com/foo.html">http://test.com/foo.html</a>.</div>
+    >>> print(autolink_html('''
+    ... <div>Mail me at mailto:ianb@test.com or http://myhome.com</div>
+    ... '''))
+    <div>Mail me at <a href="mailto:ianb@test.com">ianb@test.com</a>
+    or <a href="http://myhome.com">http://myhome.com</a></div>
+    >>> print(autolink_html('''
+    ... <div>The <b>great</b> thing is the http://link.com links <i>and</i>
+    ... the http://foobar.com links.</div>'''))
+    <div>The <b>great</b> thing is the <a href="http://link.com">http://link.com</a> links <i>and</i>
+    the <a href="http://foobar.com">http://foobar.com</a> links.</div>
+    >>> print(autolink_html('''
+    ... <div>Link: &lt;http://foobar.com&gt;</div>'''))
+    <div>Link: &lt;<a href="http://foobar.com">http://foobar.com</a>&gt;</div>
+    >>> print(autolink_html('''
+    ... <div>Link: (http://foobar.com)</div>'''))
+    <div>Link: (<a href="http://foobar.com">http://foobar.com</a>)</div>
+
+Parentheses are tricky; we'll do our best::
+
+    >>> print(autolink_html('''
+    ... <div>(Link: http://en.wikipedia.org/wiki/PC_Tools_(Central_Point_Software))</div>
+    ... '''))
+    <div>(Link: <a href="http://en.wikipedia.org/wiki/PC_Tools_(Central_Point_Software)">http://en.wikipedia.org/wiki/PC_Tools_(Central_Point_Software)</a>)</div>
+    >>> print(autolink_html('''
+    ... <div>... a link: http://foo.com)</div>
+    ... '''))
+    <div>... a link: <a href="http://foo.com">http://foo.com</a>)</div>
+
+Some cases that won't be caught (on purpose)::
+
+    >>> print(autolink_html('''
+    ... <div>A link to http://localhost/foo/bar won't, but a link to
+    ...  http://test.com will</div>'''))
+    <div>A link to http://localhost/foo/bar won't, but a link to
+    <a href="http://test.com">http://test.com</a> will</div>
+    >>> print(autolink_html('''
+    ... <div>A link in <textarea>http://test.com</textarea></div>'''))
+    <div>A link in <textarea>http://test.com</textarea></div>
+    >>> print(autolink_html('''
+    ... <div>A link in <a href="http://foo.com">http://bar.com</a></div>'''))
+    <div>A link in <a href="http://foo.com">http://bar.com</a></div>
+    >>> print(autolink_html('''
+    ... <div>A link in <code>http://foo.com</code> or
+    ... <span class="nolink">http://bar.com</span></div>'''))
+    <div>A link in <code>http://foo.com</code> or
+    <span class="nolink">http://bar.com</span></div>
+
+There's also a word-breaking function, ``word_break_html``, which should probably be run
+after autolink::
+
+    >>> from lxml.html.clean import word_break_html
+    >>> def pascii(s):  # print s as ASCII, with non-ASCII characters as XML character references
+    ...     print(s.encode('ascii', 'xmlcharrefreplace').decode('ascii'))
+    >>> pascii(word_break_html( u'''
+    ... <div>Hey you
+    ... 12345678901234567890123456789012345678901234567890</div>'''))
+    <div>Hey you
+    1234567890123456789012345678901234567890&#8203;1234567890</div>
+
+Not everything is broken up; ``<code>`` content and attribute values are left alone:
+
+    >>> pascii(word_break_html('''
+    ... <div>Hey you
+    ... <code>12345678901234567890123456789012345678901234567890</code></div>'''))
+    <div>Hey you
+    <code>12345678901234567890123456789012345678901234567890</code></div>
+    >>> pascii(word_break_html('''
+    ... <a href="12345678901234567890123456789012345678901234567890">text</a>'''))
+    <a href="12345678901234567890123456789012345678901234567890">text</a>
+
+    
diff --git a/lib/lxml/html/tests/test_basic.py b/lib/lxml/html/tests/test_basic.py
new file mode 100644
index 00000000..fd4896a7
--- /dev/null
+++ b/lib/lxml/html/tests/test_basic.py
@@ -0,0 +1,13 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest, doctest
+import lxml.html
+
+def test_suite():
+    suite = unittest.TestSuite()
+    if sys.version_info >= (2,4):
+        suite.addTests([make_doctest('test_basic.txt')])
+    suite.addTests([doctest.DocTestSuite(lxml.html)])
+    return suite
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/lib/lxml/html/tests/test_basic.txt b/lib/lxml/html/tests/test_basic.txt
new file mode 100644
index 00000000..d7066402
--- /dev/null
+++ b/lib/lxml/html/tests/test_basic.txt
@@ -0,0 +1,162 @@
+lxml.html adds a find_class method to elements::
+
+    >>> from lxml.etree import Comment
+    >>> from lxml.html import document_fromstring, fragment_fromstring, tostring
+    >>> from lxml.html import fragments_fromstring, fromstring
+    >>> from lxml.html.clean import clean, clean_html
+    >>> from lxml.html import usedoctest
+    >>> try: unicode = unicode
+    ... except NameError: unicode = str
+
+    >>> h = document_fromstring('''
+    ... <html><head></head>
+    ... <body>
+    ...   <a class="vcard
+    ... fn   url" href="foobar">P1</a>
+    ...   <a class="not-fn vcard" href="baz">P2</a>
+    ... </body></html>''')
+    >>> print(tostring(h, encoding=unicode))
+    <html>
+      <head></head>
+      <body>
+        <a class="vcard
+    fn   url" href="foobar">P1</a>
+        <a class="not-fn vcard" href="baz">P2</a>
+      </body>
+    </html>
+    >>> print([e.text for e in h.find_class('fn')])
+    ['P1']
+    >>> print([e.text for e in h.find_class('vcard')])
+    ['P1', 'P2']
+
+Also added is ``find_rel_links()``, which you can use to search for links
+like ``<a rel="$something">``::
+
+    >>> h = document_fromstring('''
+    ... <a href="1">test 1</a>
+    ... <a href="2" rel="tag">item 2</a>
+    ... <a href="3" rel="tagging">item 3</a>
+    ... <a href="4" rel="TAG">item 4</a>''')
+    >>> print([e.attrib['href'] for e in h.find_rel_links('tag')])
+    ['2', '4']
+    >>> print([e.attrib['href'] for e in h.find_rel_links('nofollow')])
+    []
+
+Another method is ``get_element_by_id`` that does what it says::
+
+    >>> print(tostring(fragment_fromstring('''
+    ... <div>
+    ...  <span id="test">stuff</span>
+    ... </div>''').get_element_by_id('test'), encoding=unicode))
+    <span id="test">stuff</span>
+
+Or to get the content of an element without the tags, use text_content()::
+
+    >>> el = fragment_fromstring('''
+    ... <div>This is <a href="foo">a <b>bold</b> link</a></div>''')
+    >>> el.text_content()
+    'This is a bold link'
+
+Or drop an element (leaving its content) or the entire tree, like::
+
+    >>> doc = document_fromstring('''
+    ... <html>
+    ...  <body>
+    ...   <div id="body">
+    ...    This is a <a href="foo" id="link">test</a> of stuff.
+    ...   </div>
+    ...   <!-- a comment -->
+    ...   <div>footer</div>
+    ...  </body>
+    ... </html>''')
+    >>> doc.get_element_by_id('link').drop_tag()
+    >>> print(tostring(doc, encoding=unicode))
+    <html>
+     <body>
+      <div id="body">
+       This is a test of stuff.
+      </div>
+      <!-- a comment -->
+      <div>footer</div>
+     </body>
+    </html>
+    >>> doc.get_element_by_id('body').drop_tree()
+    >>> print(tostring(doc, encoding=unicode))
+    <html>
+     <body>
+      <!-- a comment -->
+      <div>footer</div>
+     </body>
+    </html>
+
+Note, however, that comment text will not be merged into the tree when you
+drop the comment.  Here, ``drop_tag()`` behaves exactly like ``drop_tree()``:
+
+    >>> for comment in doc.getiterator(Comment):
+    ...     comment.drop_tag()
+    >>> print(tostring(doc, encoding=unicode))
+    <html>
+     <body>
+      <div>footer</div>
+     </body>
+    </html>
+
+In Python3 it should be possible to parse strings given as bytes objects, at
+least if an encoding is given.
+
+    >>> from lxml.html import HTMLParser
+    >>> enc = 'utf-8'
+    >>> html_parser = HTMLParser(encoding=enc)
+    >>> src = '<html><body>Test</body></html>'.encode(enc)
+
+    >>> doc = fromstring(src, parser=html_parser)
+    >>> print(tostring(doc, encoding=unicode))
+    <html><body>Test</body></html>
+
+    >>> docs = fragments_fromstring(src, parser=html_parser)
+    >>> len(docs)
+    1
+    >>> print(docs[0])
+    Test
+
+Bug 599318: Calling fromstring with a frameset fragment should not raise an error;
+the whole document is returned.
+
+    >>> import lxml.html
+    >>> content='''
+    ... <frameset>
+    ...  <frame src="main.php" name="srcpg">
+    ... </frameset>'''
+    >>> etree_document = lxml.html.fromstring(content)
+    >>> print(tostring(etree_document, encoding=unicode))
+    <html><frameset><frame src="main.php" name="srcpg"></frameset></html>
+
+Bug 599318: Calling fromstring with a div fragment should not raise an error;
+only the element is returned.
+
+    >>> import lxml.html
+    >>> content='<div></div>'
+    >>> etree_document = lxml.html.fromstring(content)
+    >>> print(tostring(etree_document, encoding=unicode))
+    <div></div>
+
+Bug 599318: Calling fromstring with a head fragment should not raise an error;
+the whole document is returned.
+
+    >>> import lxml.html
+    >>> content='<head></head>'
+    >>> etree_document = lxml.html.fromstring(content)
+    >>> print(tostring(etree_document, encoding=unicode))
+    <html><head></head></html>
+
+Bug 690319: Leading whitespace before doctype declaration should not raise an error.
+
+    >>> import lxml.html
+    >>> content='''
+    ...     <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
+    ...     <html>
+    ...     </html>'''
+    >>> etree_document = lxml.html.fromstring(content)
+    >>> print(tostring(etree_document, encoding=unicode))
+    <html></html>
+
diff --git a/lib/lxml/html/tests/test_clean.py b/lib/lxml/html/tests/test_clean.py
new file mode 100644
index 00000000..3bcaaf5a
--- /dev/null
+++ b/lib/lxml/html/tests/test_clean.py
@@ -0,0 +1,80 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest
+from lxml.etree import LIBXML_VERSION
+
+import lxml.html
+from lxml.html.clean import Cleaner, clean_html
+
+
+class CleanerTest(unittest.TestCase):
+    def test_allow_tags(self):
+        html = """
+            <html>
+            <head>
+            </head>
+            <body>
+            <p>some text</p>
+            <table>
+            <tr>
+            <td>hello</td><td>world</td>
+            </tr>
+            <tr>
+            <td>hello</td><td>world</td>
+            </tr>
+            </table>
+            <img>
+            </body>
+            </html>
+            """
+
+        html_root = lxml.html.document_fromstring(html)
+        cleaner = Cleaner(
+            remove_unknown_tags = False,
+            allow_tags = ['table', 'tr', 'td'])
+        result = cleaner.clean_html(html_root)
+
+        self.assertEqual(12-5+1, len(list(result.iter())))
+
+    def test_safe_attrs_included(self):
+        html = """<p><span style="color: #00ffff;">Cyan</span></p>"""
+
+        safe_attrs=set(lxml.html.defs.safe_attrs)
+        safe_attrs.add('style')
+
+        cleaner = Cleaner(
+            safe_attrs_only=True,
+            safe_attrs=safe_attrs)
+        result = cleaner.clean_html(html)
+
+        self.assertEqual(html, result)
+
+    def test_safe_attrs_excluded(self):
+        html = """<p><span style="color: #00ffff;">Cyan</span></p>"""
+        expected = """<p><span>Cyan</span></p>"""
+
+        safe_attrs=set()
+
+        cleaner = Cleaner(
+            safe_attrs_only=True,
+            safe_attrs=safe_attrs)
+        result = cleaner.clean_html(html)
+
+        self.assertEqual(expected, result)
+
+    def test_clean_invalid_root_tag(self):
+        # only testing that cleaning with invalid root tags works at all
+        s = lxml.html.fromstring('parent <invalid tag>child</another>')
+        self.assertEqual('parent child', clean_html(s).text_content())
+
+        s = lxml.html.fromstring('<invalid tag>child</another>')
+        self.assertEqual('child', clean_html(s).text_content())
+
+
+def test_suite():
+    suite = unittest.TestSuite()
+    if sys.version_info >= (2,4):
+        suite.addTests([make_doctest('test_clean.txt')])
+        if LIBXML_VERSION >= (2,6,31):
+            suite.addTests([make_doctest('test_clean_embed.txt')])
+    suite.addTests(unittest.makeSuite(CleanerTest))
+    return suite
diff --git a/lib/lxml/html/tests/test_clean.txt b/lib/lxml/html/tests/test_clean.txt
new file mode 100644
index 00000000..fb99c0d9
--- /dev/null
+++ b/lib/lxml/html/tests/test_clean.txt
@@ -0,0 +1,161 @@
+>>> from lxml.html import fromstring, tostring
+>>> from lxml.html.clean import clean, clean_html, Cleaner
+>>> from lxml.html import usedoctest
+
+>>> doc = '''<html>
+...   <head>
+...     <script type="text/javascript" src="evil-site"></script>
+...     <link rel="alternate" type="text/rss" src="evil-rss">
+...     <link rel="alternate" type="text/rss" href="http://example.com">
+...     <link rel="stylesheet" type="text/rss" href="http://example.com">
+...     <style>
+...       body {background-image: url(javascript:do_evil)};
+...       div {background-image: url(data:text/html;base64,PHNjcmlwdD5hbGVydCgidGVzdCIpOzwvc2NyaXB0Pg==)};
+...       div {color: expression(evil)};
+...     </style>
+...   </head>
+...   <body onload="evil_function()">
+...     <!-- I am interpreted for EVIL! -->
+...     <a href="javascript:evil_function()">a link</a>
+...     <a href="data:text/html;base64,PHNjcmlwdD5hbGVydCgidGVzdCIpOzwvc2NyaXB0Pg==">data</a>
+...     <a href="#" onclick="evil_function()">another link</a>
+...     <p onclick="evil_function()">a paragraph</p>
+...     <div style="display: none">secret EVIL!</div>
+...     <object> of EVIL! </object>
+...     <iframe src="evil-site"></iframe>
+...     <form action="evil-site">
+...       Password: <input type="password" name="password">
+...     </form>
+...     <a href="evil-site">spam spam SPAM!</a>
+...     <a href="http://example.com" rel="author">Author</a>
+...     <a href="http://example.com" rel="nofollow">Text</a>
+...     <img src="evil!">
+...   </body>
+... </html>'''
+
+>>> print(doc)
+<html>
+  <head>
+    <script type="text/javascript" src="evil-site"></script>
+    <link rel="alternate" type="text/rss" src="evil-rss">
+    <link rel="alternate" type="text/rss" href="http://example.com">
+    <link rel="stylesheet" type="text/rss" href="http://example.com">
+    <style>
+      body {background-image: url(javascript:do_evil)};
+      div {background-image: url(data:text/html;base64,PHNjcmlwdD5hbGVydCgidGVzdCIpOzwvc2NyaXB0Pg==)};
+      div {color: expression(evil)};
+    </style>
+  </head>
+  <body onload="evil_function()">
+    <!-- I am interpreted for EVIL! -->
+    <a href="javascript:evil_function()">a link</a>
+    <a href="data:text/html;base64,PHNjcmlwdD5hbGVydCgidGVzdCIpOzwvc2NyaXB0Pg==">data</a>
+    <a href="#" onclick="evil_function()">another link</a>
+    <p onclick="evil_function()">a paragraph</p>
+    <div style="display: none">secret EVIL!</div>
+    <object> of EVIL! </object>
+    <iframe src="evil-site"></iframe>
+    <form action="evil-site">
+      Password: <input type="password" name="password">
+    </form>
+    <a href="evil-site">spam spam SPAM!</a>
+    <a href="http://example.com" rel="author">Author</a>
+    <a href="http://example.com" rel="nofollow">Text</a>
+    <img src="evil!">
+  </body>
+</html>
+
+>>> print(tostring(fromstring(doc)).decode("utf-8"))
+<html>
+  <head>
+    <script type="text/javascript" src="evil-site"></script>
+    <link rel="alternate" type="text/rss" src="evil-rss">
+    <link rel="alternate" type="text/rss" href="http://example.com">
+    <link rel="stylesheet" type="text/rss" href="http://example.com">
+    <style>
+      body {background-image: url(javascript:do_evil)};
+      div {background-image: url(data:text/html;base64,PHNjcmlwdD5hbGVydCgidGVzdCIpOzwvc2NyaXB0Pg==)};
+      div {color: expression(evil)};
+    </style>
+  </head>
+  <body onload="evil_function()">
+    <!-- I am interpreted for EVIL! -->
+    <a href="javascript:evil_function()">a link</a>
+    <a href="data:text/html;base64,PHNjcmlwdD5hbGVydCgidGVzdCIpOzwvc2NyaXB0Pg==">data</a>
+    <a href="#" onclick="evil_function()">another link</a>
+    <p onclick="evil_function()">a paragraph</p>
+    <div style="display: none">secret EVIL!</div>
+    <object> of EVIL! </object>
+    <iframe src="evil-site"></iframe>
+    <form action="evil-site">
+      Password: <input type="password" name="password">
+    </form>
+    <a href="evil-site">spam spam SPAM!</a>
+    <a href="http://example.com" rel="author">Author</a>
+    <a href="http://example.com" rel="nofollow">Text</a>
+    <img src="evil!">
+  </body>
+</html>
+
+>>> print(Cleaner(page_structure=False, safe_attrs_only=False).clean_html(doc))
+<html>
+  <head>
+    <style>/* deleted */</style>
+  </head>
+  <body>
+    <a href="">a link</a>
+    <a href="">data</a>
+    <a href="#">another link</a>
+    <p>a paragraph</p>
+    <div style="display: none">secret EVIL!</div>
+    of EVIL!
+    Password:
+    <a href="evil-site">spam spam SPAM!</a>
+    <a href="http://example.com" rel="author">Author</a>
+    <a href="http://example.com" rel="nofollow">Text</a>
+    <img src="evil!">
+  </body>
+</html>
+
+>>> print(Cleaner(style=True, links=True, add_nofollow=True, page_structure=False, safe_attrs_only=False).clean_html(doc))
+<html>
+  <head>
+  </head>
+  <body>
+    <a href="">a link</a>
+    <a href="">data</a>
+    <a href="#">another link</a>
+    <p>a paragraph</p>
+    <div>secret EVIL!</div>
+    of EVIL!
+    Password:
+    <a href="evil-site" rel="nofollow">spam spam SPAM!</a>
+    <a href="http://example.com" rel="author nofollow">Author</a>
+    <a href="http://example.com" rel="nofollow">Text</a>
+    <img src="evil!">
+  </body>
+</html>
+
+>>> print(Cleaner(links=False, page_structure=False, javascript=True, host_whitelist=['example.com'], whitelist_tags=None).clean_html(doc))
+<html>
+  <head>
+    <link rel="alternate" type="text/rss" src="evil-rss">
+    <link rel="alternate" type="text/rss" href="http://example.com">
+    <link rel="stylesheet" type="text/rss" href="http://example.com">
+    <style>/* deleted */</style>
+  </head>
+  <body>
+    <a href="">a link</a>
+    <a href="">data</a>
+    <a href="#">another link</a>
+    <p>a paragraph</p>
+    <div>secret EVIL!</div>
+    of EVIL!
+    Password:
+    <a href="evil-site">spam spam SPAM!</a>
+    <a href="http://example.com" rel="author">Author</a>
+    <a href="http://example.com" rel="nofollow">Text</a>
+    <img src="evil!">
+  </body>
+</html>
+
diff --git a/lib/lxml/html/tests/test_clean_embed.txt b/lib/lxml/html/tests/test_clean_embed.txt
new file mode 100644
index 00000000..59a40551
--- /dev/null
+++ b/lib/lxml/html/tests/test_clean_embed.txt
@@ -0,0 +1,39 @@
+THIS FAILS IN libxml2 2.6.29 AND 2.6.30 !!
+
+
+>>> from lxml.html import fromstring, tostring
+>>> from lxml.html.clean import clean, clean_html, Cleaner
+>>> from lxml.html import usedoctest
+
+>>> def tostring(el):  # work-around for Py3 'bytes' type
+...     from lxml.html import tostring
+...     s = tostring(el)
+...     if not isinstance(s, str):
+...         s = s.decode('UTF-8')
+...     return s
+
+>>> doc_embed = '''<div>
+... <embed src="http://www.youtube.com/v/183tVH1CZpA" type="application/x-shockwave-flash"></embed>
+... <embed src="http://anothersite.com/v/another"></embed>
+... <script src="http://www.youtube.com/example.js"></script>
+... <script src="/something-else.js"></script>
+... </div>'''
+>>> print(tostring(fromstring(doc_embed)))
+<div>
+<embed src="http://www.youtube.com/v/183tVH1CZpA" type="application/x-shockwave-flash"></embed>
+<embed src="http://anothersite.com/v/another"></embed>
+<script src="http://www.youtube.com/example.js"></script>
+<script src="/something-else.js"></script>
+</div>
+>>> print(Cleaner().clean_html(doc_embed))
+<div>
+</div>
+>>> print(Cleaner(host_whitelist=['www.youtube.com']).clean_html(doc_embed))
+<div>
+<embed src="http://www.youtube.com/v/183tVH1CZpA" type="application/x-shockwave-flash"></embed>
+</div>
+>>> print(Cleaner(host_whitelist=['www.youtube.com'], whitelist_tags=None).clean_html(doc_embed))
+<div>
+<embed src="http://www.youtube.com/v/183tVH1CZpA" type="application/x-shockwave-flash"></embed>
+<script src="http://www.youtube.com/example.js"></script>
+</div>
diff --git a/lib/lxml/html/tests/test_diff.py b/lib/lxml/html/tests/test_diff.py
new file mode 100644
index 00000000..f1fba4bc
--- /dev/null
+++ b/lib/lxml/html/tests/test_diff.py
@@ -0,0 +1,14 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest, doctest
+
+from lxml.html import diff
+
+def test_suite():
+    """Return the diff doctests: test_diff.txt plus the lxml.html.diff module's own."""
+    tests = []
+    if sys.version_info >= (2,4):
+        tests = [make_doctest('test_diff.txt'), doctest.DocTestSuite(diff)]
+    return unittest.TestSuite(tests)
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/lib/lxml/html/tests/test_diff.txt b/lib/lxml/html/tests/test_diff.txt
new file mode 100644
index 00000000..9057a2b6
--- /dev/null
+++ b/lib/lxml/html/tests/test_diff.txt
@@ -0,0 +1,252 @@
+lxml.html.diff does HTML comparisons.  These are word-based comparisons.
+
+First, a handy function for normalizing whitespace and doing word wrapping::
+
+    >>> import re, textwrap
+    >>> def pwrapped(text):
+    ...     text = re.sub(r'[ \n\t\r]+', ' ', text)
+    ...     text = textwrap.fill(text)
+    ...     print(text)
+    >>> def pdiff(text1, text2):
+    ...     pwrapped(htmldiff(text1, text2))
+
+Example::
+
+    >>> from lxml.html.diff import htmldiff, html_annotate
+    >>> html1 = '<p>This is some test text with some changes and some same stuff</p>'
+    >>> html2 = '''<p>This is some test textual writing with some changed stuff 
+    ... and some same stuff</p>'''
+    >>> pdiff(html1, html2)
+    <p>This is some test <ins>textual writing with some changed stuff
+    </ins> <del>text with some changes</del> and some same stuff</p>
+
+Style tags are largely ignored in terms of differences, though markup is not eliminated::
+
+    >>> html1 = '<p>Hi <i>you guys</i></p>'
+    >>> html2 = '<p>Hi <i>you</i> guys</p>'
+    >>> pdiff(html1, html2)
+    <p>Hi <i>you</i> guys</p>
+    >>> pdiff('text', '<p>text</p>')
+    <p>text</p>
+    >>> pdiff('<i>Hi guys</i> !!', '<i>Hi guy</i> !!')
+    <i>Hi <ins>guy</ins> <del>guys</del> </i> !!
+    >>> pdiff('H<i>i</i>', 'Hi')
+    <ins>Hi</ins> <del>H<i>i</i></del>
+    >>> pdiff('<i>A B</i> C', '<i>A</i> C')
+    <i>A <del>B</del> </i> C
+    >>> pdiff('<i>A B</i> C', '<i>B</i> C')
+    <i> <del>A</del> B</i> C
+    >>> pdiff('<p></p>', '<p></p>')
+    <p></p>
+    >>> pdiff('<p>Hi</p>', '<p>Bye</p>')
+    <p><ins>Bye</ins></p> <p><del>Hi</del></p>
+    >>> pdiff('<p>Hi Guy</p>', '<p>Bye Guy</p>')
+    <p> <ins>Bye</ins> <del>Hi</del> Guy</p>
+    >>> pdiff('<p>Hey there</p>', '')
+    <ins></ins> <p><del>Hey there</del></p>
+
+Movement between paragraphs is ignored, as tag-based changes are generally ignored::
+    >>> 
+    >>> pdiff('<p>Hello</p><p>World</p>', '<p>Hello World</p>')
+    <p>Hello World</p>
+
+As a special case, changing the href of a link is displayed, and
+images are treated like words:
+
+    >>> pdiff('<a href="http://yahoo.com">search</a>', '<a href="http://google.com">search</a>')
+    <a href="http://google.com">search <ins> Link: http://google.com</ins>
+    <del> Link: http://yahoo.com</del> </a>
+    >>> pdiff('<p>Print this <img src="print.gif"></p>', '<p>Print this</p>')
+    <p>Print this <del><img src="print.gif"></del> </p>
+    >>> pdiff('<a href="http://yahoo.com">search</a>', '<a href="http://yahoo.com">search</a>')
+    <a href="http://yahoo.com">search</a>
+
+Images may sometimes not have 'src' attributes:
+
+    >>> pdiff('<img src="tease"> <img> test <img src="test">', '<img> test <img src="toast">')
+    <del><img src="tease"></del> <img> test <ins><img src="toast"></ins>
+    <del><img src="test"></del>
+
+A test of empty elements:
+
+    >>> pdiff('some <br> text', 'some <br> test')
+    some <ins><br> test</ins> <del><br> text</del>
+    
+Whitespace is generally ignored when computing the diff but preserved in the output:
+
+    >>> print(htmldiff('<p> first\nsecond\nthird</p>', '<p>   &#xA0; first\n  second\nthird  </p>'))
+    <p>first
+      second
+    third  </p>
+    >>> print(htmldiff('<pre>first\nsecond\nthird</pre>', '<pre>first\nsecond\nthird</pre>'))
+    <pre>first
+    second
+    third</pre>
+    >>> print(htmldiff('<pre>first\nsecond</pre>', '<pre>first\nsecond\n third</pre>'))
+    <pre>first
+    second
+     <ins>third</ins> </pre>
+
+The sixteen combinations:
+
+First "insert start" (del start/middle/end/none):
+
+    >>> pdiff('<b>A B C</b>', '<b>D B C</b')
+    <b> <ins>D</ins> <del>A</del> B C</b>
+    >>> pdiff('<b>A B C</b>', '<b>D A C</b>')
+    <b> <ins>D</ins> A <del>B</del> C</b>
+    >>> pdiff('<b>A B C</b>', '<b>D A B</b>')
+    <b> <ins>D</ins> A B <del>C</del> </b>
+    >>> pdiff('<b>A B C</b>', '<b>D A B C</b>')
+    <b> <ins>D</ins> A B C</b>
+
+Next, "insert middle" (del start/middle/end/none):
+
+    >>> pdiff('<b>A B C</b>', '<b>D B C</b>')
+    <b> <ins>D</ins> <del>A</del> B C</b>
+    >>> pdiff('<b>A B C</b>', '<b>A D C</b>')
+    <b>A <ins>D</ins> <del>B</del> C</b>
+    >>> pdiff('<b>A B C</b>', '<b>A D B</b>')
+    <b>A <ins>D</ins> B <del>C</del> </b>
+
+This one case hits the threshold of our insensitive matching:
+
+    >>> pdiff('<b>A B C</b>', '<b>A D B C</b>')
+    <b> <ins>A D</ins> <del>A</del> B C</b>
+
+
+Then "insert end" (del start/middle/end/none):
+
+    >>> pdiff('<b>A B C</b>', '<b>B C D</b>')
+    <b> <del>A</del> B C <ins>D</ins> </b>
+    >>> pdiff('<b>A B C</b>', '<b>A C D</b>')
+    <b>A <del>B</del> C <ins>D</ins> </b>
+    >>> pdiff('<b>A B C</b>', '<b>A B D</b>')
+    <b>A B <ins>D</ins> <del>C</del> </b>
+    >>> pdiff('<b>A B C</b>', '<b>A B C D</b>')
+    <b>A B C <ins>D</ins> </b>
+
+Then no insert (del start/middle/end):
+
+    >>> pdiff('<b>A B C</b>', '<b>B C</b>')
+    <b> <del>A</del> B C</b>
+    >>> pdiff('<b>A B C</b>', '<b>A C</b>')
+    <b>A <del>B</del> C</b>
+    >>> pdiff('<b>A B C</b>', '<b>A B</b>')
+    <b>A B <del>C</del> </b>
+
+    >>> pdiff('<b>A B</b> C', '<b>A B</b>')
+    <b>A B</b> <del>C</del>
+    >>> pdiff('<b>A B</b> <b>C</b>', '<b>A B</b>')
+    <b>A B</b> <del><b>C</b></del>
+    >>> pdiff('A <p><b>hey there</b> <i>how are you?</i></p>', 'A')
+    A <p><del><b>hey there</b> <i>how are you?</i></del></p>
+    
+Testing a larger document, to make sure that no weird,
+unnecessary parallels are found:
+
+    >>> pdiff('''
+    ... <p>This is a test document with many words in it that goes on
+    ... for a while and doesn't have anything do to with the next
+    ... document that we match this against</p>''', '''
+    ... <p>This is another document with few similarities to the preceding
+    ... one, but enough that it may have overlap that could turn into
+    ... a confusing series of deletes and inserts.
+    ... </p>''')
+    <p><ins>This is another document with few similarities to the
+    preceding one, but enough that it may have overlap that could turn
+    into a confusing series of deletes and inserts. </ins></p>
+    <p><del>This is a test document with many words in it that goes on for
+    a while and doesn't have anything do to with the next document that we
+    match this against</del></p>
+
+
+
+Annotation of content can also be done, where every bit of content is
+marked up with information about where it came from.
+
+First, some setup; note that html_annotate is called with a sequence
+of (document, annotation) pairs, one per document version.  We'll
+just use indexes, but you could use author or timestamp information.
+
+    >>> def markup(text, annotation):
+    ...     return '<span version="%s">%s</span>' % (annotation, text)
+    >>> def panno(*docs):
+    ...     pwrapped(html_annotate([(doc, index) for index, doc in enumerate(docs)],
+    ...                            markup=markup))
+
+Now, a sequence of documents:
+
+    >>> panno('Hello cruel world', 'Hi cruel world', 'Hi world')
+    <span version="1">Hi</span> <span version="0">world</span>
+    >>> panno('A similar document', 'A similar document',
+    ...       'A similar document here')
+    <span version="0">A similar document</span> <span
+    version="2">here</span>
+    >>> panno('<p>P1 para</p><p>P2 para</p>', '<p>P1 para</p><p>P3 foo</p>')
+    <p><span version="0">P1 para</span></p><p><span version="1">P3
+    foo</span></p>
+    >>> panno('Hello<p>There World</p>','Hello<p>There Town</p>')
+    <span version="0">Hello</span><p><span version="0">There</span> <span
+    version="1">Town</span></p>
+    >>> panno('<p>Hello</p>There World','<p>Hello</p>There Town')
+    <p><span version="0">Hello</span></p><span version="0">There</span>
+    <span version="1">Town</span>
+    >>> panno('<p>Hello</p><p>There World</p>','<p>Hello</p><p>There Town</p>')
+    <p><span version="0">Hello</span></p><p><span version="0">There</span>
+    <span version="1">Town</span></p>
+    >>> panno('<p>Hi <img src="/foo"> You</p>',
+    ...       '<p>Hi You</p>',
+    ...       '<p>Hi You <img src="/bar"></p>')
+    <p><span version="0">Hi You</span> <span version="2"><img
+    src="/bar"></span></p>
+    >>> panno('<p><a href="/foo">Hey</a></p>',
+    ...       '<p><a href="/bar">Hey</a></p>')
+    <p><a href="/bar"><span version="0">Hey</span></a></p>
+    >>> panno('<p><a href="/foo">Hey You</a></p>',
+    ...       '<p><a href="/foo">Hey Guy</a></p>')
+    <p><a href="/foo"><span version="0">Hey</span> <span
+    version="1">Guy</span></a></p>
+
+Internals
+---------
+
+
+Some utility functions::
+
+    >>> from lxml.html.diff import fixup_ins_del_tags, split_unbalanced, split_trailing_whitespace
+    >>> def pfixup(text):
+    ...     print(fixup_ins_del_tags(text).strip())
+    >>> pfixup('<ins><p>some text <b>and more text</b> and more</p></ins>')
+    <p><ins>some text <b>and more text</b> and more</ins></p>
+    >>> pfixup('<p><ins>Hi!</ins> you</p>')
+    <p><ins>Hi!</ins> you</p>
+    >>> pfixup('<div>Some text <ins>and <p>more text</p></ins> </div>')
+    <div>Some text <ins>and </ins><p><ins>more text</ins></p> </div>
+    >>> pfixup('''
+    ...    <ins><table><tr><td>One table</td><td>More stuff</td></tr></table></ins>''')
+    <table><tr><td><ins>One table</ins></td><td><ins>More stuff</ins></td></tr></table>
+
+
+Testing split_unbalanced::
+
+    >>> split_unbalanced(['<a href="blah">', 'hey', '</a>'])
+    ([], ['<a href="blah">', 'hey', '</a>'], [])
+    >>> split_unbalanced(['<a href="blah">', 'hey'])
+    (['<a href="blah">'], ['hey'], [])
+    >>> split_unbalanced(['Hey', '</i>', 'You', '</b>'])
+    ([], ['Hey', 'You'], ['</i>', '</b>'])
+    >>> split_unbalanced(['So', '</i>', 'Hi', '<b>', 'There', '</b>'])
+    ([], ['So', 'Hi', '<b>', 'There', '</b>'], ['</i>'])
+    >>> split_unbalanced(['So', '</i>', 'Hi', '<b>', 'There'])
+    (['<b>'], ['So', 'Hi', 'There'], ['</i>'])
+    
+
+Testing split_trailing_whitespace::
+
+    >>> split_trailing_whitespace('test\n\n')
+    ('test', '\n\n')
+    >>> split_trailing_whitespace(' test\n ')
+    (' test', '\n ')
+    >>> split_trailing_whitespace('test')
+    ('test', '')
diff --git a/lib/lxml/html/tests/test_elementsoup.py b/lib/lxml/html/tests/test_elementsoup.py
new file mode 100644
index 00000000..01ba46c3
--- /dev/null
+++ b/lib/lxml/html/tests/test_elementsoup.py
@@ -0,0 +1,33 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest, HelperTestCase
+
+try:
+    import BeautifulSoup
+    BS_INSTALLED = True
+except ImportError:
+    BS_INSTALLED = False
+
+if BS_INSTALLED:
+    class SoupParserTestCase(HelperTestCase):
+        from lxml.html import soupparser  # only imported when BeautifulSoup is available
+
+        def test_broken_attribute(self):  # a valueless attribute must survive parsing
+            markup = """\
+              <html><head></head><body>
+                <form><input type='text' disabled size='10'></form>
+              </body></html>
+            """
+            field = self.soupparser.fromstring(markup).find('.//input')
+            self.assertTrue(field.get('disabled') is not None)
+
+
+def test_suite():
+    if not BS_INSTALLED:  # nothing to run without BeautifulSoup
+        return unittest.TestSuite()
+    suite = unittest.TestSuite([unittest.makeSuite(SoupParserTestCase)])
+    if sys.version_info[0] < 3:  # the documentation doctest is only run on Python 2
+        suite.addTest(make_doctest('../../../../doc/elementsoup.txt'))
+    return suite
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/lib/lxml/html/tests/test_feedparser_data.py b/lib/lxml/html/tests/test_feedparser_data.py
new file mode 100644
index 00000000..eaf8c29e
--- /dev/null
+++ b/lib/lxml/html/tests/test_feedparser_data.py
@@ -0,0 +1,98 @@
+import sys
+import os
+import re
+try:
+    from rfc822 import Message
+except ImportError:
+    # Python 3
+    from email import message_from_file as Message
+import unittest
+from lxml.tests.common_imports import doctest
+if sys.version_info >= (2,4):
+    from lxml.doctestcompare import LHTMLOutputChecker
+
+from lxml.html.clean import clean, Cleaner
+
+feed_dirs = [
+    os.path.join(os.path.dirname(__file__), 'feedparser-data'),
+    os.path.join(os.path.dirname(__file__), 'hackers-org-data'),
+    ]
+bar_re = re.compile(r"-----+")
+
+class DummyInput:
+    """Attribute bag: every keyword argument becomes an instance attribute."""
+    def __init__(self, **kw):
+        self.__dict__.update(kw)
+
+class FeedTestCase(unittest.TestCase):
+    """Clean one '.data' sample and compare the result with its expected output."""
+
+    def __init__(self, filename):
+        self.filename = filename
+        unittest.TestCase.__init__(self)
+
+    def parse(self):
+        """Load headers, options, input and expected output from self.filename."""
+        f = open(self.filename, 'r')
+        try:
+            headers = Message(f)
+            c = f.read()
+        finally:  # close the file even when reading or header parsing fails
+            f.close()
+        if not c.strip():  # nothing left after the headers: use the parsed message body
+            c = headers.get_payload()
+        if not headers.keys():
+            raise Exception("File %s has no headers" % self.filename)
+        self.description = headers['Description']
+        self.expect = headers.get('Expect', '')  # NOTE: always replaced further down
+        self.ignore = headers.get('Ignore')
+        self.options = [
+            o.strip() for o in headers.get('Options', '').split(',')
+            if o.strip()]
+        parts = bar_re.split(c)  # split on a run of 5+ dashes: input first, expected second
+        self.input = parts[0].rstrip() + '\n'
+        if parts[1:]:
+            self.expect = parts[1].rstrip() + '\n'
+        else:
+            self.expect = None
+
+    def runTest(self):
+        self.parse()
+        if self.ignore:
+            # We've marked this test to be ignored.
+            return
+        kw = {}
+        for name in self.options:  # "-name" switches a Cleaner option off, "name" on
+            if name.startswith('-'):
+                kw[name[1:]] = False
+            else:
+                kw[name] = True
+        if kw.get('clean', True):
+            transformed = Cleaner(**kw).clean_html(self.input)
+        else:
+            transformed = self.input
+        assert self.expect is not None, "No expected output in %s" % self.filename
+        checker = LHTMLOutputChecker()
+        if not checker.check_output(self.expect, transformed, 0):
+            result = checker.output_difference(
+                DummyInput(want=self.expect), transformed, 0)
+            raise Exception("\n"+result)
+
+    def shortDescription(self):
+        return self.filename
+
+def test_suite():
+    """Collect a FeedTestCase for each '.data' file found in feed_dirs."""
+    suite = unittest.TestSuite()
+    if sys.version_info >= (2,4):
+        for feed_dir in feed_dirs:
+            for fn in os.listdir(feed_dir):
+                if fn.endswith('.data'):
+                    case = FeedTestCase(os.path.join(feed_dir, fn))
+                    suite.addTests([case])
+                    # Lazy way of stopping on first error (ends this directory's scan):
+                    try:
+                        case.runTest()
+                    except Exception:  # let KeyboardInterrupt/SystemExit propagate
+                        break
+    return suite
diff --git a/lib/lxml/html/tests/test_formfill.py b/lib/lxml/html/tests/test_formfill.py
new file mode 100644
index 00000000..7893c20b
--- /dev/null
+++ b/lib/lxml/html/tests/test_formfill.py
@@ -0,0 +1,8 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest
+
+def test_suite():
+    """Return a suite with the test_formfill.txt doctests (Python 2.4+ only)."""
+    if sys.version_info < (2,4):
+        return unittest.TestSuite()
+    return unittest.TestSuite([make_doctest('test_formfill.txt')])
diff --git a/lib/lxml/html/tests/test_formfill.txt b/lib/lxml/html/tests/test_formfill.txt
new file mode 100644
index 00000000..7e1ed6f0
--- /dev/null
+++ b/lib/lxml/html/tests/test_formfill.txt
@@ -0,0 +1,112 @@
+Some basic imports:
+
+    >>> from lxml.html import usedoctest
+    >>> from lxml.html.formfill import fill_form_html
+
+The simplest kind of filling is just filling an input with a value:
+
+    >>> print(fill_form_html('''
+    ... <form><input type="text" name="foo"></form>''', dict(foo='bar')))
+    <form><input type="text" name="foo" value="bar"></form>
+    
+You can also fill multiple inputs, like:
+
+    >>> print(fill_form_html('''
+    ... <form>
+    ...   <input type="text" name="foo">
+    ...   <input type="text" name="foo">
+    ... </form>''', dict(foo=['bar1', 'bar2'])))
+    <form>
+      <input type="text" name="foo" value="bar1">
+      <input type="text" name="foo" value="bar2">
+    </form>
+
+Checkboxes can work either as boolean true/false, or be selected based
+on their inclusion in a set of values::
+
+    >>> print(fill_form_html('''
+    ... <form>
+    ...   Would you like to be spammed?
+    ...   <input type="checkbox" name="spam_me"> <br>
+    ...   Spam you'd like to receive:<br>
+    ...   Viagra spam:
+    ...       <input type="checkbox" name="type" value="viagra"><br>
+    ...   Stock spam:
+    ...       <input type="checkbox" name="type" value="stock"><br>
+    ...   Other spam:
+    ...       <input type="checkbox" name="type" value="other"><br>
+    ...   <input type="submit" value="Spam!">
+    ... </form>''', dict(spam_me=True, type=['viagra', 'other'])))
+    <form>
+      Would you like to be spammed?
+      <input type="checkbox" name="spam_me" checked> <br>
+      Spam you'd like to receive:<br>
+      Viagra spam:
+          <input type="checkbox" name="type" value="viagra" checked><br>
+      Stock spam:
+          <input type="checkbox" name="type" value="stock"><br>
+      Other spam:
+          <input type="checkbox" name="type" value="other" checked><br>
+      <input type="submit" value="Spam!">
+    </form>
+
+FIXME: I need to test more of this.  But I'm lazy and want to use the
+coverage report for some of this.
+
+
+This module also allows you to add error messages to the form.  Each error
+adds an "error" class to the affected input field, and to its label if the
+field has one.  It also inserts an error message into the form, using a
+function you can provide (or the default function).
+
+Example::
+
+    >>> from lxml.html.formfill import insert_errors_html
+    >>> print(insert_errors_html('''
+    ... <form>
+    ...   <fieldset id="fieldset">
+    ...     <input name="v1"><br>
+    ...     <label for="v2">label</label>
+    ...     <input name="v2" id="v2"><br>
+    ...   </fieldset>
+    ...   <input name="v3" class="foo">
+    ...   <input name="v3" class="foo">
+    ...   <input name="v4">
+    ...   <input name="v4">
+    ... </form>''', {
+    ...   'v1': "err1",
+    ...   'v2': "err2",
+    ...   'v3': [None, "err3-2"],
+    ...   'v4': "err4",
+    ...   None: 'general error',
+    ...   '#fieldset': 'area error',
+    ... }))
+    <form>
+      <div class="error-message error-block">general error</div>
+      <fieldset id="fieldset" class="error">
+        <div class="error-message error-block">area error</div>
+        <div class="error-message">err1</div>
+        <input name="v1" class="error"><br>
+        <label for="v2" class="error">label</label>
+        <div class="error-message">err2</div>
+        <input name="v2" id="v2" class="error"><br>
+      </fieldset>
+      <input name="v3" class="foo">
+      <div class="error-message">err3-2</div>
+      <input name="v3" class="foo error">
+      <div class="error-message">err4</div>
+      <input name="v4" class="error">
+      <input name="v4">
+    </form>
+
+
+REGRESSION: When filling textareas, the "name" attribute used to
+be removed. The "name" attribute should be kept::
+
+    >>> print(fill_form_html('''
+    ... <form>
+    ...   <textarea name="foo">Initial value</textarea>
+    ... </form>''', dict(foo="Bar")))
+    <form>
+      <textarea name="foo">Bar</textarea>
+    </form>
diff --git a/lib/lxml/html/tests/test_forms.py b/lib/lxml/html/tests/test_forms.py
new file mode 100644
index 00000000..e8b00c4d
--- /dev/null
+++ b/lib/lxml/html/tests/test_forms.py
@@ -0,0 +1,11 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest
+
+def test_suite():
+    """Return a suite with the test_forms.txt doctests (Python 2.4+ only)."""
+    if sys.version_info < (2,4):
+        return unittest.TestSuite()
+    return unittest.TestSuite([make_doctest('test_forms.txt')])
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/lib/lxml/html/tests/test_forms.txt b/lib/lxml/html/tests/test_forms.txt
new file mode 100644
index 00000000..25c6529a
--- /dev/null
+++ b/lib/lxml/html/tests/test_forms.txt
@@ -0,0 +1,195 @@
+>>> from lxml.html import usedoctest
+>>> from lxml.html import fromstring, tostring
+>>> h = fromstring('''<html><body>
+... <form action="test">
+...   <input type="hidden" name="hidden_field" value="hidden_value">
+...   <input type="text" name="text_field" value="text_value">
+...   <input type="checkbox" name="single_checkbox">
+...   <input type="checkbox" name="single_checkbox2" value="good">
+...   <input type="checkbox" name="check_group" value="1">
+...   <input type="checkbox" name="check_group" value="2" checked>
+...   <input type="checkbox" name="check_group" value="3" checked>
+...   <input type="checkbox" name="check_group" value="4">
+...   <textarea name="textarea_field">some text</textarea>
+...   <label for="value1">value 1</label>
+...     <input type="radio" name="radios" value="value1" id="value1">
+...   <label for="value2">value 2</label>
+...     <input type="radio" name="radios" value="value2" id="value2">
+...   <label for="value3">value 3</label>
+...     <input type="radio" name="radios" value="value3" id="value3" checked>
+...   <select name="select1">
+...     <option> No value </option>
+...     <option value="">Empty</option>
+...     <option value="1">number 1</option>
+...   </select>
+...   <select name="select2" multiple>
+...     <option value="1">number 1</option>
+...     <option value="2">number 2</option>
+...     <option value="3">number 3</option>
+...     <option>number 4</option>
+...   </select>
+...   <input type="submit" name="submit1" value="submit">
+...   <input type="submit" name="submit2" value="submit">
+...   <input type="reset" name="reset1">linksys
+... </form>
+... </body></html>''', base_url='http://example.org/form.html')
+>>> h.base_url
+u'http://example.org/form.html'
+>>> f = h.forms[0]
+>>> f.action
+u'http://example.org/test'
+>>> f.method
+'GET'
+>>> f.inputs # doctest:+NOPARSE_MARKUP
+<InputGetter for form 0>
+>>> hidden = f.inputs['hidden_field']
+>>> hidden.checkable
+False
+>>> hidden.value
+'hidden_value'
+>>> hidden.value = 'new value'
+>>> tostring(hidden, with_tail=False)
+b'<input type="hidden" name="hidden_field" value="new value">'
+>>> checkbox = f.inputs['single_checkbox']
+>>> checkbox.checkable
+True
+>>> checkbox.type
+'checkbox'
+>>> checkbox.checked
+False
+>>> print(checkbox.value)
+None
+>>> checkbox.checked = True
+>>> checkbox.value
+'on'
+>>> tostring(checkbox, with_tail=False)
+b'<input type="checkbox" name="single_checkbox" checked>'
+>>> checkbox2 = f.inputs['single_checkbox2']
+>>> checkbox2.checked = True
+>>> checkbox2.value
+'good'
+>>> group = f.inputs['check_group']
+>>> group.value # doctest:+NOPARSE_MARKUP
+<CheckboxValues {'2', '3'} for checkboxes name='check_group'>
+>>> group.value.add('1')
+>>> group.value # doctest:+NOPARSE_MARKUP
+<CheckboxValues {'1', '2', '3'} for checkboxes name='check_group'>
+>>> tostring(group[0], with_tail=False)
+b'<input type="checkbox" name="check_group" value="1" checked>'
+>>> group.value_options
+['1', '2', '3', '4']
+>>> group.value.add('doesnotexist')
+Traceback (most recent call last):
+    ...
+KeyError: "No checkbox with value 'doesnotexist'"
+>>> textarea = f.inputs['textarea_field']
+>>> textarea.value
+'some text'
+>>> radios = f.inputs['radios']
+>>> radios[0].label.text
+'value 1'
+>>> radios.value
+'value3'
+>>> radios.value = 'value1'
+>>> radios.value
+'value1'
+>>> tostring(radios[0], with_tail=False)
+b'<input type="radio" name="radios" value="value1" id="value1" checked>'
+>>> radios.value = None
+>>> tostring(radios[0], with_tail=False)
+b'<input type="radio" name="radios" value="value1" id="value1">'
+>>> radios.value_options
+['value1', 'value2', 'value3']
+>>> select = f.inputs['select1']
+>>> print(select.value)
+None
+>>> select.value = ""
+>>> select.value
+''
+>>> select.value = 'asdf'
+Traceback (most recent call last):
+    ...
+ValueError: There is no option with the value of 'asdf'
+>>> select.value_options
+['No value', '', '1']
+>>> select.value = 'No value'
+>>> select.value
+'No value'
+>>> select = f.inputs['select2']
+>>> select.value # doctest:+NOPARSE_MARKUP
+<MultipleSelectOptions {} for select name='select2'>
+>>> select.value.update(['2', '3'])
+>>> select.value # doctest:+NOPARSE_MARKUP
+<MultipleSelectOptions {'2', '3'} for select name='select2'>
+>>> select.value.remove('3')
+>>> select.value.add('asdf')
+Traceback (most recent call last):
+    ...
+ValueError: There is no option with the value 'asdf'
+>>> select.value.add('number 4')
+>>> select.value # doctest:+NOPARSE_MARKUP
+<MultipleSelectOptions {'2', 'number 4'} for select name='select2'>
+>>> select.value.remove('number 4')
+>>> select.value_options
+['1', '2', '3', 'number 4']
+>>> try: from urllib import urlencode
+... except ImportError: from urllib.parse import urlencode
+>>> print(urlencode(f.form_values()))
+hidden_field=new+value&text_field=text_value&single_checkbox=on&single_checkbox2=good&check_group=1&check_group=2&check_group=3&textarea_field=some+text&select1=No+value&select2=2
+>>> fields = f.fields
+>>> fields # doctest:+NOPARSE_MARKUP
+<FieldsDict for form 0>
+>>> for name, value in sorted(fields.items()):
+...     print('%s: %r' % (name, value))
+check_group: <CheckboxValues {'1', '2', '3'} for checkboxes name='check_group'>
+hidden_field: 'new value'
+radios: None
+reset1: None
+select1: 'No value'
+select2: <MultipleSelectOptions {'2'} for select name='select2'>
+single_checkbox: 'on'
+single_checkbox2: 'good'
+submit1: 'submit'
+submit2: 'submit'
+text_field: 'text_value'
+textarea_field: 'some text'
+
+>>> import lxml.html
+>>> tree = lxml.html.fromstring('''
+... <html><body>
+...  <form>
+...   <input name="foo" value="bar"/>
+...   <input type="submit" />
+...  </form>
+... </body></html>
+... ''')
+>>> tree # doctest: +ELLIPSIS
+<Element html at ...>
+>>> tree.forms[0] # doctest: +ELLIPSIS
+<Element form at ...>
+>>> tree.forms[0].fields # doctest: +NOPARSE_MARKUP
+<FieldsDict for form 0>
+>>> list(tree.forms[0].fields.keys())
+['foo']
+>>> list(tree.forms[0].fields.items())
+[('foo', 'bar')]
+>>> list(tree.forms[0].fields.values())
+['bar']
+
+>>> tree = lxml.html.fromstring('''
+... <html><body>
+...  <form>
+...   <textarea name="foo">some <b>text<br>content</b> with tags</textarea>
+...  </form>
+... </body></html>
+... ''')
+>>> list(tree.forms[0].fields.keys())
+['foo']
+>>> ta = tree.forms[0].inputs['foo']
+>>> print(ta.value)
+some <b>text<br>content</b> with tags
+>>> ta.value = 'abc<br>def'
+>>> print(ta.value)
+abc<br>def
+>>> len(ta)
+0
diff --git a/lib/lxml/html/tests/test_frames.py b/lib/lxml/html/tests/test_frames.py
new file mode 100644
index 00000000..2eeb844e
--- /dev/null
+++ b/lib/lxml/html/tests/test_frames.py
@@ -0,0 +1,36 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest, doctest
+import lxml.html
+from lxml.html import html_parser, XHTML_NAMESPACE
+
+class FrameTest(unittest.TestCase):
+
+    def test_parse_fragments_fromstring(self):
+        # A bare frameset must come back as the single parsed fragment.
+        parser = lxml.html.HTMLParser(encoding='utf-8', remove_comments=True)
+        markup = """<frameset>
+            <frame src="main.php" name="srcpg" id="srcpg" frameborder="0" rolling="Auto" marginwidth="" marginheight="0">
+        </frameset>"""
+        fragments = lxml.html.fragments_fromstring(markup, parser=parser)
+        self.assertEqual(len(fragments), 1)
+        frameset = fragments[0]
+        self.assertEqual(frameset.tag, "frameset")
+        self.assertEqual(frameset[0].tag, 'frame')
+
+    def test_parse_fromstring(self):
+        # With an explicit <html> root the frameset must be its only child.
+        parser = lxml.html.HTMLParser(encoding='utf-8', remove_comments=True)
+        markup = """<html><frameset>
+            <frame src="main.php" name="srcpg" id="srcpg" frameborder="0" rolling="Auto" marginwidth="" marginheight="0">
+        </frameset></html>"""
+        document = lxml.html.fromstring(markup, parser=parser)
+        self.assertEqual(document.tag, 'html')
+        self.assertEqual(len(document), 1)
+        frameset = document[0]
+        self.assertEqual(len(frameset), 1)
+        self.assertEqual(frameset[0].tag, 'frame')
+
+
+def test_suite():
+    """Return every test case defined in this module as one suite."""
+    return unittest.TestLoader().loadTestsFromModule(sys.modules[__name__])
\ No newline at end of file
diff --git a/lib/lxml/html/tests/test_html5parser.py b/lib/lxml/html/tests/test_html5parser.py
new file mode 100644
index 00000000..fad45dc4
--- /dev/null
+++ b/lib/lxml/html/tests/test_html5parser.py
@@ -0,0 +1,429 @@
+import os
+import imp
+try:
+    from StringIO import StringIO
+except ImportError:                     # python 3
+    from io import StringIO
+import sys
+import tempfile
+import unittest
+try:
+    from unittest import skipUnless
+except ImportError:
+    # sys.version < (2, 7)
+    def skipUnless(condition, reason):  # minimal fallback; 'reason' is not used
+        return lambda f: condition and f or None  # keep f if condition holds, else replace it with None
+
+if sys.version_info < (2,6):
+    class NamedTemporaryFile(object):  # wrapper used when sys.version_info < (2, 6)
+        def __init__(self, delete=True, **kwargs):  # 'delete' is accepted but not forwarded
+            self._tmpfile = tempfile.NamedTemporaryFile(**kwargs)
+        def close(self):  # only flushes; the wrapped file is not closed here
+            self._tmpfile.flush()
+        def __getattr__(self, name):  # every other attribute is delegated to the wrapped file
+            return getattr(self._tmpfile, name)
+else:
+    NamedTemporaryFile = tempfile.NamedTemporaryFile
+
+from lxml.builder import ElementMaker
+from lxml.etree import Element, ElementTree, ParserError
+from lxml.html import html_parser, XHTML_NAMESPACE
+
+try:
+    import urlparse
+except ImportError:
+    import urllib.parse as urlparse 
+    
+try:
+    from urllib import pathname2url
+except ImportError:
+    from urllib.request import pathname2url
+    
+
+def path2url(path):  # build a 'file:' URL from a local filesystem path
+    return urlparse.urljoin(
+        'file:', pathname2url(path))
+
+
+try:
+    import html5lib
+except ImportError:
+    html5lib = None
+
+    class BogusModules(object):  # import hook (finder and loader in one) that serves fake modules
+        # See PEP 302 for details on how this works
+        def __init__(self, mocks):  # mocks: {module name: dict of attributes to install}
+            self.mocks = mocks
+
+        def find_module(self, fullname, path=None):  # 'path' is ignored
+            if fullname in self.mocks:
+                return self  # this object also acts as the loader
+            return None
+
+        def load_module(self, fullname):  # NOTE(review): 'imp' and find_module/load_module are legacy import APIs -- confirm targeted Pythons still have them
+            mod = sys.modules.setdefault(fullname, imp.new_module(fullname))  # reuse an existing entry if present
+            mod.__file__, mod.__loader__, mod.__path__ = "<dummy>", self, []
+            mod.__dict__.update(self.mocks[fullname])  # install the fake attributes
+            return mod
+
+    # Fake just enough of html5lib so that html5parser.py is importable
+    # without errors.
+    sys.meta_path.append(BogusModules({
+        'html5lib': {
+            # A do-nothing HTMLParser class
+            'HTMLParser': type('HTMLParser', (object,), {
+                '__init__': lambda self, **kw: None,
+                }),
+            },
+        'html5lib.treebuilders': {
+            },
+        'html5lib.treebuilders.etree_lxml': {
+            'TreeBuilder': 'dummy treebuilder',
+            },
+        }))
+
+
+class Test_HTMLParser(unittest.TestCase):
+    def make_one(self, **kwargs):
+        from lxml.html.html5parser import HTMLParser
+        return HTMLParser(**kwargs)
+
+    @skipUnless(html5lib, 'html5lib is not installed')
+    def test_integration(self):
+        parser = self.make_one(strict=True)
+        tree = parser.parse(XHTML_TEST_DOCUMENT)
+        root = tree.getroot()
+        self.assertEqual(root.tag, xhtml_tag('html'))
+
+
+class Test_XHTMLParser(unittest.TestCase):
+    def make_one(self, **kwargs):  # imports lazily, at call time
+        from lxml.html.html5parser import XHTMLParser
+        return XHTMLParser(**kwargs)
+
+    @skipUnless(hasattr(html5lib, 'XHTMLParser'),
+                'xhtml5lib does not have XHTMLParser')
+    def test_integration(self):
+        # XXX: This test is untested. (html5lib no longer has an XHTMLParser)
+        parser = self.make_one(strict=True)
+        tree = parser.parse(XHTML_TEST_DOCUMENT)
+        root = tree.getroot()
+        self.assertEqual(root.tag, xhtml_tag('html'))
+
+
+class Test_document_fromstring(unittest.TestCase):
+    def call_it(self, *args, **kwargs):
+        from lxml.html.html5parser import document_fromstring
+        return document_fromstring(*args, **kwargs)
+
+    def test_basic(self):
+        parser = DummyParser(doc=DummyElementTree(root='dummy root'))
+        elem = self.call_it('dummy input', parser=parser)
+        self.assertEqual(elem, 'dummy root')
+        self.assertEqual(parser.parse_args, ('dummy input',))
+        self.assertEqual(parser.parse_kwargs, {'useChardet': True})
+
+    def test_guess_charset_arg_gets_passed_to_parser(self):
+        parser = DummyParser()
+        elem = self.call_it('', guess_charset='gc_arg', parser=parser)
+        self.assertEqual(parser.parse_kwargs, {'useChardet': 'gc_arg'})
+
+    def test_raises_type_error_on_nonstring_input(self):
+        not_a_string = None
+        self.assertRaises(TypeError, self.call_it, not_a_string)
+
+    @skipUnless(html5lib, 'html5lib is not installed')
+    def test_integration(self):
+        elem = self.call_it(XHTML_TEST_DOCUMENT)
+        self.assertEqual(elem.tag, xhtml_tag('html'))
+
+
+class Test_fragments_fromstring(unittest.TestCase):
+    def call_it(self, *args, **kwargs):
+        from lxml.html.html5parser import fragments_fromstring
+        return fragments_fromstring(*args, **kwargs)
+
+    def test_basic(self):
+        parser = DummyParser(fragments='fragments')
+        fragments = self.call_it('dummy input', parser=parser)
+        self.assertEqual(fragments, 'fragments')
+
+    def test_guess_charset_arg_gets_passed_to_parser(self):
+        parser = DummyParser()
+        elem = self.call_it('', guess_charset='gc_arg', parser=parser)
+        self.assertEqual(parser.parseFragment_kwargs, {'useChardet': 'gc_arg'})
+
+    def test_raises_type_error_on_nonstring_input(self):
+        not_a_string = None
+        self.assertRaises(TypeError, self.call_it, not_a_string)
+
+    def test_no_leading_text_strips_empty_leading_text(self):
+        parser = DummyParser(fragments=['', 'tail'])
+        fragments = self.call_it('', parser=parser, no_leading_text=True)
+        self.assertEqual(fragments, ['tail'])
+
+    def test_no_leading_text_raises_error_if_leading_text(self):
+        parser = DummyParser(fragments=['leading text', 'tail'])
+        self.assertRaises(ParserError, self.call_it,
+                          '', parser=parser, no_leading_text=True)
+
+    @skipUnless(html5lib, 'html5lib is not installed')
+    def test_integration(self):
+        fragments = self.call_it('a<b>c</b>')
+        self.assertEqual(len(fragments), 2)
+        self.assertEqual(fragments[0], 'a')
+        self.assertEqual(fragments[1].tag, xhtml_tag('b'))
+
+
+class Test_fragment_fromstring(unittest.TestCase):
+    def call_it(self, *args, **kwargs):
+        from lxml.html.html5parser import fragment_fromstring
+        return fragment_fromstring(*args, **kwargs)
+
+    def test_basic(self):
+        element = DummyElement()
+        parser = DummyParser(fragments=[element])
+        self.assertEqual(self.call_it('html', parser=parser), element)
+
+    def test_raises_type_error_on_nonstring_input(self):
+        not_a_string = None
+        self.assertRaises(TypeError, self.call_it, not_a_string)
+
+    def test_create_parent(self):
+        parser = DummyParser(fragments=['head', Element('child')])
+        elem = self.call_it('html', parser=parser, create_parent='parent')
+        self.assertEqual(elem.tag, 'parent')
+        self.assertEqual(elem.text, 'head')
+        self.assertEqual(elem[0].tag, 'child')
+
+    def test_create_parent_default_type_no_ns(self):
+        parser = DummyParser(fragments=[], namespaceHTMLElements=False)
+        elem = self.call_it('html', parser=parser, create_parent=True)
+        self.assertEqual(elem.tag, 'div')
+
+    def test_raises_error_on_leading_text(self):
+        parser = DummyParser(fragments=['leading text'])
+        self.assertRaises(ParserError, self.call_it, 'html', parser=parser)
+
+    def test_raises_error_if_no_elements_found(self):
+        parser = DummyParser(fragments=[])
+        self.assertRaises(ParserError, self.call_it, 'html', parser=parser)
+
+    def test_raises_error_if_multiple_elements_found(self):
+        parser = DummyParser(fragments=[DummyElement(), DummyElement()])
+        self.assertRaises(ParserError, self.call_it, 'html', parser=parser)
+
+    def test_raises_error_if_tail(self):
+        parser = DummyParser(fragments=[DummyElement(tail='tail')])
+        self.assertRaises(ParserError, self.call_it, 'html', parser=parser)
+
+
+class Test_fromstring(unittest.TestCase):
+    def call_it(self, *args, **kwargs):
+        from lxml.html.html5parser import fromstring
+        return fromstring(*args, **kwargs)
+
+    def test_returns_whole_doc_if_input_contains_html_tag(self):
+        parser = DummyParser(root='the doc')
+        self.assertEqual(self.call_it('<html></html>', parser=parser),
+                         'the doc')
+
+    def test_returns_whole_doc_if_input_contains_doctype(self):
+        parser = DummyParser(root='the doc')
+        self.assertEqual(self.call_it('<!DOCTYPE html>', parser=parser),
+                         'the doc')
+
+    def test_returns_whole_doc_if_head_not_empty(self, use_ns=True):
+        E = HTMLElementMaker(namespaceHTMLElements=use_ns)
+        root = E.html(E.head(E.title()))
+        parser = DummyParser(root=root)
+        self.assertEqual(self.call_it('', parser=parser), root)
+
+    def test_returns_whole_doc_if_head_not_empty_no_ns(self):
+        self.test_returns_whole_doc_if_head_not_empty(use_ns=False)
+
+    def test_returns_unwraps_body_if_single_element(self):
+        E = HTMLElementMaker()
+        elem = E.p('test')
+        root = E.html(E.head(), E.body(elem))
+        parser = DummyParser(root=root)
+        self.assertEqual(self.call_it('', parser=parser), elem)
+
+    def test_returns_body_if_has_text(self):
+        E = HTMLElementMaker()
+        elem = E.p('test')
+        body = E.body('text', elem)
+        root = E.html(E.head(), body)
+        parser = DummyParser(root=root)
+        self.assertEqual(self.call_it('', parser=parser), body)
+
+    def test_returns_body_if_single_element_has_tail(self):
+        E = HTMLElementMaker()
+        elem = E.p('test')
+        elem.tail = 'tail'
+        body = E.body(elem)
+        root = E.html(E.head(), body)
+        parser = DummyParser(root=root)
+        self.assertEqual(self.call_it('', parser=parser), body)
+
+    def test_wraps_multiple_fragments_in_div_no_ns(self):
+        E = HTMLElementMaker(namespaceHTMLElements=False)
+        parser = DummyParser(root=E.html(E.head(), E.body(E.h1(), E.p())),
+                             namespaceHTMLElements=False)
+        elem = self.call_it('', parser=parser)
+        self.assertEqual(elem.tag, 'div')
+
+    def test_wraps_multiple_fragments_in_span_no_ns(self):
+        E = HTMLElementMaker(namespaceHTMLElements=False)
+        parser = DummyParser(root=E.html(E.head(), E.body('foo', E.a('link'))),
+                             namespaceHTMLElements=False)
+        elem = self.call_it('', parser=parser)
+        self.assertEqual(elem.tag, 'span')
+
+    def test_raises_type_error_on_nonstring_input(self):
+        not_a_string = None
+        self.assertRaises(TypeError, self.call_it, not_a_string)
+
+    @skipUnless(html5lib, 'html5lib is not installed')
+    def test_integration_whole_doc(self):
+        elem = self.call_it(XHTML_TEST_DOCUMENT)
+        self.assertEqual(elem.tag, xhtml_tag('html'))
+
+    @skipUnless(html5lib, 'html5lib is not installed')
+    def test_integration_single_fragment(self):
+        elem = self.call_it('<p></p>')
+        self.assertEqual(elem.tag, xhtml_tag('p'))
+
+
+class Test_parse(unittest.TestCase):
+    def call_it(self, *args, **kwargs):
+        from lxml.html.html5parser import parse
+        return parse(*args, **kwargs)
+
+    def make_temp_file(self, contents=''):
+        tmpfile = NamedTemporaryFile(delete=False)
+        try:
+            tmpfile.write(contents.encode('utf8'))
+            tmpfile.flush()
+            tmpfile.seek(0)
+            return tmpfile
+        except Exception:
+            try:
+                tmpfile.close()
+            finally:
+                os.unlink(tempfile.name)
+            raise
+
+    def test_with_file_object(self):
+        parser = DummyParser(doc='the doc')
+        fp = open(__file__)
+        try:
+            self.assertEqual(self.call_it(fp, parser=parser), 'the doc')
+            self.assertEqual(parser.parse_args, (fp,))
+        finally:
+            fp.close()
+
+    def test_with_file_name(self):
+        parser = DummyParser(doc='the doc')
+        tmpfile = self.make_temp_file('data')
+        try:
+            data = tmpfile.read()
+        finally:
+            tmpfile.close()
+        try:
+            self.assertEqual(self.call_it(tmpfile.name, parser=parser), 'the doc')
+            fp, = parser.parse_args
+            try:
+                self.assertEqual(fp.read(), data)
+            finally:
+                fp.close()
+        finally:
+            os.unlink(tmpfile.name)
+
+    def test_with_url(self):
+        parser = DummyParser(doc='the doc')
+        tmpfile = self.make_temp_file('content')
+        try:
+            data = tmpfile.read()
+        finally:
+            tmpfile.close()
+        try:
+            url = path2url(tmpfile.name)
+            self.assertEqual(self.call_it(url, parser=parser), 'the doc')
+            fp, = parser.parse_args
+            try:
+                self.assertEqual(fp.read(), data)
+            finally:
+                fp.close()
+        finally:
+            os.unlink(tmpfile.name)
+
+    @skipUnless(html5lib, 'html5lib is not installed')
+    def test_integration(self):
+        doc = self.call_it(StringIO(XHTML_TEST_DOCUMENT))
+        root = doc.getroot()
+        self.assertEqual(root.tag, xhtml_tag('html'))
+
+
+def test_suite():
+    loader = unittest.TestLoader()
+    return loader.loadTestsFromModule(sys.modules[__name__])
+
+
+class HTMLElementMaker(ElementMaker):
+    def __init__(self, namespaceHTMLElements=True):
+        initargs = dict(makeelement=html_parser.makeelement)
+        if namespaceHTMLElements:
+            initargs.update(namespace=XHTML_NAMESPACE,
+                            nsmap={None: XHTML_NAMESPACE})
+        ElementMaker.__init__(self, **initargs)
+
+
+class DummyParser(object):  # stand-in parser passed as parser= by the tests in this file
+    def __init__(self, doc=None, root=None,
+                 fragments=None, namespaceHTMLElements=True):
+        self.doc = doc or DummyElementTree(root=root)  # falsy doc -> dummy tree wrapping 'root'
+        self.fragments = fragments
+        self.tree = DummyTreeBuilder(namespaceHTMLElements)
+
+    def parse(self, *args, **kwargs):  # records the call arguments, returns the canned doc
+        self.parse_args = args
+        self.parse_kwargs = kwargs
+        return self.doc
+
+    def parseFragment(self, *args, **kwargs):  # records the call arguments, returns the canned fragments
+        self.parseFragment_args = args
+        self.parseFragment_kwargs = kwargs
+        return self.fragments
+
+
+class DummyTreeBuilder(object):
+    def __init__(self, namespaceHTMLElements=True):
+        self.namespaceHTMLElements = namespaceHTMLElements
+
+
+class DummyElementTree(object):
+    def __init__(self, root):
+        self.root = root
+
+    def getroot(self):
+        return self.root
+
+
+class DummyElement(object):
+    def __init__(self, tag='tag', tail=None):
+        self.tag = tag
+        self.tail = tail
+
+
+def xhtml_tag(tag):
+    return '{%s}%s' % (XHTML_NAMESPACE, tag)
+
+
+XHTML_TEST_DOCUMENT = '''
+    <!DOCTYPE html>
+    <html>
+    <head><title>TITLE</title></head>
+    <body></body>
+    </html>
+    '''
diff --git a/lib/lxml/html/tests/test_rewritelinks.py b/lib/lxml/html/tests/test_rewritelinks.py
new file mode 100644
index 00000000..b4653234
--- /dev/null
+++ b/lib/lxml/html/tests/test_rewritelinks.py
@@ -0,0 +1,11 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest
+
+def test_suite():
+    suite = unittest.TestSuite()
+    if sys.version_info >= (2,4):
+        suite.addTests([make_doctest('test_rewritelinks.txt')])
+    return suite
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/lib/lxml/html/tests/test_rewritelinks.txt b/lib/lxml/html/tests/test_rewritelinks.txt
new file mode 100644
index 00000000..d8324de1
--- /dev/null
+++ b/lib/lxml/html/tests/test_rewritelinks.txt
@@ -0,0 +1,245 @@
+
+Setup::
+
+    >>> import lxml.html
+
+We'll define a link translation function:
+
+    >>> base_href = 'http://old/base/path.html'
+    >>> try: import urlparse
+    ... except ImportError: import urllib.parse as urlparse
+    >>> def relocate_href(link):
+    ...     link = urlparse.urljoin(base_href, link)
+    ...     if link.startswith('http://old'):
+    ...         return 'https://new' + link[len('http://old'):]
+    ...     else:
+    ...         return link
+
+Now for content.  To make it easier on us, the ``usedoctest`` import below
+takes care of comparing the normalized HTML we get from these functions.
+
+Some basics::
+
+    >>> from lxml.html import usedoctest, tostring
+    >>> from lxml.html import rewrite_links
+    >>> print(rewrite_links(
+    ...     '<a href="http://old/blah/blah.html">link</a>', relocate_href))
+    <a href="https://new/blah/blah.html">link</a>
+    >>> print(rewrite_links(
+    ...     '<script src="http://old/foo.js"></script>', relocate_href))
+    <script src="https://new/foo.js"></script>
+    >>> print(rewrite_links(
+    ...     '<link href="foo.css">', relocate_href))
+    <link href="https://new/base/foo.css">
+    >>> print(rewrite_links('''\
+    ... <base href="http://blah/stuff/index.html">
+    ... <link href="foo.css">
+    ... <a href="http://old/bar.html">x</a>\
+    ... ''', relocate_href))
+    <link href="http://blah/stuff/foo.css">
+    <a href="https://new/bar.html">x</a>
+
+Links in CSS are also handled::
+
+    >>> print(rewrite_links('''
+    ... <style>
+    ...   body {background-image: url(http://old/image.gif)};
+    ...   @import "http://old/other-style.css";
+    ... </style>''', relocate_href))
+    <html><head><style>
+      body {background-image: url(https://new/image.gif)};
+      @import "https://new/other-style.css";
+    </style></head></html>
+    >>> print(rewrite_links('''
+    ... <style>
+    ...   body {background-image: url("http://old/image.gif")};
+    ...   @import "http://old/other-style.css";
+    ... </style>''', relocate_href))
+    <html><head><style>
+      body {background-image: url("https://new/image.gif")};
+      @import "https://new/other-style.css";
+    </style></head></html>
+
+Those links in style attributes are also rewritten::
+
+    >>> print(rewrite_links('''
+    ... <div style="background-image: url(http://old/image.gif)">text</div>
+    ... ''', relocate_href))
+    <div style="background-image: url(https://new/image.gif)">text</div>
+
+The ``<base href>`` tag is also respected (but also removed)::
+
+    >>> print(rewrite_links('''
+    ... <html><head>
+    ...  <base href="http://old/">
+    ... </head>
+    ... <body>
+    ...  <a href="foo.html">link</a>
+    ... </body></html>''', relocate_href))
+    <html>
+     <head></head>
+     <body>
+      <a href="https://new/foo.html">link</a>
+     </body>
+    </html>
+
+The ``iterlinks`` method (and function) gives you all the links in
+the document, along with the element and attribute the link comes
+from.  This makes it fairly easy to see what resources the document
+references or embeds (an ``<a>`` tag is a reference, an ``<img>`` tag
+is something embedded).  It returns a generator of ``(element, attrib,
+link)``, which is awkward to test here, so we'll make a printer::
+
+    >>> from lxml.html import iterlinks, document_fromstring, tostring
+    >>> def print_iter(seq):
+    ...     for element, attrib, link, pos in seq:
+    ...         if pos:
+    ...             extra = '@%s' % pos
+    ...         else:
+    ...             extra = ''
+    ...         print('%s %s="%s"%s' % (element.tag, attrib, link, extra))
+    >>> print_iter(iterlinks('''
+    ... <html>
+    ...  <head>
+    ...   <link rel="stylesheet" href="style.css">
+    ...   <style type="text/css">
+    ...     body {
+    ...       background-image: url(/bg.gif);
+    ...     }
+    ...     @import "/other-styles.css";
+    ...   </style>
+    ...   <script src="/js-funcs.js"></script>
+    ...  </head>
+    ...  <body>
+    ...   <table>
+    ...    <tr><td><ul>
+    ...     <li><a href="/test.html">Test stuff</a></li>
+    ...     <li><a href="/other.html">Other stuff</a></li>
+    ...    </td></tr>
+    ...    <td style="background-image: url(/td-bg.png)">
+    ...      <img src="/logo.gif">
+    ...      Hi world!
+    ...    </td></tr>
+    ...   </table>
+    ...  </body></html>'''))
+    link href="style.css"
+    style None="/other-styles.css"@69
+    style None="/bg.gif"@40
+    script src="/js-funcs.js"
+    a href="/test.html"
+    a href="/other.html"
+    td style="/td-bg.png"@22
+    img src="/logo.gif"
+
+An application of ``iterlinks()`` is ``make_links_absolute()``::
+
+    >>> from lxml.html import make_links_absolute
+    >>> print(make_links_absolute('''
+    ... <html>
+    ...  <head>
+    ...   <link rel="stylesheet" href="style.css">
+    ...   <style type="text/css">
+    ...     body {
+    ...       background-image: url(/bg.gif);
+    ...     }
+    ...     @import "/other-styles.css";
+    ...   </style>
+    ...   <script src="/js-funcs.js"></script>
+    ...  </head>
+    ...  <body>
+    ...   <table>
+    ...    <tr><td><ul>
+    ...     <li><a href=" /test.html">Test stuff</a></li>
+    ...     <li><a href="/other.html ">Other stuff</a></li>
+    ...    </td></tr>
+    ...    <tr><td style="background-image: url( /td-bg.png )">
+    ...      <img src="logo.gif">
+    ...      Hi world!
+    ...    </td></tr>
+    ...   </table>
+    ...  </body></html>''',
+    ... base_url="http://my.little.server/url/"))
+    <html>
+     <head>
+      <link rel="stylesheet" href="http://my.little.server/url/style.css">
+      <style type="text/css">
+        body {
+          background-image: url(http://my.little.server/bg.gif);
+        }
+        @import "http://my.little.server/other-styles.css";
+      </style>
+      <script src="http://my.little.server/js-funcs.js"></script>
+     </head>
+     <body>
+      <table>
+       <tr><td><ul>
+        <li><a href="http://my.little.server/test.html">Test stuff</a></li>
+        <li><a href="http://my.little.server/other.html">Other stuff</a></li>
+       </ul></td></tr>
+       <tr>
+         <td style="background-image: url(http://my.little.server/td-bg.png)">
+          <img src="http://my.little.server/url/logo.gif">
+          Hi world!
+       </td></tr>
+      </table>
+     </body>
+    </html>
+
+### Test disabled to support Py2.6 and earlier
+#If the document contains invalid links, you may choose to "discard" or "ignore"
+#them by passing the respective option into the ``handle_failures`` argument::
+#
+#    >>> html = lxml.html.fromstring ('''\
+#    ... <html><body><div>
+#    ...     <a href="http://fancybase.com]Buy">test2</a>
+#    ... </div></body></html>''')
+#
+#    >>> html.make_links_absolute(base_url="http://my.little.server/url/",
+#    ...                          handle_failures="discard")
+#
+#    >>> print(lxml.html.tostring (html, pretty_print=True, encoding='unicode'))
+#    <html><body><div>
+#        <a>test2</a>
+#    </div></body></html>
+
+Check if we can replace multiple links inside of the same text string::
+
+    >>> html = lxml.html.fromstring ("""\
+    ... <html>
+    ...   <head>
+    ...      <title>Test</title>
+    ...      <style type='text/css'>
+    ...        .bg1 {
+    ...            background: url(images/bg1.png);
+    ...        }
+    ...        .bg2 {
+    ...            background: url(images/bg2.png);
+    ...        }
+    ...      </style>
+    ...   </head>
+    ...   <body>
+    ...      <p>Hi</p>
+    ...   </body>
+    ... </html>
+    ... """,
+    ... base_url = 'http://www.example.com/')
+
+    >>> html.make_links_absolute ()
+
+    >>> print(lxml.html.tostring (html, pretty_print=True, encoding='unicode'))
+    <html>
+      <head>
+        <title>Test</title>
+        <style type="text/css">
+          .bg1 {
+            background: url(http://www.example.com/images/bg1.png);
+          }
+          .bg2 {
+            background: url(http://www.example.com/images/bg2.png);
+          }
+        </style>
+      </head>
+      <body>
+        <p>Hi</p>
+      </body>
+    </html>
diff --git a/lib/lxml/html/tests/test_xhtml.py b/lib/lxml/html/tests/test_xhtml.py
new file mode 100644
index 00000000..dc34aa70
--- /dev/null
+++ b/lib/lxml/html/tests/test_xhtml.py
@@ -0,0 +1,11 @@
+import unittest, sys
+from lxml.tests.common_imports import make_doctest
+import lxml.html
+
+def test_suite():
+    suite = unittest.TestSuite()
+    suite.addTests([make_doctest('test_xhtml.txt')])
+    return suite
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/lib/lxml/html/tests/test_xhtml.txt b/lib/lxml/html/tests/test_xhtml.txt
new file mode 100644
index 00000000..db022101
--- /dev/null
+++ b/lib/lxml/html/tests/test_xhtml.txt
@@ -0,0 +1,30 @@
+    >>> from lxml.html import document_fromstring, fragment_fromstring, tostring
+
+lxml.html has two parsers, one for HTML, one for XHTML:
+
+    >>> from lxml.html import HTMLParser, XHTMLParser
+    >>> html = "<html><body><p>Hi!</p></body></html>"
+
+    >>> root = document_fromstring(html, parser=HTMLParser())
+    >>> print(root.tag)
+    html
+
+    >>> root = document_fromstring(html, parser=XHTMLParser())
+    >>> print(root.tag)
+    html
+
+There are two functions for converting between HTML and XHTML:
+
+    >>> from lxml.html import xhtml_to_html, html_to_xhtml
+
+    >>> doc = document_fromstring(html, parser=HTMLParser())
+    >>> tostring(doc)
+    b'<html><body><p>Hi!</p></body></html>'
+
+    >>> html_to_xhtml(doc)
+    >>> tostring(doc)
+    b'<html:html xmlns:html="http://www.w3.org/1999/xhtml"><html:body><html:p>Hi!</html:p></html:body></html:html>'
+
+    >>> xhtml_to_html(doc)
+    >>> tostring(doc)
+    b'<html xmlns:html="http://www.w3.org/1999/xhtml"><body><p>Hi!</p></body></html>'
diff --git a/lib/lxml/html/tests/transform_feedparser_data.py b/lib/lxml/html/tests/transform_feedparser_data.py
new file mode 100644
index 00000000..d340912b
--- /dev/null
+++ b/lib/lxml/html/tests/transform_feedparser_data.py
@@ -0,0 +1,110 @@
+"""
+This takes the feedparser tests from here:
+
+  http://feedparser.org/tests/wellformed/sanitize/
+
+and rewrites them to be easier to handle (not using the internal model
+of feedparser).  The input format is::
+
+  <!--
+  Description: {description}
+  Expect: {expression}
+  -->
+  ...
+  <content ...>{content}</content>
+  ...
+
+The Expect expression is checked for
+``entries[0]['content'][0]['value'] == {data}``.
+
+The output format is::
+
+  Description: {description}
+  Expect: {expression} (if data couldn't be parsed)
+  Options: 
+
+  {content, unescaped}
+  ----------
+  {data, unescaped, if found}
+
+"""
+
+import re
+import os
+import traceback
+
+_desc_re = re.compile(r'\s*Description:\s*(.*)')
+_expect_re = re.compile(r'\s*Expect:\s*(.*)')
+_data_expect_re = re.compile(r"entries\[0\]\['[^']+'\](?:\[0\]\['value'\])?\s*==\s*(.*)")
+_feed_data_expect_re = re.compile(r"feed\['[^']+'\]\s*==\s*(.*)")
+
+def parse_content(content):  # -> dict with keys 'Description', 'Expect', 'data', 'content'
+    match = _desc_re.search(content)
+    desc = match.group(1)  # AttributeError here if there is no Description line (match is None)
+    match = _expect_re.search(content)
+    expect = match.group(1)  # AttributeError here if there is no Expect line (match is None)
+    data = None
+    for regex in [_data_expect_re, _feed_data_expect_re]:
+        match = regex.search(expect)
+        if match:
+            # SECURITY: eval() of text taken from the input file -- run on trusted test data only
+            data = eval(match.group(1).strip())
+            break
+    c = None  # becomes the body of the first tag below that matches
+    for tag in ['content', 'summary', 'title', 'copyright', 'tagline', 'info', 'subtitle', 'fullitem', 'body', 'description', 'content:encoded']:
+        regex = re.compile(r"<%s.*?>(.*)</%s>" % (tag, tag), re.S)
+        match = regex.search(content)
+        if match:
+            c = match.group(1)
+            break
+    assert c is not None  # fails when none of the tags above is present
+    # Seems like body isn't quoted
+    if tag != 'body':  # 'tag' is still the loop variable: the tag that matched
+        c = c.replace('&lt;', '<')
+        c = c.replace('&amp;', '&')
+    # FIXME: I should really do more unescaping...
+    return {
+        'Description': desc,
+        'Expect': expect,
+        'data': data,
+        'content': c}
+
+def serialize_content(d):
+    s = '''\
+Description: %(Description)s
+Expect: %(Expect)s
+Options: 
+
+%(content)s
+''' % d
+    if d.get('data') is not None:
+        s += '----------\n%s' % d['data']
+    return s
+
+def translate_file(filename):
+    f = open(filename, 'rb')
+    c = f.read()
+    f.close()
+    try:
+        output = serialize_content(parse_content(c))
+    except:
+        print('Bad data in %s:' % filename)
+        print(c)
+        traceback.print_exc()
+        print('-'*60)
+        return
+    new = os.path.splitext(filename)[0] + '.data'
+    f = open(new, 'wb')
+    f.write(output)
+    f.close()
+
+def translate_all(dir):
+    for fn in os.listdir(dir):
+        fn = os.path.join(dir, fn)
+        if fn.endswith('.xml'):
+            translate_file(fn)
+        
+if __name__ == '__main__':
+    import sys
+    translate_all(os.path.join(os.path.dirname(__file__), 'feedparser-data'))
+
diff --git a/lib/lxml/html/usedoctest.py b/lib/lxml/html/usedoctest.py
new file mode 100644
index 00000000..f352a1cc
--- /dev/null
+++ b/lib/lxml/html/usedoctest.py
@@ -0,0 +1,13 @@
+"""Doctest module for HTML comparison.
+
+Usage::
+
+   >>> import lxml.html.usedoctest
+   >>> # now do your HTML doctests ...
+
+See `lxml.doctestcompare`.
+"""
+
+from lxml import doctestcompare
+
+doctestcompare.temp_install(html=True, del_module=__name__)
diff --git a/lib/lxml/includes/__init__.py b/lib/lxml/includes/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/lib/lxml/includes/c14n.pxd b/lib/lxml/includes/c14n.pxd
new file mode 100644
index 00000000..d075e90e
--- /dev/null
+++ b/lib/lxml/includes/c14n.pxd
@@ -0,0 +1,26 @@
+from lxml.includes.tree cimport xmlDoc, xmlOutputBuffer, xmlChar
+from lxml.includes.xpath cimport xmlNodeSet
+
+cdef extern from "libxml/c14n.h":
+    cdef int xmlC14NDocDumpMemory(xmlDoc* doc,
+                                  xmlNodeSet* nodes,
+                                  int exclusive,
+                                  xmlChar** inclusive_ns_prefixes,
+                                  int with_comments,
+                                  xmlChar** doc_txt_ptr) nogil
+
+    cdef int xmlC14NDocSave(xmlDoc* doc,
+                            xmlNodeSet* nodes,
+                            int exclusive,
+                            xmlChar** inclusive_ns_prefixes,
+                            int with_comments,
+                            char* filename,
+                            int compression) nogil
+
+    cdef int xmlC14NDocSaveTo(xmlDoc* doc,
+                              xmlNodeSet* nodes,
+                              int exclusive,
+                              xmlChar** inclusive_ns_prefixes,
+                              int with_comments,
+                              xmlOutputBuffer* buffer) nogil
+
diff --git a/lib/lxml/includes/config.pxd b/lib/lxml/includes/config.pxd
new file mode 100644
index 00000000..9c04438f
--- /dev/null
+++ b/lib/lxml/includes/config.pxd
@@ -0,0 +1,3 @@
+cdef extern from "etree_defs.h":
+    cdef bint ENABLE_THREADING
+    cdef bint ENABLE_SCHEMATRON
diff --git a/lib/lxml/includes/dtdvalid.pxd b/lib/lxml/includes/dtdvalid.pxd
new file mode 100644
index 00000000..ae94dc63
--- /dev/null
+++ b/lib/lxml/includes/dtdvalid.pxd
@@ -0,0 +1,18 @@
+from lxml.includes cimport tree
+from lxml.includes.tree cimport xmlDoc, xmlDtd
+
+cdef extern from "libxml/valid.h" nogil:
+    ctypedef void (*xmlValidityErrorFunc)(void * ctx, const char * msg, ...)
+    ctypedef void (*xmlValidityWarningFunc)(void * ctx, const char * msg, ...)
+
+    ctypedef struct xmlValidCtxt:
+        void *userData
+        xmlValidityErrorFunc error
+        xmlValidityWarningFunc warning
+
+    cdef xmlValidCtxt* xmlNewValidCtxt()
+    cdef void xmlFreeValidCtxt(xmlValidCtxt* cur)
+
+    cdef int xmlValidateDtd(xmlValidCtxt* ctxt, xmlDoc* doc, xmlDtd* dtd)
+    cdef tree.xmlElement* xmlGetDtdElementDesc(
+        xmlDtd* dtd, tree.const_xmlChar* name)
diff --git a/lib/lxml/includes/etree_defs.h b/lib/lxml/includes/etree_defs.h
new file mode 100644
index 00000000..8faac466
--- /dev/null
+++ b/lib/lxml/includes/etree_defs.h
@@ -0,0 +1,328 @@
+#ifndef HAS_ETREE_DEFS_H
+#define HAS_ETREE_DEFS_H
+
+/* quick check for Python/libxml2/libxslt devel setup: stop the build early with a readable #error */
+#include "Python.h"
+#ifndef PY_VERSION_HEX
+#  error the development package of Python (header files etc.) is not installed correctly
+#else /* Python.h was found: check its version */
+#  if PY_VERSION_HEX < 0x02060000 || PY_MAJOR_VERSION >= 3 && PY_VERSION_HEX < 0x03020000
+#  error this version of lxml requires Python 2.6, 2.7, 3.2 or later
+#  endif /* i.e. Py < 2.6, or Py3 < 3.2 (&& binds tighter than ||) */
+#endif /* PY_VERSION_HEX */
+
+#include "libxml/xmlversion.h"
+#ifndef LIBXML_VERSION
+#  error the development package of libxml2 (header files etc.) is not installed correctly
+#else /* libxml2 headers were found: check the version */
+#if LIBXML_VERSION < 20700
+#  error minimum required version of libxml2 is 2.7.0
+#endif
+#endif /* LIBXML_VERSION */
+
+#include "libxslt/xsltconfig.h"
+#ifndef LIBXSLT_VERSION
+#  error the development package of libxslt (header files etc.) is not installed correctly
+#else /* libxslt headers were found: check the version */
+#if LIBXSLT_VERSION < 10123
+#  error minimum required version of libxslt is 1.1.23
+#endif
+#endif /* LIBXSLT_VERSION */
+
+
+/* va_arg helpers: fetch the next variadic argument as a fixed C type */
+#define va_int(ap)     va_arg(ap, int)
+#define va_charptr(ap) va_arg(ap, char *)
+
+#ifdef PYPY_VERSION /* IS_PYPY is 1 iff PYPY_VERSION is defined */
+#    define IS_PYPY 1
+#else
+#    define IS_PYPY 0
+#endif
+
+#if PY_MAJOR_VERSION >= 3 /* IS_PYTHON3 is 1 iff PY_MAJOR_VERSION >= 3 */
+#  define IS_PYTHON3 1
+#else
+#  define IS_PYTHON3 0
+#endif
+
+#if IS_PYTHON3 /* Py3: LXML_UNICODE_STRINGS is forced to 1, overriding any earlier definition */
+#undef LXML_UNICODE_STRINGS
+#define LXML_UNICODE_STRINGS 1
+#else /* Py2: keep an externally supplied value, default to 0 otherwise */
+#ifndef LXML_UNICODE_STRINGS
+#define LXML_UNICODE_STRINGS 0
+#endif
+#endif
+
+#if !IS_PYPY /* non-PyPy builds: PyWeakref_LockObject() is stubbed to a constant NULL */
+#  define PyWeakref_LockObject(obj)          (NULL)
+#endif
+
+/* Threading is not currently supported by PyPy: force WITHOUT_THREADING there */
+#if IS_PYPY
+#  ifndef WITHOUT_THREADING
+#    define WITHOUT_THREADING
+#  endif
+#endif
+
+/* Python 3 doesn't have PyFile_*() anymore: PyFile_AsFile() is stubbed to NULL there */
+#if PY_MAJOR_VERSION >= 3
+#  define PyFile_AsFile(o)                   (NULL)
+#else
+#if IS_PYPY /* Py2 on PyPy: replace these three APIs with constant stubs */
+#  undef PyFile_AsFile
+#  define PyFile_AsFile(o)                   (NULL)
+#  undef PyUnicode_FromFormat
+#  define PyUnicode_FromFormat(s, a, b)      (NULL)
+#  undef PyByteArray_Check
+#  define PyByteArray_Check(o)               (0)
+#endif
+#endif
+
+#if PY_VERSION_HEX <= 0x03030000 && !(defined(CYTHON_PEP393_ENABLED) && CYTHON_PEP393_ENABLED)
+  #define PyUnicode_IS_READY(op)    (0)  /* constant 0 in this fallback */
+  #define PyUnicode_GET_LENGTH(u)   PyUnicode_GET_SIZE(u)
+  #define PyUnicode_KIND(u)         (sizeof(Py_UNICODE))  /* kind == size of Py_UNICODE in bytes */
+  #define PyUnicode_DATA(u)         ((void*)PyUnicode_AS_UNICODE(u))
+#endif /* fallbacks that map the PEP 393 style accessor names onto the Py_UNICODE based API */
+
+/* PySlice_GetIndicesEx() has wrong signature in Py<=3.1 */
+#if PY_VERSION_HEX >= 0x03020000
+#  define _lx_PySlice_GetIndicesEx(o, l, b, e, s, sl) PySlice_GetIndicesEx(o, l, b, e, s, sl)
+#else /* older signature: the slice argument has to be cast to PySliceObject* */
+#  define _lx_PySlice_GetIndicesEx(o, l, b, e, s, sl) PySlice_GetIndicesEx(((PySliceObject*)o), l, b, e, s, sl)
+#endif
+
+#ifdef WITHOUT_THREADING /* threading disabled: the GIL / thread state calls become constants or expand to nothing */
+#  define PyEval_SaveThread() (NULL)
+#  define PyEval_RestoreThread(state)
+#  define PyGILState_Ensure() (PyGILState_UNLOCKED)
+#  define PyGILState_Release(state)
+#  undef  Py_UNBLOCK_THREADS
+#  define Py_UNBLOCK_THREADS
+#  undef  Py_BLOCK_THREADS
+#  define Py_BLOCK_THREADS
+#endif
+
+#ifdef WITHOUT_THREADING /* ENABLE_THREADING: 0/1 flag, the inverse of WITHOUT_THREADING */
+#  define ENABLE_THREADING 0
+#else
+#  define ENABLE_THREADING 1
+#endif
+
+#if LIBXML_VERSION < 20704 /* same version encoding as the 20700 == 2.7.0 check above */
+/* FIXME: hack to make new error reporting compile in old libxml2 versions */
+#  define xmlStructuredErrorContext NULL
+#  define xmlXIncludeProcessTreeFlagsData(n,o,d) xmlXIncludeProcessTreeFlags(n,o) /* drops the data argument 'd' */
+#endif
+
+/* schematron was added in libxml2 2.6.21 */
+#ifdef LIBXML_SCHEMATRON_ENABLED
+#  define ENABLE_SCHEMATRON 1
+#else /* not enabled: provide dummy constants, void typedefs and stub macros so that callers still compile */
+#  define ENABLE_SCHEMATRON 0
+#  define XML_SCHEMATRON_OUT_QUIET 0
+#  define XML_SCHEMATRON_OUT_XML 0
+#  define XML_SCHEMATRON_OUT_ERROR 0
+   typedef void xmlSchematron;
+   typedef void xmlSchematronParserCtxt;
+   typedef void xmlSchematronValidCtxt;
+#  define xmlSchematronNewDocParserCtxt(doc) NULL
+#  define xmlSchematronNewParserCtxt(file) NULL
+#  define xmlSchematronParse(ctxt) NULL
+#  define xmlSchematronFreeParserCtxt(ctxt)
+#  define xmlSchematronFree(schema)
+#  define xmlSchematronNewValidCtxt(schema, options) NULL
+#  define xmlSchematronValidateDoc(ctxt, doc) 0
+#  define xmlSchematronFreeValidCtxt(ctxt)
+#  define xmlSchematronSetValidStructuredErrors(ctxt, errorfunc, data)
+#endif /* LIBXML_SCHEMATRON_ENABLED */
+
+#if LIBXML_VERSION < 20900 /* define the option value here for these versions (4194304 == 1 << 22) */
+#  define XML_PARSE_BIG_LINES 4194304
+#endif
+
+#include "libxml/tree.h"
+#ifndef LIBXML2_NEW_BUFFER /* no xmlBuf API available: alias it to the xmlBuffer type and accessors */
+   typedef xmlBuffer xmlBuf;
+#  define xmlBufContent(buf) xmlBufferContent(buf)
+#  define xmlBufUse(buf) xmlBufferLength(buf)
+#endif
+
+/* libexslt 1.1.25+ support EXSLT functions in XPath */
+#if LIBXSLT_VERSION < 10125 /* older versions: the four register calls expand to nothing */
+#define exsltDateXpathCtxtRegister(ctxt, prefix)
+#define exsltSetsXpathCtxtRegister(ctxt, prefix)
+#define exsltMathXpathCtxtRegister(ctxt, prefix)
+#define exsltStrXpathCtxtRegister(ctxt, prefix)
+#endif
+
+/* work around MSDEV 6.0: supply _ftol2() by forwarding to the _ftol() of the VC6 C library */
+#if (_MSC_VER == 1200) && (WINVER < 0x0500)
+long _ftol( double ); //defined by VC6 C libs
+long _ftol2( double dblSource ) { return _ftol( dblSource ); }
+#endif
+
+#ifdef __GNUC__
+/* Test for GCC > 2.95: only then is __builtin_expect() used to mark (x) as expected to be 0 */
+#if __GNUC__ > 2 || (__GNUC__ == 2 && (__GNUC_MINOR__ > 95)) 
+#define unlikely_condition(x) __builtin_expect((x), 0)
+#else /* __GNUC__ > 2 ... */
+#define unlikely_condition(x) (x)
+#endif /* __GNUC__ > 2 ... */
+#else /* __GNUC__ : other compilers get the plain condition */
+#define unlikely_condition(x) (x)
+#endif /* __GNUC__ */
+
+#ifndef Py_TYPE /* fallback for Python headers that do not define Py_TYPE() */
+  #define Py_TYPE(ob)   (((PyObject*)(ob))->ob_type)
+#endif
+
+#define PY_NEW(T) \
+     (((PyTypeObject*)(T))->tp_new( \
+             (PyTypeObject*)(T), __pyx_empty_tuple, NULL))  /* calls T's tp_new slot directly with __pyx_empty_tuple and NULL kwargs */
+
+#define _fqtypename(o)  ((Py_TYPE(o))->tp_name)  /* tp_name string of o's type */
+
+#if PY_MAJOR_VERSION < 3 /* Py2: exact str/unicode checks first, then any basestring subtype */
+#define _isString(obj)   (PyString_CheckExact(obj)  || \
+                          PyUnicode_CheckExact(obj) || \
+                          PyType_IsSubtype(Py_TYPE(obj), &PyBaseString_Type))
+#else
+/* builtin subtype type checks are almost as fast as exact checks in Py2.7+
+ * and Unicode is more common in Py3 */
+#define _isString(obj)   (PyUnicode_Check(obj) || PyBytes_Check(obj))
+#endif
+
+#define _isElement(c_node) \
+        (((c_node)->type == XML_ELEMENT_NODE) || \
+         ((c_node)->type == XML_COMMENT_NODE) || \
+         ((c_node)->type == XML_ENTITY_REF_NODE) || \
+         ((c_node)->type == XML_PI_NODE))  /* element, comment, entity reference or PI; c_node is evaluated several times */
+
+#define _isElementOrXInclude(c_node) \
+        (_isElement(c_node)                     || \
+         ((c_node)->type == XML_XINCLUDE_START) || \
+         ((c_node)->type == XML_XINCLUDE_END))  /* as _isElement(), plus the XInclude start/end marker nodes */
+
+#define _getNs(c_node) \
+        (((c_node)->ns == 0) ? 0 : ((c_node)->ns->href))  /* href of the node's ns, or 0 if it has none */
+
+
+/* Macro pair implementation of a depth first tree walker
+ *
+ * Calls the code block between the BEGIN and END macros for all elements
+ * below c_tree_top (exclusively), starting at c_node (inclusively iff
+ * 'inclusive' is 1).  The _ELEMENT_ variants will only stop on nodes
+ * that match _isElement(); the normal variant will stop on every node
+ * (text nodes included), so filter inside the loop body if needed.
+ * 
+ * To traverse the node and all of its children and siblings in Pyrex, call
+ *    cdef xmlNode* some_node
+ *    BEGIN_FOR_EACH_ELEMENT_FROM(some_node.parent, some_node, 1)
+ *    # do something with some_node
+ *    END_FOR_EACH_ELEMENT_FROM(some_node)
+ *
+ * To traverse only the children and siblings of a node, call
+ *    cdef xmlNode* some_node
+ *    BEGIN_FOR_EACH_ELEMENT_FROM(some_node.parent, some_node, 0)
+ *    # do something with some_node
+ *    END_FOR_EACH_ELEMENT_FROM(some_node)
+ *
+ * To traverse only the children, do:
+ *    cdef xmlNode* some_node
+ *    some_node = parent_node.children
+ *    BEGIN_FOR_EACH_ELEMENT_FROM(parent_node, some_node, 1)
+ *    # do something with some_node
+ *    END_FOR_EACH_ELEMENT_FROM(some_node)
+ *
+ * NOTE: 'some_node' MUST be a plain 'xmlNode*' !
+ *
+ * NOTE: parent modification during the walk can divert the iterator, but
+ *       should not segfault !
+ */
+
+#define _LX__ELEMENT_MATCH(c_node, only_elements)  \
+    ((only_elements) ? (_isElement(c_node)) : 1)  /* every node matches when only_elements is 0 */
+
+#define _LX__ADVANCE_TO_NEXT(c_node, only_elements)                        \
+    while ((c_node != 0) && (!_LX__ELEMENT_MATCH(c_node, only_elements)))  \
+        c_node = c_node->next;  /* follows ->next to the first match; c_node ends up 0 if there is none */
+
+#define _LX__TRAVERSE_TO_NEXT(c_stop_node, c_node, only_elements)   \
+{                                                                   \
+    /* depth first: try the first matching child */                 \
+    xmlNode* _lx__next = c_node->children;		            \
+    if (_lx__next != 0) {                                           \
+        if (c_node->type == XML_ENTITY_REF_NODE || c_node->type == XML_DTD_NODE) { \
+            _lx__next = 0; /* never descend into these */           \
+        } else {                                                    \
+            _LX__ADVANCE_TO_NEXT(_lx__next, only_elements)	    \
+        }                                                           \
+    }							            \
+    if ((_lx__next == 0) && (c_node != c_stop_node)) {              \
+        /* try siblings */                                          \
+        _lx__next = c_node->next;                                   \
+        _LX__ADVANCE_TO_NEXT(_lx__next, only_elements)              \
+        /* back off through parents */                              \
+        while (_lx__next == 0) {                                    \
+            c_node = c_node->parent;                                \
+            if (c_node == 0)                                        \
+                break;                                              \
+            if (c_node == c_stop_node)                              \
+                break;                                              \
+            if ((only_elements) && !_isElement(c_node))	            \
+                break;                                              \
+            /* we already traversed the parents -> siblings */      \
+            _lx__next = c_node->next;                               \
+            _LX__ADVANCE_TO_NEXT(_lx__next, only_elements)	    \
+        }                                                           \
+    }                                                               \
+    c_node = _lx__next; /* 0 ends the enclosing while loop */       \
+}
+
+#define _LX__BEGIN_FOR_EACH_FROM(c_tree_top, c_node, inclusive, only_elements)     \
+{									      \
+    if (c_node != 0) {							      \
+        const xmlNode* _lx__tree_top = (c_tree_top);                          \
+        const int _lx__only_elements = (only_elements);                       \
+        /* make sure we start at an element */                   	      \
+        if (!_LX__ELEMENT_MATCH(c_node, _lx__only_elements)) {		      \
+            /* we skip the node, so 'inclusive' is irrelevant */              \
+            if (c_node == _lx__tree_top)                                      \
+                c_node = 0; /* nothing to traverse */                         \
+            else {                                                            \
+                c_node = c_node->next;                                        \
+                _LX__ADVANCE_TO_NEXT(c_node, _lx__only_elements)              \
+            }                                                                 \
+        } else if (! (inclusive)) {                                           \
+            /* skip the first node */                                         \
+            _LX__TRAVERSE_TO_NEXT(_lx__tree_top, c_node, _lx__only_elements)  \
+        }                                                                     \
+                                                                              \
+        /* now run the user code on the elements we find */                   \
+        while (c_node != 0) {                                                 \
+            /* user code goes here; the END macro closes the three braces left open above */
+
+#define _LX__END_FOR_EACH_FROM(c_node)                                        \
+            _LX__TRAVERSE_TO_NEXT(_lx__tree_top, c_node, _lx__only_elements)  \
+        }                                                                     \
+    }                                                                         \
+}
+
+
+#define BEGIN_FOR_EACH_ELEMENT_FROM(c_tree_top, c_node, inclusive)   \
+    _LX__BEGIN_FOR_EACH_FROM(c_tree_top, c_node, inclusive, 1)  /* only_elements = 1: stop on _isElement() nodes only */
+
+#define END_FOR_EACH_ELEMENT_FROM(c_node)   \
+    _LX__END_FOR_EACH_FROM(c_node)  /* must follow a matching BEGIN_FOR_EACH_ELEMENT_FROM */
+
+#define BEGIN_FOR_EACH_FROM(c_tree_top, c_node, inclusive)   \
+    _LX__BEGIN_FOR_EACH_FROM(c_tree_top, c_node, inclusive, 0)  /* only_elements = 0: no node type filtering */
+
+#define END_FOR_EACH_FROM(c_node)   \
+    _LX__END_FOR_EACH_FROM(c_node)  /* must follow a matching BEGIN_FOR_EACH_FROM */
+
+
+#endif /* HAS_ETREE_DEFS_H */
diff --git a/lib/lxml/includes/etreepublic.pxd b/lib/lxml/includes/etreepublic.pxd
new file mode 100644
index 00000000..02f74ec0
--- /dev/null
+++ b/lib/lxml/includes/etreepublic.pxd
@@ -0,0 +1,234 @@
+# public Cython/C interface to lxml.etree
+
+from lxml.includes cimport tree
+from lxml.includes.tree cimport const_xmlChar
+
+cdef extern from "lxml-version.h":
+    cdef char* LXML_VERSION_STRING  # C string taken from lxml-version.h
+
+cdef extern from "etree_defs.h":  # these names are C macros in etree_defs.h, declared here with function-like signatures
+    # test if c_node is considered an Element (i.e. Element, Comment, Entity reference or PI)
+    cdef bint _isElement(tree.xmlNode* c_node) nogil
+
+    # return the namespace URI of the node or NULL
+    cdef const_xmlChar* _getNs(tree.xmlNode* node) nogil
+
+    # pair of macros for tree traversal: the loop body goes between the two calls
+    cdef void BEGIN_FOR_EACH_ELEMENT_FROM(tree.xmlNode* tree_top,
+                                          tree.xmlNode* start_node,  # advanced in place by the macros
+                                          int start_node_inclusive) nogil
+    cdef void END_FOR_EACH_ELEMENT_FROM(tree.xmlNode* start_node) nogil
+
+cdef extern from "lxml.etree_api.h":
+
+    # first function to call!
+    cdef int import_lxml__etree() except -1  # -1 signals a raised Python exception
+
+    ##########################################################################
+    # public ElementTree API classes
+
+    cdef class lxml.etree._Document [ object LxmlDocument ]:  # [ object X ] names the C struct of the type
+        cdef tree.xmlDoc* _c_doc
+
+    cdef class lxml.etree._Element [ object LxmlElement ]:
+        cdef _Document _doc
+        cdef tree.xmlNode* _c_node
+
+    cdef class lxml.etree.ElementBase(_Element) [ object LxmlElementBase ]:
+        pass  # no additional C-level fields are declared here
+
+    cdef class lxml.etree._ElementTree [ object LxmlElementTree ]:
+        cdef _Document _doc
+        cdef _Element  _context_node
+
+    cdef class lxml.etree.ElementClassLookup [ object LxmlElementClassLookup ]:
+        cdef object (*_lookup_function)(object, _Document, tree.xmlNode*)  # C function pointer
+
+    cdef class lxml.etree.FallbackElementClassLookup(ElementClassLookup) \
+             [ object LxmlFallbackElementClassLookup ]:
+        cdef ElementClassLookup fallback
+        cdef object (*_fallback_function)(object, _Document, tree.xmlNode*)  # same signature as _lookup_function
+
+    ##########################################################################
+    # creating Element objects
+
+    # create an Element for a C-node in the Document
+    cdef _Element elementFactory(_Document doc, tree.xmlNode* c_node)
+
+    # create an ElementTree for an Element
+    cdef _ElementTree elementTreeFactory(_Element context_node)
+
+    # create an ElementTree subclass for an Element
+    cdef _ElementTree newElementTree(_Element context_node, object subclass)
+
+    # create a new Element for an existing or new document (doc = None)
+    # builds Python object after setting text, tail, namespaces and attributes
+    cdef _Element makeElement(tag, _Document doc, parser,
+                              text, tail, attrib, nsmap)  # untyped arguments are plain Python objects
+
+    # create a new SubElement for an existing parent
+    # builds Python object after setting text, tail, namespaces and attributes
+    cdef _Element makeSubElement(_Element parent, tag, text, tail,
+                                 attrib, nsmap)  # untyped arguments are plain Python objects
+
+    # deep copy a node to include it in the Document
+    cdef _Element deepcopyNodeToDocument(_Document doc, tree.xmlNode* c_root)
+
+    # set the internal lookup function for Element/Comment/PI classes
+    # use setElementClassLookupFunction(NULL, None) to reset it
+    # note that the lookup function *must always* return an _Element subclass!
+    cdef void setElementClassLookupFunction(
+         object (*function)(object, _Document, tree.xmlNode*), object state)
+
+    # lookup function that always returns the default Element class
+    # note that the first argument is expected to be None!
+    cdef object lookupDefaultElementClass(_1, _Document _2,
+                                          tree.xmlNode* c_node)
+
+    # lookup function for namespace/tag specific Element classes
+    # note that the first argument is expected to be None!
+    cdef object lookupNamespaceElementClass(_1, _Document _2,
+                                            tree.xmlNode* c_node)
+
+    # call the fallback lookup function of a FallbackElementClassLookup
+    cdef object callLookupFallback(FallbackElementClassLookup lookup,
+                                   _Document doc, tree.xmlNode* c_node)
+
+    ##########################################################################
+    # XML attribute access
+
+    # return an attribute value for a C attribute on a C element node
+    cdef object attributeValue(tree.xmlNode* c_element,
+                               tree.xmlAttr* c_attrib_node)
+
+    # return the value of the attribute with 'ns' and 'name' (or None)
+    cdef object attributeValueFromNsName(tree.xmlNode* c_element,
+                                         const_xmlChar* c_ns, const_xmlChar* c_name)
+
+    # return the value of attribute "{ns}name", or the default value
+    cdef object getAttributeValue(_Element element, key, default)
+
+    # return an iterator over attribute names (1), values (2) or items (3)
+    # attributes must not be removed during iteration!
+    cdef object iterattributes(_Element element, int keysvalues)  # keysvalues selects 1, 2 or 3 as listed above
+
+    # return the list of all attribute names (1), values (2) or items (3)
+    cdef list collectAttributes(tree.xmlNode* c_element, int keysvalues)  # keysvalues selects 1, 2 or 3 as listed above
+
+    # set an attribute value on an element
+    # on failure, sets an exception and returns -1
+    cdef int setAttributeValue(_Element element, key, value) except -1
+
+    # delete an attribute
+    # on failure, sets an exception and returns -1
+    cdef int delAttribute(_Element element, key) except -1
+
+    # delete an attribute based on name and namespace URI
+    # returns -1 if the attribute was not found (no exception)
+    cdef int delAttributeFromNsName(tree.xmlNode* c_element,
+                                    const_xmlChar* c_href, const_xmlChar* c_name)  # no 'except' clause: -1 is a plain return value
+
+    ##########################################################################
+    # XML node helper functions (all declared nogil: callable without the GIL)
+
+    # check if the element has at least one child
+    cdef bint hasChild(tree.xmlNode* c_node) nogil
+
+    # find child element number 'index' (supports negative indexes)
+    cdef tree.xmlNode* findChild(tree.xmlNode* c_node,
+                                 Py_ssize_t index) nogil
+
+    # find child element number 'index' starting at first one
+    cdef tree.xmlNode* findChildForwards(tree.xmlNode* c_node,
+                                         Py_ssize_t index) nogil
+
+    # find child element number 'index' starting at last one
+    cdef tree.xmlNode* findChildBackwards(tree.xmlNode* c_node,
+                                          Py_ssize_t index) nogil
+
+    # return next/previous sibling element of the node
+    cdef tree.xmlNode* nextElement(tree.xmlNode* c_node) nogil
+    cdef tree.xmlNode* previousElement(tree.xmlNode* c_node) nogil
+
+    ##########################################################################
+    # iterators (DEPRECATED API, don't use in new code!)
+
+    cdef class lxml.etree._ElementTagMatcher [ object LxmlElementTagMatcher ]:
+        cdef char* _href  # set up by initTagMatch() below, or 'by hand'
+        cdef char* _name  # set up by initTagMatch() below, or 'by hand'
+
+    # store "{ns}tag" (or None) filter for this matcher or element iterator
+    # ** unless _href *and* _name are set up 'by hand', this function *must*
+    # ** be called when subclassing the iterator below!
+    cdef void initTagMatch(_ElementTagMatcher matcher, tag)
+
+    cdef class lxml.etree._ElementIterator(_ElementTagMatcher) [
+        object LxmlElementIterator ]:
+        cdef _Element _node
+        cdef tree.xmlNode* (*_next_element)(tree.xmlNode*)  # C function pointer; presumably the step function - confirm
+
+    # store the initial node of the iterator if it matches the required tag
+    # or its next matching sibling if not
+    cdef void iteratorStoreNext(_ElementIterator iterator, _Element node)
+
+    ##########################################################################
+    # other helper functions
+
+    # check if a C node matches a tag name and namespace
+    # (NULL allowed for each => always matches)
+    cdef int tagMatches(tree.xmlNode* c_node, const_xmlChar* c_href, const_xmlChar* c_name)
+
+    # convert a UTF-8 char* to a Python string or unicode string
+    cdef object pyunicode(const_xmlChar* s)
+
+    # convert the string to UTF-8 using the normal lxml.etree semantics
+    cdef bytes utf8(object s)
+
+    # split a tag into a (URI, name) tuple, return None as URI for '{}tag'
+    cdef tuple getNsTag(object tag)
+
+    # split a tag into a (URI, name) tuple, return b'' as URI for '{}tag'
+    cdef tuple getNsTagWithEmptyNs(object tag)
+
+    # get the "{ns}tag" string for a C node
+    cdef object namespacedName(tree.xmlNode* c_node)
+
+    # get the "{ns}tag" string for a href/tagname pair (c_ns may be NULL)
+    cdef object namespacedNameFromNsName(const_xmlChar* c_ns, const_xmlChar* c_tag)
+
+    # check if the node has a text value (which may be '')
+    cdef bint hasText(tree.xmlNode* c_node) nogil
+
+    # check if the node has a tail value (which may be '')
+    cdef bint hasTail(tree.xmlNode* c_node) nogil
+
+    # get the text content of an element (or None)
+    cdef object textOf(tree.xmlNode* c_node)
+
+    # get the tail content of an element (or None)
+    cdef object tailOf(tree.xmlNode* c_node)
+
+    # set the text value of an element
+    cdef int setNodeText(tree.xmlNode* c_node, text) except -1  # -1 signals a raised exception
+
+    # set the tail text value of an element
+    cdef int setTailText(tree.xmlNode* c_node, text) except -1  # -1 signals a raised exception
+
+    # append an element to the children of a parent element
+    # deprecated: don't use, does not propagate exceptions!
+    # use appendChildToElement() instead
+    cdef void appendChild(_Element parent, _Element child)
+
+    # added in lxml 3.3 as a safe replacement for appendChild()
+    # return -1 for exception, 0 for ok
+    cdef int appendChildToElement(_Element parent, _Element child) except -1
+
+    # recursively lookup a namespace in element or ancestors, or create it
+    cdef tree.xmlNs* findOrBuildNodeNsPrefix(
+        _Document doc, tree.xmlNode* c_node, const_xmlChar* href, const_xmlChar* prefix)
+
+    # find the Document of an Element, ElementTree or Document (itself!)
+    cdef _Document documentOrRaise(object input)
+
+    # find the root Element of an Element (itself!), ElementTree or Document
+    cdef _Element rootNodeOrRaise(object input)
diff --git a/lib/lxml/includes/htmlparser.pxd b/lib/lxml/includes/htmlparser.pxd
new file mode 100644
index 00000000..145a69a0
--- /dev/null
+++ b/lib/lxml/includes/htmlparser.pxd
@@ -0,0 +1,56 @@
+from libc.string cimport const_char
+
+from lxml.includes.tree cimport xmlDoc
+from lxml.includes.tree cimport xmlInputReadCallback, xmlInputCloseCallback
+from lxml.includes.xmlparser cimport xmlParserCtxt, xmlSAXHandler, xmlSAXHandlerV1
+
+cdef extern from "libxml/HTMLparser.h":  # no block-level nogil: each function below carries its own
+    ctypedef enum htmlParserOption:
+        HTML_PARSE_NOERROR    # suppress error reports
+        HTML_PARSE_NOWARNING  # suppress warning reports
+        HTML_PARSE_PEDANTIC   # pedantic error reporting
+        HTML_PARSE_NOBLANKS   # remove blank nodes
+        HTML_PARSE_NONET      # Forbid network access
+        # libxml2 2.6.21+ only:
+        HTML_PARSE_RECOVER    # Relaxed parsing
+        HTML_PARSE_COMPACT    # compact small text nodes
+        # libxml2 2.7.7+ only:
+        HTML_PARSE_NOIMPLIED  # Do not add implied html/body... elements
+        # libxml2 2.7.8+ only:
+        HTML_PARSE_NODEFDTD   # do not default a doctype if not found
+        # libxml2 2.8.0+ only:
+        XML_PARSE_IGNORE_ENC  # ignore internal document encoding hint; NOTE(review): XML_ prefix, unlike the HTML_ siblings - confirm intended
+
+    xmlSAXHandlerV1 htmlDefaultSAXHandler
+
+    cdef xmlParserCtxt* htmlCreateMemoryParserCtxt(
+        char* buffer, int size) nogil
+    cdef xmlParserCtxt* htmlCreateFileParserCtxt(
+        char* filename, char* encoding) nogil
+    cdef xmlParserCtxt* htmlCreatePushParserCtxt(xmlSAXHandler* sax,
+                                                 void* user_data,
+                                                 char* chunk, int size,
+                                                 char* filename, int enc) nogil
+    cdef void htmlFreeParserCtxt(xmlParserCtxt* ctxt) nogil
+    cdef void htmlCtxtReset(xmlParserCtxt* ctxt) nogil
+    cdef int htmlCtxtUseOptions(xmlParserCtxt* ctxt, int options) nogil
+    cdef int htmlParseDocument(xmlParserCtxt* ctxt) nogil
+    cdef int htmlParseChunk(xmlParserCtxt* ctxt, 
+                            char* chunk, int size, int terminate) nogil
+
+    cdef xmlDoc* htmlCtxtReadFile(xmlParserCtxt* ctxt,
+                                  char* filename, const_char* encoding,
+                                  int options) nogil  # htmlCtxtRead* variants differ in their input source
+    cdef xmlDoc* htmlCtxtReadDoc(xmlParserCtxt* ctxt,
+                                 char* buffer, char* URL, const_char* encoding,
+                                 int options) nogil
+    cdef xmlDoc* htmlCtxtReadIO(xmlParserCtxt* ctxt, 
+                                xmlInputReadCallback ioread, 
+                                xmlInputCloseCallback ioclose, 
+                                void* ioctx,
+                                char* URL, const_char* encoding,
+                                int options) nogil
+    cdef xmlDoc* htmlCtxtReadMemory(xmlParserCtxt* ctxt,
+                                    char* buffer, int size,
+                                    char* filename, const_char* encoding,
+                                    int options) nogil
diff --git a/lib/lxml/includes/relaxng.pxd b/lib/lxml/includes/relaxng.pxd
new file mode 100644
index 00000000..28e9212d
--- /dev/null
+++ b/lib/lxml/includes/relaxng.pxd
@@ -0,0 +1,64 @@
+from lxml.includes.tree cimport xmlDoc
+from lxml.includes.xmlerror cimport xmlStructuredErrorFunc
+
+cdef extern from "libxml/relaxng.h":
+    ctypedef struct xmlRelaxNG  # opaque here: no fields are declared
+    ctypedef struct xmlRelaxNGParserCtxt  # opaque here: no fields are declared
+    
+    ctypedef struct xmlRelaxNGValidCtxt  # opaque here: no fields are declared
+    
+    ctypedef enum xmlRelaxNGValidErr:  # values are listed explicitly, 0 through 39
+        XML_RELAXNG_OK = 0
+        XML_RELAXNG_ERR_MEMORY = 1
+        XML_RELAXNG_ERR_TYPE = 2
+        XML_RELAXNG_ERR_TYPEVAL = 3
+        XML_RELAXNG_ERR_DUPID = 4
+        XML_RELAXNG_ERR_TYPECMP = 5
+        XML_RELAXNG_ERR_NOSTATE = 6
+        XML_RELAXNG_ERR_NODEFINE = 7
+        XML_RELAXNG_ERR_LISTEXTRA = 8
+        XML_RELAXNG_ERR_LISTEMPTY = 9
+        XML_RELAXNG_ERR_INTERNODATA = 10
+        XML_RELAXNG_ERR_INTERSEQ = 11
+        XML_RELAXNG_ERR_INTEREXTRA = 12
+        XML_RELAXNG_ERR_ELEMNAME = 13
+        XML_RELAXNG_ERR_ATTRNAME = 14
+        XML_RELAXNG_ERR_ELEMNONS = 15
+        XML_RELAXNG_ERR_ATTRNONS = 16
+        XML_RELAXNG_ERR_ELEMWRONGNS = 17
+        XML_RELAXNG_ERR_ATTRWRONGNS = 18
+        XML_RELAXNG_ERR_ELEMEXTRANS = 19
+        XML_RELAXNG_ERR_ATTREXTRANS = 20
+        XML_RELAXNG_ERR_ELEMNOTEMPTY = 21
+        XML_RELAXNG_ERR_NOELEM = 22
+        XML_RELAXNG_ERR_NOTELEM = 23
+        XML_RELAXNG_ERR_ATTRVALID = 24
+        XML_RELAXNG_ERR_CONTENTVALID = 25
+        XML_RELAXNG_ERR_EXTRACONTENT = 26
+        XML_RELAXNG_ERR_INVALIDATTR = 27
+        XML_RELAXNG_ERR_DATAELEM = 28
+        XML_RELAXNG_ERR_VALELEM = 29
+        XML_RELAXNG_ERR_LISTELEM = 30
+        XML_RELAXNG_ERR_DATATYPE = 31
+        XML_RELAXNG_ERR_VALUE = 32
+        XML_RELAXNG_ERR_LIST = 33
+        XML_RELAXNG_ERR_NOGRAMMAR = 34
+        XML_RELAXNG_ERR_EXTRADATA = 35
+        XML_RELAXNG_ERR_LACKDATA = 36
+        XML_RELAXNG_ERR_INTERNAL = 37
+        XML_RELAXNG_ERR_ELEMWRONG = 38
+        XML_RELAXNG_ERR_TEXTWRONG = 39
+        
+    cdef xmlRelaxNGValidCtxt* xmlRelaxNGNewValidCtxt(xmlRelaxNG* schema) nogil
+    cdef int xmlRelaxNGValidateDoc(xmlRelaxNGValidCtxt* ctxt, xmlDoc* doc) nogil
+    cdef xmlRelaxNG* xmlRelaxNGParse(xmlRelaxNGParserCtxt* ctxt) nogil
+    cdef xmlRelaxNGParserCtxt* xmlRelaxNGNewParserCtxt(char* URL) nogil  # parser context from a URL string
+    cdef xmlRelaxNGParserCtxt* xmlRelaxNGNewDocParserCtxt(xmlDoc* doc) nogil  # parser context from an in-memory document
+    cdef void xmlRelaxNGFree(xmlRelaxNG* schema) nogil
+    cdef void xmlRelaxNGFreeParserCtxt(xmlRelaxNGParserCtxt* ctxt) nogil
+    cdef void xmlRelaxNGFreeValidCtxt(xmlRelaxNGValidCtxt* ctxt) nogil
+
+    cdef void xmlRelaxNGSetValidStructuredErrors(
+        xmlRelaxNGValidCtxt* ctxt, xmlStructuredErrorFunc serror, void *ctx) nogil
+    cdef void xmlRelaxNGSetParserStructuredErrors(
+        xmlRelaxNGParserCtxt* ctxt, xmlStructuredErrorFunc serror, void *ctx) nogil
diff --git a/lib/lxml/includes/schematron.pxd b/lib/lxml/includes/schematron.pxd
new file mode 100644
index 00000000..f8e32528
--- /dev/null
+++ b/lib/lxml/includes/schematron.pxd
@@ -0,0 +1,34 @@
+from lxml.includes cimport xmlerror
+from lxml.includes.tree cimport xmlDoc
+
+cdef extern from "libxml/schematron.h":  # etree_defs.h supplies stubs for these names when schematron is disabled
+    ctypedef struct xmlSchematron  # opaque here: no fields are declared
+    ctypedef struct xmlSchematronParserCtxt  # opaque here: no fields are declared
+    ctypedef struct xmlSchematronValidCtxt  # opaque here: no fields are declared
+
+    ctypedef enum xmlSchematronValidOptions:
+        XML_SCHEMATRON_OUT_QUIET     =    1 # quiet no report
+        XML_SCHEMATRON_OUT_TEXT      =    2 # build a textual report
+        XML_SCHEMATRON_OUT_XML       =    4 # output SVRL
+        XML_SCHEMATRON_OUT_ERROR     =    8 # output via xmlStructuredErrorFunc
+        XML_SCHEMATRON_OUT_FILE      =  256 # output to a file descriptor
+        XML_SCHEMATRON_OUT_BUFFER    =  512 # output to a buffer
+        XML_SCHEMATRON_OUT_IO        = 1024 # output to I/O mechanism
+
+    cdef xmlSchematronParserCtxt* xmlSchematronNewDocParserCtxt(
+        xmlDoc* doc) nogil
+    cdef xmlSchematronParserCtxt* xmlSchematronNewParserCtxt(
+        char* filename) nogil
+    cdef xmlSchematronValidCtxt* xmlSchematronNewValidCtxt(
+        xmlSchematron* schema, int options) nogil  # options: presumably OR-ed xmlSchematronValidOptions - confirm
+
+    cdef xmlSchematron* xmlSchematronParse(xmlSchematronParserCtxt* ctxt) nogil
+    cdef int xmlSchematronValidateDoc(xmlSchematronValidCtxt* ctxt,
+                                      xmlDoc* instance) nogil
+
+    cdef void xmlSchematronFreeParserCtxt(xmlSchematronParserCtxt* ctxt) nogil
+    cdef void xmlSchematronFreeValidCtxt(xmlSchematronValidCtxt* ctxt) nogil
+    cdef void xmlSchematronFree(xmlSchematron* schema) nogil
+    cdef void xmlSchematronSetValidStructuredErrors(
+        xmlSchematronValidCtxt* ctxt,
+        xmlerror.xmlStructuredErrorFunc error_func, void *data) nogil  # nogil added for consistency with every other function here
diff --git a/lib/lxml/includes/tree.pxd b/lib/lxml/includes/tree.pxd
new file mode 100644
index 00000000..64664c9f
--- /dev/null
+++ b/lib/lxml/includes/tree.pxd
@@ -0,0 +1,464 @@
+from libc cimport stdio
+from libc.string cimport const_char, const_uchar
+
+cdef extern from "lxml-version.h":  # exposes the version string from lxml's own header
+    # deprecated declaration, use etreepublic.pxd instead
+    cdef char* LXML_VERSION_STRING  # declared as a plain (non-const) C string
+
+cdef extern from "libxml/xmlversion.h":  # libxml2 version information in two forms
+    cdef const_char* xmlParserVersion  # version exposed as a C string
+    cdef int LIBXML_VERSION  # version exposed as an integer
+
+cdef extern from "libxml/xmlstring.h":  # xmlChar string type and the string helpers used with it
+    ctypedef unsigned char xmlChar  # declared as an unsigned byte type
+    ctypedef unsigned char const_xmlChar "const xmlChar"  # Cython-side alias; the quoted C name makes generated code say "const xmlChar"
+    cdef int xmlStrlen(const_xmlChar* str) nogil
+    cdef xmlChar* xmlStrdup(const_xmlChar* cur) nogil  # returns a non-const xmlChar*, unlike the search helpers below
+    cdef int xmlStrncmp(const_xmlChar* str1, const_xmlChar* str2, int length) nogil
+    cdef int xmlStrcmp(const_xmlChar* str1, const_xmlChar* str2) nogil
+    cdef const_xmlChar* xmlStrstr(const_xmlChar* str1, const_xmlChar* str2) nogil
+    cdef const_xmlChar* xmlStrchr(const_xmlChar* str1, xmlChar ch) nogil
+    cdef const_xmlChar* _xcstr "(const xmlChar*)PyBytes_AS_STRING" (object s)  # not a libxml2 function: the C name is a cast applied to PyBytes_AS_STRING; takes a Python object and is not declared nogil
+
+cdef extern from "libxml/encoding.h":  # character-encoding identifiers and encoding-handler lookup functions
+    ctypedef enum xmlCharEncoding:  # values run from -1 (error) through 22
+        XML_CHAR_ENCODING_ERROR = -1 # No char encoding detected
+        XML_CHAR_ENCODING_NONE = 0 # No char encoding detected
+        XML_CHAR_ENCODING_UTF8 = 1 # UTF-8
+        XML_CHAR_ENCODING_UTF16LE = 2 # UTF-16 little endian
+        XML_CHAR_ENCODING_UTF16BE = 3 # UTF-16 big endian
+        XML_CHAR_ENCODING_UCS4LE = 4 # UCS-4 little endian
+        XML_CHAR_ENCODING_UCS4BE = 5 # UCS-4 big endian
+        XML_CHAR_ENCODING_EBCDIC = 6 # EBCDIC uh!
+        XML_CHAR_ENCODING_UCS4_2143 = 7 # UCS-4 unusual ordering
+        XML_CHAR_ENCODING_UCS4_3412 = 8 # UCS-4 unusual ordering
+        XML_CHAR_ENCODING_UCS2 = 9 # UCS-2
+        XML_CHAR_ENCODING_8859_1 = 10 # ISO-8859-1 ISO Latin 1
+        XML_CHAR_ENCODING_8859_2 = 11 # ISO-8859-2 ISO Latin 2
+        XML_CHAR_ENCODING_8859_3 = 12 # ISO-8859-3
+        XML_CHAR_ENCODING_8859_4 = 13 # ISO-8859-4
+        XML_CHAR_ENCODING_8859_5 = 14 # ISO-8859-5
+        XML_CHAR_ENCODING_8859_6 = 15 # ISO-8859-6
+        XML_CHAR_ENCODING_8859_7 = 16 # ISO-8859-7
+        XML_CHAR_ENCODING_8859_8 = 17 # ISO-8859-8
+        XML_CHAR_ENCODING_8859_9 = 18 # ISO-8859-9
+        XML_CHAR_ENCODING_2022_JP = 19 # ISO-2022-JP
+        XML_CHAR_ENCODING_SHIFT_JIS = 20 # Shift_JIS
+        XML_CHAR_ENCODING_EUC_JP = 21 # EUC-JP
+        XML_CHAR_ENCODING_ASCII = 22 # pure ASCII
+
+    ctypedef struct xmlCharEncodingHandler  # opaque here: no fields are declared
+    cdef xmlCharEncodingHandler* xmlFindCharEncodingHandler(char* name) nogil  # handler lookup by encoding name
+    cdef xmlCharEncodingHandler* xmlGetCharEncodingHandler(
+        xmlCharEncoding enc) nogil  # handler lookup by enum value
+    cdef int xmlCharEncCloseFunc(xmlCharEncodingHandler* handler) nogil
+    cdef xmlCharEncoding xmlDetectCharEncoding(const_xmlChar* text, int len) nogil
+    cdef const_char* xmlGetCharEncodingName(xmlCharEncoding enc) nogil  # enum value -> name
+    cdef xmlCharEncoding xmlParseCharEncoding(char* name) nogil  # name -> enum value
+    ctypedef int (*xmlCharEncodingOutputFunc)(
+            unsigned char *out_buf, int *outlen, const_uchar *in_buf, int *inlen)  # callback type; both lengths are passed by pointer; not declared nogil
+
+cdef extern from "libxml/chvalid.h":  # character validity check
+    cdef int xmlIsChar_ch(char c) nogil  # takes a single char and returns an int
+
+cdef extern from "libxml/hash.h":  # hash-table type plus the scan and lookup entry points
+    ctypedef struct xmlHashTable  # opaque here: no fields are declared
+    ctypedef void (*xmlHashScanner)(void* payload, void* data, const_xmlChar* name) # may require GIL!
+    void xmlHashScan(xmlHashTable* table, xmlHashScanner f, void* data) nogil  # declared nogil even though the scanner callback type above is not
+    void* xmlHashLookup(xmlHashTable* table, const_xmlChar* name) nogil  # returns an untyped pointer
+
+cdef extern from *: # actually "libxml/dict.h"
+    # libxml/dict.h appears to be broken to include in C
+    ctypedef struct xmlDict  # opaque here: no fields are declared
+    cdef const_xmlChar* xmlDictLookup(xmlDict* dict, const_xmlChar* name, int len) nogil
+    cdef const_xmlChar* xmlDictExists(xmlDict* dict, const_xmlChar* name, int len) nogil  # same signature as xmlDictLookup
+    cdef int xmlDictOwns(xmlDict* dict, const_xmlChar* name) nogil
+    cdef size_t xmlDictSize(xmlDict* dict) nogil
+
+cdef extern from "libxml/tree.h":  # core tree API: node-type enums, node/document/DTD structs, and tree functions
+    ctypedef struct xmlDoc  # forward declaration; fields are declared further down in this block
+    ctypedef struct xmlAttr  # forward declaration; fields are declared further down in this block
+    ctypedef struct xmlNotationTable  # opaque here: no fields are declared
+
+    ctypedef enum xmlElementType:  # type of the "type" field in the node-like structs below
+        XML_ELEMENT_NODE=           1
+        XML_ATTRIBUTE_NODE=         2
+        XML_TEXT_NODE=              3
+        XML_CDATA_SECTION_NODE=     4
+        XML_ENTITY_REF_NODE=        5
+        XML_ENTITY_NODE=            6
+        XML_PI_NODE=                7
+        XML_COMMENT_NODE=           8
+        XML_DOCUMENT_NODE=          9
+        XML_DOCUMENT_TYPE_NODE=     10
+        XML_DOCUMENT_FRAG_NODE=     11
+        XML_NOTATION_NODE=          12
+        XML_HTML_DOCUMENT_NODE=     13
+        XML_DTD_NODE=               14
+        XML_ELEMENT_DECL=           15
+        XML_ATTRIBUTE_DECL=         16
+        XML_ENTITY_DECL=            17
+        XML_NAMESPACE_DECL=         18
+        XML_XINCLUDE_START=         19
+        XML_XINCLUDE_END=           20
+
+    ctypedef enum xmlElementTypeVal:  # type of xmlElement.etype
+        XML_ELEMENT_TYPE_UNDEFINED= 0
+        XML_ELEMENT_TYPE_EMPTY=     1
+        XML_ELEMENT_TYPE_ANY=       2
+        XML_ELEMENT_TYPE_MIXED=     3
+        XML_ELEMENT_TYPE_ELEMENT=   4
+
+    ctypedef enum xmlElementContentType:  # type of xmlElementContent.type
+        XML_ELEMENT_CONTENT_PCDATA=  1
+        XML_ELEMENT_CONTENT_ELEMENT= 2
+        XML_ELEMENT_CONTENT_SEQ=     3
+        XML_ELEMENT_CONTENT_OR=      4
+
+    ctypedef enum xmlElementContentOccur:  # type of xmlElementContent.ocur
+        XML_ELEMENT_CONTENT_ONCE= 1
+        XML_ELEMENT_CONTENT_OPT=  2
+        XML_ELEMENT_CONTENT_MULT= 3
+        XML_ELEMENT_CONTENT_PLUS= 4
+
+    ctypedef enum xmlAttributeType:  # type of xmlAttribute.atype
+        XML_ATTRIBUTE_CDATA =      1
+        XML_ATTRIBUTE_ID=          2
+        XML_ATTRIBUTE_IDREF=       3
+        XML_ATTRIBUTE_IDREFS=      4
+        XML_ATTRIBUTE_ENTITY=      5
+        XML_ATTRIBUTE_ENTITIES=    6
+        XML_ATTRIBUTE_NMTOKEN=     7
+        XML_ATTRIBUTE_NMTOKENS=    8
+        XML_ATTRIBUTE_ENUMERATION= 9
+        XML_ATTRIBUTE_NOTATION=    10
+    
+    ctypedef enum xmlAttributeDefault:  # type of xmlAttribute.def_
+        XML_ATTRIBUTE_NONE=     1
+        XML_ATTRIBUTE_REQUIRED= 2
+        XML_ATTRIBUTE_IMPLIED=  3
+        XML_ATTRIBUTE_FIXED=    4
+
+    ctypedef enum xmlEntityType:  # type of xmlEntity.etype
+        XML_INTERNAL_GENERAL_ENTITY=          1
+        XML_EXTERNAL_GENERAL_PARSED_ENTITY=   2
+        XML_EXTERNAL_GENERAL_UNPARSED_ENTITY= 3
+        XML_INTERNAL_PARAMETER_ENTITY=        4
+        XML_EXTERNAL_PARAMETER_ENTITY=        5
+        XML_INTERNAL_PREDEFINED_ENTITY=       6
+
+    ctypedef struct xmlNs:  # namespace record: href/prefix pair chained through "next"
+        const_xmlChar* href
+        const_xmlChar* prefix
+        xmlNs* next
+
+    ctypedef struct xmlNode:  # generic tree node; the structs below repeat its leading fields (_private .. doc)
+        void* _private
+        xmlElementType   type
+        const_xmlChar* name
+        xmlNode* children
+        xmlNode* last
+        xmlNode* parent
+        xmlNode* next
+        xmlNode* prev
+        xmlDoc* doc
+        xmlChar* content
+        xmlAttr* properties
+        xmlNs* ns
+        xmlNs* nsDef
+        unsigned short line  # 16-bit field; xmlGetLineNo() below returns a long instead
+
+    ctypedef struct xmlElementContent:  # node of a content-model tree: c1/c2 children plus parent link
+        xmlElementContentType type
+        xmlElementContentOccur ocur
+        const_xmlChar *name
+        xmlElementContent *c1
+        xmlElementContent *c2
+        xmlElementContent *parent
+        const_xmlChar *prefix
+
+    ctypedef struct xmlEnumeration:  # singly linked list of names
+        xmlEnumeration *next
+        const_xmlChar *name
+
+    ctypedef struct xmlAttribute:  # attribute declaration; note parent is an xmlDtd*, not an xmlNode*
+        void* _private
+        xmlElementType type
+        const_xmlChar* name
+        xmlNode* children
+        xmlNode* last
+        xmlDtd* parent
+        xmlNode* next
+        xmlNode* prev
+        xmlDoc* doc
+        xmlAttribute* nexth
+        xmlAttributeType atype
+        xmlAttributeDefault def_ "def"  # C field is named "def"; exposed as def_ because def is a Python/Cython keyword
+        const_xmlChar* defaultValue
+        xmlEnumeration* tree
+        const_xmlChar* prefix
+        const_xmlChar* elem
+
+    ctypedef struct xmlElement:  # element declaration: node header plus content model and attribute declarations
+        void* _private
+        xmlElementType   type
+        const_xmlChar* name
+        xmlNode* children
+        xmlNode* last
+        xmlNode* parent
+        xmlNode* next
+        xmlNode* prev
+        xmlDoc* doc
+        xmlElementTypeVal etype
+        xmlElementContent* content
+        xmlAttribute* attributes
+        const_xmlChar* prefix
+        void *contModel  # declared untyped (void*) here
+
+    ctypedef struct xmlEntity:  # entity declaration; note parent is an xmlDtd*, not an xmlNode*
+        void* _private
+        xmlElementType type
+        const_xmlChar* name
+        xmlNode* children
+        xmlNode* last
+        xmlDtd* parent
+        xmlNode* next
+        xmlNode* prev
+        xmlDoc* doc
+        xmlChar* orig
+        xmlChar* content
+        int length
+        xmlEntityType etype
+        const_xmlChar* ExternalID
+        const_xmlChar* SystemID
+        xmlEntity* nexte
+        const_xmlChar* URI
+        int owner
+        int checked
+
+    ctypedef struct xmlDtd:  # DTD record; only the fields listed here are visible to Cython code
+        const_xmlChar* name
+        const_xmlChar* ExternalID
+        const_xmlChar* SystemID
+        void* notations  # the five table pointers are declared untyped (void*) here
+        void* entities
+        void* pentities
+        void* attributes
+        void* elements
+        xmlNode* children
+        xmlNode* last
+        xmlDoc* doc
+
+    ctypedef struct xmlDoc:  # document record (forward-declared at the top of this block)
+        xmlElementType type
+        char* name
+        xmlNode* children
+        xmlNode* last
+        xmlNode* parent
+        xmlNode* next
+        xmlNode* prev
+        xmlDoc* doc
+        xmlDict* dict
+        xmlHashTable* ids
+        int standalone
+        const_xmlChar* version
+        const_xmlChar* encoding
+        const_xmlChar* URL
+        void* _private
+        xmlDtd* intSubset
+        xmlDtd* extSubset
+        
+    ctypedef struct xmlAttr:  # attribute node (forward-declared at the top of this block); siblings are xmlAttr*, not xmlNode*
+        void* _private
+        xmlElementType type
+        const_xmlChar* name
+        xmlNode* children
+        xmlNode* last
+        xmlNode* parent
+        xmlAttr* next
+        xmlAttr* prev
+        xmlDoc* doc
+        xmlNs* ns
+
+    ctypedef struct xmlID:  # ties an ID value to its attribute and document
+        const_xmlChar* value
+        xmlAttr* attr
+        xmlDoc* doc
+        
+    ctypedef struct xmlBuffer  # opaque here: no fields are declared
+
+    ctypedef struct xmlBuf   # new in libxml2 2.9
+
+    ctypedef struct xmlOutputBuffer:  # both buffers are typed as the 2.9-era xmlBuf*
+        xmlBuf* buffer
+        xmlBuf* conv
+        int error
+
+    const_xmlChar* XML_XML_NAMESPACE  # constant from the header, exposed as a const xmlChar string
+        
+    cdef void xmlFreeDoc(xmlDoc* cur) nogil  # xmlFree* group: release functions, all declared nogil
+    cdef void xmlFreeDtd(xmlDtd* cur) nogil
+    cdef void xmlFreeNode(xmlNode* cur) nogil
+    cdef void xmlFreeNsList(xmlNs* ns) nogil
+    cdef void xmlFreeNs(xmlNs* ns) nogil
+    cdef void xmlFree(void* buf) nogil  # takes an untyped pointer
+    
+    cdef xmlNode* xmlNewNode(xmlNs* ns, const_xmlChar* name) nogil  # xmlNew* group: constructors for nodes, namespaces, documents and attributes
+    cdef xmlNode* xmlNewDocText(xmlDoc* doc, const_xmlChar* content) nogil
+    cdef xmlNode* xmlNewDocComment(xmlDoc* doc, const_xmlChar* content) nogil
+    cdef xmlNode* xmlNewDocPI(xmlDoc* doc, const_xmlChar* name, const_xmlChar* content) nogil
+    cdef xmlNode* xmlNewReference(xmlDoc* doc, const_xmlChar* name) nogil
+    cdef xmlNode* xmlNewCDataBlock(xmlDoc* doc, const_xmlChar* text, int len) nogil
+    cdef xmlNs* xmlNewNs(xmlNode* node, const_xmlChar* href, const_xmlChar* prefix) nogil
+    cdef xmlNode* xmlAddChild(xmlNode* parent, xmlNode* cur) nogil  # tree-linking functions; each returns an xmlNode*
+    cdef xmlNode* xmlReplaceNode(xmlNode* old, xmlNode* cur) nogil
+    cdef xmlNode* xmlAddPrevSibling(xmlNode* cur, xmlNode* elem) nogil
+    cdef xmlNode* xmlAddNextSibling(xmlNode* cur, xmlNode* elem) nogil
+    cdef xmlNode* xmlNewDocNode(xmlDoc* doc, xmlNs* ns,
+                                const_xmlChar* name, const_xmlChar* content) nogil
+    cdef xmlDoc* xmlNewDoc(const_xmlChar* version) nogil
+    cdef xmlAttr* xmlNewProp(xmlNode* node, const_xmlChar* name, const_xmlChar* value) nogil  # attribute ("prop") functions follow
+    cdef xmlAttr* xmlNewNsProp(xmlNode* node, xmlNs* ns,
+                               const_xmlChar* name, const_xmlChar* value) nogil
+    cdef xmlChar* xmlGetNoNsProp(xmlNode* node, const_xmlChar* name) nogil  # returns non-const xmlChar* -- presumably caller-owned; confirm in libxml2 docs
+    cdef xmlChar* xmlGetNsProp(xmlNode* node, const_xmlChar* name, const_xmlChar* nameSpace) nogil
+    cdef void xmlSetNs(xmlNode* node, xmlNs* ns) nogil
+    cdef xmlAttr* xmlSetProp(xmlNode* node, const_xmlChar* name, const_xmlChar* value) nogil
+    cdef xmlAttr* xmlSetNsProp(xmlNode* node, xmlNs* ns,
+                               const_xmlChar* name, const_xmlChar* value) nogil
+    cdef int xmlRemoveProp(xmlAttr* cur) nogil
+    cdef xmlChar* xmlGetNodePath(xmlNode* node) nogil
+    cdef void xmlDocDumpMemory(xmlDoc* cur, char** mem, int* size) nogil  # result is delivered through the mem/size out-parameters
+    cdef void xmlDocDumpMemoryEnc(xmlDoc* cur, char** mem, int* size,
+                                  char* encoding) nogil
+    cdef int xmlSaveFileTo(xmlOutputBuffer* out, xmlDoc* cur,
+                           char* encoding) nogil
+
+    cdef void xmlUnlinkNode(xmlNode* cur) nogil
+    cdef xmlNode* xmlDocSetRootElement(xmlDoc* doc, xmlNode* root) nogil
+    cdef xmlNode* xmlDocGetRootElement(xmlDoc* doc) nogil
+    cdef void xmlSetTreeDoc(xmlNode* tree, xmlDoc* doc) nogil
+    cdef xmlAttr* xmlHasProp(xmlNode* node, const_xmlChar* name) nogil  # returns the xmlAttr*, whereas the xmlGet*Prop functions above return xmlChar*
+    cdef xmlAttr* xmlHasNsProp(xmlNode* node, const_xmlChar* name, const_xmlChar* nameSpace) nogil
+    cdef xmlChar* xmlNodeGetContent(xmlNode* cur) nogil
+    cdef int xmlNodeBufGetContent(xmlBuffer* buffer, xmlNode* cur) nogil  # writes into a caller-supplied xmlBuffer
+    cdef xmlNs* xmlSearchNs(xmlDoc* doc, xmlNode* node, const_xmlChar* prefix) nogil  # namespace lookup by prefix
+    cdef xmlNs* xmlSearchNsByHref(xmlDoc* doc, xmlNode* node, const_xmlChar* href) nogil  # namespace lookup by href
+    cdef int xmlIsBlankNode(xmlNode* node) nogil
+    cdef long xmlGetLineNo(xmlNode* node) nogil  # returns long, wider than the unsigned short xmlNode.line field
+    cdef void xmlElemDump(stdio.FILE* f, xmlDoc* doc, xmlNode* cur) nogil
+    cdef void xmlNodeDumpOutput(xmlOutputBuffer* buf,
+                                xmlDoc* doc, xmlNode* cur, int level,
+                                int format, const_char* encoding) nogil
+    cdef void xmlNodeSetName(xmlNode* cur, const_xmlChar* name) nogil
+    cdef void xmlNodeSetContent(xmlNode* cur, const_xmlChar* content) nogil
+    cdef xmlDtd* xmlCopyDtd(xmlDtd* dtd) nogil  # copy functions for DTDs, documents and nodes
+    cdef xmlDoc* xmlCopyDoc(xmlDoc* doc, int recursive) nogil
+    cdef xmlNode* xmlCopyNode(xmlNode* node, int extended) nogil
+    cdef xmlNode* xmlDocCopyNode(xmlNode* node, xmlDoc* doc, int extended) nogil
+    cdef int xmlReconciliateNs(xmlDoc* doc, xmlNode* tree) nogil  # spelling matches the libxml2 symbol name
+    cdef xmlNs* xmlNewReconciliedNs(xmlDoc* doc, xmlNode* tree, xmlNs* ns) nogil  # spelling matches the libxml2 symbol name
+    cdef xmlBuffer* xmlBufferCreate() nogil  # xmlBuffer* functions operate on the older xmlBuffer type
+    cdef void xmlBufferWriteChar(xmlBuffer* buf, char* string) nogil
+    cdef void xmlBufferFree(xmlBuffer* buf) nogil
+    cdef const_xmlChar* xmlBufferContent(xmlBuffer* buf) nogil
+    cdef int xmlBufferLength(xmlBuffer* buf) nogil  # length is an int here; xmlBufUse below returns size_t
+    cdef const_xmlChar* xmlBufContent(xmlBuf* buf) nogil # new in libxml2 2.9
+    cdef size_t xmlBufUse(xmlBuf* buf) nogil # new in libxml2 2.9
+    cdef int xmlKeepBlanksDefault(int val) nogil
+    cdef xmlChar* xmlNodeGetBase(xmlDoc* doc, xmlNode* node) nogil
+    cdef void xmlNodeSetBase(xmlNode* node, const_xmlChar* uri) nogil
+    cdef int xmlValidateNCName(const_xmlChar* value, int space) nogil
+
+cdef extern from "libxml/uri.h":  # URI resolution helper used alongside the tree API
+    cdef const_xmlChar* xmlBuildURI(const_xmlChar* href, const_xmlChar* base) nogil  # NOTE(review): declared const here; libxml2 documents the result as newly allocated -- confirm callers free it
+
+cdef extern from "libxml/HTMLtree.h":  # HTML counterparts of the document constructor and node serializer
+    cdef void htmlNodeDumpFormatOutput(xmlOutputBuffer* buf,
+                                       xmlDoc* doc, xmlNode* cur,
+                                       char* encoding, int format) nogil  # note argument order: encoding precedes format, unlike xmlNodeDumpOutput
+    cdef xmlDoc* htmlNewDoc(const_xmlChar* uri, const_xmlChar* externalID) nogil  # returns the same xmlDoc type used for XML documents
+
+cdef extern from "libxml/valid.h":  # the two validation-module helpers declared for lxml
+    cdef xmlAttr* xmlGetID(xmlDoc* doc, const_xmlChar* ID) nogil  # returns the xmlAttr* for a given ID string
+    cdef void xmlDumpNotationTable(xmlBuffer* buffer,
+                                   xmlNotationTable* table) nogil  # writes into a caller-supplied xmlBuffer
+
+cdef extern from "libxml/xmlIO.h":  # output-buffer writing functions, I/O callback types, and output-buffer constructors
+    cdef int xmlOutputBufferWrite(xmlOutputBuffer* out,
+                                  int len, const_char* str) nogil  # note: length comes before the data pointer
+    cdef int xmlOutputBufferWriteString(xmlOutputBuffer* out, const_char* str) nogil
+    cdef int xmlOutputBufferWriteEscape(xmlOutputBuffer* out,
+                                        const_xmlChar* str,
+                                        xmlCharEncodingOutputFunc escapefunc) nogil  # escapefunc uses the callback type declared under encoding.h
+    cdef int xmlOutputBufferFlush(xmlOutputBuffer* out) nogil
+    cdef int xmlOutputBufferClose(xmlOutputBuffer* out) nogil
+
+    ctypedef int (*xmlInputReadCallback)(void* context,
+                                         char* buffer, int len)  # callback types in this block are not declared nogil
+    ctypedef int (*xmlInputCloseCallback)(void* context)
+
+    ctypedef int (*xmlOutputWriteCallback)(void* context,
+                                           char* buffer, int len)  # same shape as xmlInputReadCallback
+    ctypedef int (*xmlOutputCloseCallback)(void* context)
+
+    cdef xmlOutputBuffer* xmlAllocOutputBuffer(
+        xmlCharEncodingHandler* encoder) nogil  # constructor taking only an encoder
+    cdef xmlOutputBuffer* xmlOutputBufferCreateIO(
+        xmlOutputWriteCallback iowrite,
+        xmlOutputCloseCallback ioclose,
+        void * ioctx, 
+        xmlCharEncodingHandler* encoder) nogil  # constructor driven by the write/close callbacks plus a context pointer
+    cdef xmlOutputBuffer* xmlOutputBufferCreateFile(
+        stdio.FILE* file, xmlCharEncodingHandler* encoder) nogil  # constructor over a C FILE*
+    cdef xmlOutputBuffer* xmlOutputBufferCreateFilename(
+        char* URI, xmlCharEncodingHandler* encoder, int compression) nogil  # constructor from a URI string; also takes a compression argument
+
+cdef extern from "libxml/xmlsave.h":  # save-context API: option flags, context constructors, save/flush/close
+    ctypedef struct xmlSaveCtxt  # opaque here: no fields are declared
+
+    ctypedef enum xmlSaveOption:  # each value is a distinct power of two; trailing notes give the libxml2 version
+        XML_SAVE_FORMAT   = 1   # format save output            (2.6.17)
+        XML_SAVE_NO_DECL  = 2   # drop the xml declaration      (2.6.21)
+        XML_SAVE_NO_EMPTY = 4   # no empty tags                 (2.6.22)
+        XML_SAVE_NO_XHTML = 8   # disable XHTML1 specific rules (2.6.22)
+        XML_SAVE_XHTML = 16     # force XHTML1 specific rules         (2.7.2)
+        XML_SAVE_AS_XML = 32    # force XML serialization on HTML doc (2.7.2)
+        XML_SAVE_AS_HTML = 64   # force HTML serialization on XML doc (2.7.2)
+
+    cdef xmlSaveCtxt* xmlSaveToFilename(char* filename, char* encoding,
+                                        int options) nogil  # presumably options is an OR of xmlSaveOption -- confirm against libxml2 docs
+    cdef xmlSaveCtxt* xmlSaveToBuffer(xmlBuffer* buffer, char* encoding,
+                                      int options) nogil # libxml2 2.6.23
+    cdef long xmlSaveDoc(xmlSaveCtxt* ctxt, xmlDoc* doc) nogil  # returns long, unlike the int-returning close/flush below
+    cdef long xmlSaveTree(xmlSaveCtxt* ctxt, xmlNode* node) nogil
+    cdef int xmlSaveClose(xmlSaveCtxt* ctxt) nogil
+    cdef int xmlSaveFlush(xmlSaveCtxt* ctxt) nogil
+    cdef int xmlSaveSetAttrEscape(xmlSaveCtxt* ctxt, void* escape_func) nogil  # callback is declared as an untyped void* here
+    cdef int xmlSaveSetEscape(xmlSaveCtxt* ctxt, void* escape_func) nogil  # callback is declared as an untyped void* here
+
+cdef extern from "libxml/globals.h":  # xmlThrDef* setters; each takes an int on/off flag and returns an int
+    cdef int xmlThrDefKeepBlanksDefaultValue(int onoff) nogil
+    cdef int xmlThrDefLineNumbersDefaultValue(int onoff) nogil
+    cdef int xmlThrDefIndentTreeOutput(int onoff) nogil
+    
+cdef extern from "libxml/xmlmemory.h" nogil:  # nogil on the block header applies to every declaration below
+    cdef void* xmlMalloc(size_t size)
+    cdef int xmlMemBlocks()  # memory statistics accessors returning int
+    cdef int xmlMemUsed()
+    cdef void xmlMemDisplay(stdio.FILE* file)  # the remaining functions write to a C FILE*
+    cdef void xmlMemDisplayLast(stdio.FILE* file, long num_bytes)
+    cdef void xmlMemShow(stdio.FILE* file, int count)
+
+cdef extern from "etree_defs.h":  # helpers from lxml's own C header, not from libxml2
+    cdef bint _isElement(xmlNode* node) nogil  # node predicates returning a C boolean
+    cdef bint _isElementOrXInclude(xmlNode* node) nogil
+    cdef const_xmlChar* _getNs(xmlNode* node) nogil
+    cdef void BEGIN_FOR_EACH_ELEMENT_FROM(xmlNode* tree_top,
+                                          xmlNode* start_node,
+                                          bint inclusive) nogil  # presumably a C macro opening a traversal loop, paired with the END_ form below -- confirm in etree_defs.h
+    cdef void END_FOR_EACH_ELEMENT_FROM(xmlNode* start_node) nogil
+    cdef void BEGIN_FOR_EACH_FROM(xmlNode* tree_top,
+                                  xmlNode* start_node,
+                                  bint inclusive) nogil  # same signature as BEGIN_FOR_EACH_ELEMENT_FROM
+    cdef void END_FOR_EACH_FROM(xmlNode* start_node) nogil
diff --git a/lib/lxml/includes/uri.pxd b/lib/lxml/includes/uri.pxd
new file mode 100644
index 00000000..2b6bb79f
--- /dev/null
+++ b/lib/lxml/includes/uri.pxd
@@ -0,0 +1,5 @@
+cdef extern from "libxml/uri.h":  # URI parsing: one opaque type with its parse and free functions
+    ctypedef struct xmlURI  # opaque here: no fields are declared
+
+    cdef xmlURI* xmlParseURI(char* str)  # NOTE(review): neither function here is declared nogil, unlike most other libxml2 declarations -- confirm intent
+    cdef void xmlFreeURI(xmlURI* uri)  # release function for the xmlURI* returned above
diff --git a/lib/lxml/includes/xinclude.pxd b/lib/lxml/includes/xinclude.pxd
new file mode 100644
index 00000000..4232d3e4
--- /dev/null
+++ b/lib/lxml/includes/xinclude.pxd
@@ -0,0 +1,22 @@
+from lxml.includes.tree cimport xmlDoc, xmlNode
+
+cdef extern from "libxml/xinclude.h":  # XInclude processing entry points; every function returns int and is nogil except the context constructor's pointer return
+
+    ctypedef struct xmlXIncludeCtxt  # opaque here: no fields are declared
+
+    cdef int xmlXIncludeProcess(xmlDoc* doc) nogil  # document-level variants take an xmlDoc*
+    cdef int xmlXIncludeProcessFlags(xmlDoc* doc, int parser_opts) nogil
+    cdef int xmlXIncludeProcessTree(xmlNode* doc) nogil  # tree-level variants take an xmlNode*, although the parameter is still named doc
+    cdef int xmlXIncludeProcessTreeFlags(xmlNode* doc, int parser_opts) nogil
+
+    # libxml2 >= 2.7.4
+    cdef int xmlXIncludeProcessTreeFlagsData(
+            xmlNode* doc, int parser_opts, void* data) nogil  # adds an untyped data pointer to the TreeFlags variant
+
+    cdef xmlXIncludeCtxt* xmlXIncludeNewContext(xmlDoc* doc) nogil  # context-based API: create, set flags, process a node
+    cdef int xmlXIncludeProcessNode(xmlXIncludeCtxt* ctxt, xmlNode* node) nogil
+    cdef int xmlXIncludeSetFlags(xmlXIncludeCtxt* ctxt, int flags) nogil
+
+    # libxml2 >= 2.6.27
+    cdef int xmlXIncludeProcessFlagsData(
+        xmlDoc* doc, int flags, void* data) nogil  # adds an untyped data pointer to the document-level Flags variant
diff --git a/lib/lxml/includes/xmlerror.pxd b/lib/lxml/includes/xmlerror.pxd
new file mode 100644
index 00000000..6294c677
--- /dev/null
+++ b/lib/lxml/includes/xmlerror.pxd
@@ -0,0 +1,850 @@
+
+# --- BEGIN: GENERATED CONSTANTS ---
+
+# This section is generated by the script 'update-error-constants.py'.
+
+cdef extern from "libxml/xmlerror.h":
+    ctypedef enum xmlErrorLevel:  # error levels; numeric values rise from 0 (none) to 3 (fatal)
+        XML_ERR_NONE                                       =       0 # presumably "no error"; the generated output carries no comment for it
+        XML_ERR_WARNING                                    =       1 # A simple warning
+        XML_ERR_ERROR                                      =       2 # A recoverable error
+        XML_ERR_FATAL                                      =       3 # A fatal error
+
+    ctypedef enum xmlErrorDomain:  # one constant per library module, as named in the comments below
+        XML_FROM_NONE                                      =       0
+        XML_FROM_PARSER                                    =       1 # The XML parser
+        XML_FROM_TREE                                      =       2 # The tree module
+        XML_FROM_NAMESPACE                                 =       3 # The XML Namespace module
+        XML_FROM_DTD                                       =       4 # The XML DTD validation with parser context
+        XML_FROM_HTML                                      =       5 # The HTML parser
+        XML_FROM_MEMORY                                    =       6 # The memory allocator
+        XML_FROM_OUTPUT                                    =       7 # The serialization code
+        XML_FROM_IO                                        =       8 # The Input/Output stack
+        XML_FROM_FTP                                       =       9 # The FTP module
+        XML_FROM_HTTP                                      =      10 # The HTTP module
+        XML_FROM_XINCLUDE                                  =      11 # The XInclude processing
+        XML_FROM_XPATH                                     =      12 # The XPath module
+        XML_FROM_XPOINTER                                  =      13 # The XPointer module
+        XML_FROM_REGEXP                                    =      14 # The regular expressions module
+        XML_FROM_DATATYPE                                  =      15 # The W3C XML Schemas Datatype module
+        XML_FROM_SCHEMASP                                  =      16 # The W3C XML Schemas parser module
+        XML_FROM_SCHEMASV                                  =      17 # The W3C XML Schemas validation module
+        XML_FROM_RELAXNGP                                  =      18 # The Relax-NG parser module
+        XML_FROM_RELAXNGV                                  =      19 # The Relax-NG validator module
+        XML_FROM_CATALOG                                   =      20 # The Catalog module
+        XML_FROM_C14N                                      =      21 # The Canonicalization module
+        XML_FROM_XSLT                                      =      22 # The XSLT engine from libxslt
+        XML_FROM_VALID                                     =      23 # The XML DTD validation with valid context
+        XML_FROM_CHECK                                     =      24 # The error checking module
+        XML_FROM_WRITER                                    =      25 # The xmlwriter module
+        XML_FROM_MODULE                                    =      26 # The dynamically loaded module module
+        XML_FROM_I18N                                      =      27 # The module handling character conversion
+        XML_FROM_SCHEMATRONV                               =      28 # The Schematron validator module
+        XML_FROM_BUFFER                                    =      29 # The buffers module
+        XML_FROM_URI                                       =      30 # The URI module
+
+    ctypedef enum xmlParserErrors:
+        XML_ERR_OK                                         =       0
+        XML_ERR_INTERNAL_ERROR                             =       1
+        XML_ERR_NO_MEMORY                                  =       2
+        XML_ERR_DOCUMENT_START                             =       3
+        XML_ERR_DOCUMENT_EMPTY                             =       4
+        XML_ERR_DOCUMENT_END                               =       5
+        XML_ERR_INVALID_HEX_CHARREF                        =       6
+        XML_ERR_INVALID_DEC_CHARREF                        =       7
+        XML_ERR_INVALID_CHARREF                            =       8
+        XML_ERR_INVALID_CHAR                               =       9
+        XML_ERR_CHARREF_AT_EOF                             =      10
+        XML_ERR_CHARREF_IN_PROLOG                          =      11
+        XML_ERR_CHARREF_IN_EPILOG                          =      12
+        XML_ERR_CHARREF_IN_DTD                             =      13
+        XML_ERR_ENTITYREF_AT_EOF                           =      14
+        XML_ERR_ENTITYREF_IN_PROLOG                        =      15
+        XML_ERR_ENTITYREF_IN_EPILOG                        =      16
+        XML_ERR_ENTITYREF_IN_DTD                           =      17
+        XML_ERR_PEREF_AT_EOF                               =      18
+        XML_ERR_PEREF_IN_PROLOG                            =      19
+        XML_ERR_PEREF_IN_EPILOG                            =      20
+        XML_ERR_PEREF_IN_INT_SUBSET                        =      21
+        XML_ERR_ENTITYREF_NO_NAME                          =      22
+        XML_ERR_ENTITYREF_SEMICOL_MISSING                  =      23
+        XML_ERR_PEREF_NO_NAME                              =      24
+        XML_ERR_PEREF_SEMICOL_MISSING                      =      25
+        XML_ERR_UNDECLARED_ENTITY                          =      26
+        XML_WAR_UNDECLARED_ENTITY                          =      27
+        XML_ERR_UNPARSED_ENTITY                            =      28
+        XML_ERR_ENTITY_IS_EXTERNAL                         =      29
+        XML_ERR_ENTITY_IS_PARAMETER                        =      30
+        XML_ERR_UNKNOWN_ENCODING                           =      31
+        XML_ERR_UNSUPPORTED_ENCODING                       =      32
+        XML_ERR_STRING_NOT_STARTED                         =      33
+        XML_ERR_STRING_NOT_CLOSED                          =      34
+        XML_ERR_NS_DECL_ERROR                              =      35
+        XML_ERR_ENTITY_NOT_STARTED                         =      36
+        XML_ERR_ENTITY_NOT_FINISHED                        =      37
+        XML_ERR_LT_IN_ATTRIBUTE                            =      38
+        XML_ERR_ATTRIBUTE_NOT_STARTED                      =      39
+        XML_ERR_ATTRIBUTE_NOT_FINISHED                     =      40
+        XML_ERR_ATTRIBUTE_WITHOUT_VALUE                    =      41
+        XML_ERR_ATTRIBUTE_REDEFINED                        =      42
+        XML_ERR_LITERAL_NOT_STARTED                        =      43
+        XML_ERR_LITERAL_NOT_FINISHED                       =      44
+        XML_ERR_COMMENT_NOT_FINISHED                       =      45
+        XML_ERR_PI_NOT_STARTED                             =      46
+        XML_ERR_PI_NOT_FINISHED                            =      47
+        XML_ERR_NOTATION_NOT_STARTED                       =      48
+        XML_ERR_NOTATION_NOT_FINISHED                      =      49
+        XML_ERR_ATTLIST_NOT_STARTED                        =      50
+        XML_ERR_ATTLIST_NOT_FINISHED                       =      51
+        XML_ERR_MIXED_NOT_STARTED                          =      52
+        XML_ERR_MIXED_NOT_FINISHED                         =      53
+        XML_ERR_ELEMCONTENT_NOT_STARTED                    =      54
+        XML_ERR_ELEMCONTENT_NOT_FINISHED                   =      55
+        XML_ERR_XMLDECL_NOT_STARTED                        =      56
+        XML_ERR_XMLDECL_NOT_FINISHED                       =      57
+        XML_ERR_CONDSEC_NOT_STARTED                        =      58
+        XML_ERR_CONDSEC_NOT_FINISHED                       =      59
+        XML_ERR_EXT_SUBSET_NOT_FINISHED                    =      60
+        XML_ERR_DOCTYPE_NOT_FINISHED                       =      61
+        XML_ERR_MISPLACED_CDATA_END                        =      62
+        XML_ERR_CDATA_NOT_FINISHED                         =      63
+        XML_ERR_RESERVED_XML_NAME                          =      64
+        XML_ERR_SPACE_REQUIRED                             =      65
+        XML_ERR_SEPARATOR_REQUIRED                         =      66
+        XML_ERR_NMTOKEN_REQUIRED                           =      67
+        XML_ERR_NAME_REQUIRED                              =      68
+        XML_ERR_PCDATA_REQUIRED                            =      69
+        XML_ERR_URI_REQUIRED                               =      70
+        XML_ERR_PUBID_REQUIRED                             =      71
+        XML_ERR_LT_REQUIRED                                =      72
+        XML_ERR_GT_REQUIRED                                =      73
+        XML_ERR_LTSLASH_REQUIRED                           =      74
+        XML_ERR_EQUAL_REQUIRED                             =      75
+        XML_ERR_TAG_NAME_MISMATCH                          =      76
+        XML_ERR_TAG_NOT_FINISHED                           =      77
+        XML_ERR_STANDALONE_VALUE                           =      78
+        XML_ERR_ENCODING_NAME                              =      79
+        XML_ERR_HYPHEN_IN_COMMENT                          =      80
+        XML_ERR_INVALID_ENCODING                           =      81
+        XML_ERR_EXT_ENTITY_STANDALONE                      =      82
+        XML_ERR_CONDSEC_INVALID                            =      83
+        XML_ERR_VALUE_REQUIRED                             =      84
+        XML_ERR_NOT_WELL_BALANCED                          =      85
+        XML_ERR_EXTRA_CONTENT                              =      86
+        XML_ERR_ENTITY_CHAR_ERROR                          =      87
+        XML_ERR_ENTITY_PE_INTERNAL                         =      88
+        XML_ERR_ENTITY_LOOP                                =      89
+        XML_ERR_ENTITY_BOUNDARY                            =      90
+        XML_ERR_INVALID_URI                                =      91
+        XML_ERR_URI_FRAGMENT                               =      92
+        XML_WAR_CATALOG_PI                                 =      93
+        XML_ERR_NO_DTD                                     =      94
+        XML_ERR_CONDSEC_INVALID_KEYWORD                    =      95
+        XML_ERR_VERSION_MISSING                            =      96
+        XML_WAR_UNKNOWN_VERSION                            =      97
+        XML_WAR_LANG_VALUE                                 =      98
+        XML_WAR_NS_URI                                     =      99
+        XML_WAR_NS_URI_RELATIVE                            =     100
+        XML_ERR_MISSING_ENCODING                           =     101
+        XML_WAR_SPACE_VALUE                                =     102
+        XML_ERR_NOT_STANDALONE                             =     103
+        XML_ERR_ENTITY_PROCESSING                          =     104
+        XML_ERR_NOTATION_PROCESSING                        =     105
+        XML_WAR_NS_COLUMN                                  =     106
+        XML_WAR_ENTITY_REDEFINED                           =     107
+        XML_ERR_UNKNOWN_VERSION                            =     108
+        XML_ERR_VERSION_MISMATCH                           =     109
+        XML_ERR_NAME_TOO_LONG                              =     110
+        XML_ERR_USER_STOP                                  =     111
+        XML_NS_ERR_XML_NAMESPACE                           =     200
+        XML_NS_ERR_UNDEFINED_NAMESPACE                     =     201
+        XML_NS_ERR_QNAME                                   =     202
+        XML_NS_ERR_ATTRIBUTE_REDEFINED                     =     203
+        XML_NS_ERR_EMPTY                                   =     204
+        XML_NS_ERR_COLON                                   =     205
+        XML_DTD_ATTRIBUTE_DEFAULT                          =     500
+        XML_DTD_ATTRIBUTE_REDEFINED                        =     501
+        XML_DTD_ATTRIBUTE_VALUE                            =     502
+        XML_DTD_CONTENT_ERROR                              =     503
+        XML_DTD_CONTENT_MODEL                              =     504
+        XML_DTD_CONTENT_NOT_DETERMINIST                    =     505
+        XML_DTD_DIFFERENT_PREFIX                           =     506
+        XML_DTD_ELEM_DEFAULT_NAMESPACE                     =     507
+        XML_DTD_ELEM_NAMESPACE                             =     508
+        XML_DTD_ELEM_REDEFINED                             =     509
+        XML_DTD_EMPTY_NOTATION                             =     510
+        XML_DTD_ENTITY_TYPE                                =     511
+        XML_DTD_ID_FIXED                                   =     512
+        XML_DTD_ID_REDEFINED                               =     513
+        XML_DTD_ID_SUBSET                                  =     514
+        XML_DTD_INVALID_CHILD                              =     515
+        XML_DTD_INVALID_DEFAULT                            =     516
+        XML_DTD_LOAD_ERROR                                 =     517
+        XML_DTD_MISSING_ATTRIBUTE                          =     518
+        XML_DTD_MIXED_CORRUPT                              =     519
+        XML_DTD_MULTIPLE_ID                                =     520
+        XML_DTD_NO_DOC                                     =     521
+        XML_DTD_NO_DTD                                     =     522
+        XML_DTD_NO_ELEM_NAME                               =     523
+        XML_DTD_NO_PREFIX                                  =     524
+        XML_DTD_NO_ROOT                                    =     525
+        XML_DTD_NOTATION_REDEFINED                         =     526
+        XML_DTD_NOTATION_VALUE                             =     527
+        XML_DTD_NOT_EMPTY                                  =     528
+        XML_DTD_NOT_PCDATA                                 =     529
+        XML_DTD_NOT_STANDALONE                             =     530
+        XML_DTD_ROOT_NAME                                  =     531
+        XML_DTD_STANDALONE_WHITE_SPACE                     =     532
+        XML_DTD_UNKNOWN_ATTRIBUTE                          =     533
+        XML_DTD_UNKNOWN_ELEM                               =     534
+        XML_DTD_UNKNOWN_ENTITY                             =     535
+        XML_DTD_UNKNOWN_ID                                 =     536
+        XML_DTD_UNKNOWN_NOTATION                           =     537
+        XML_DTD_STANDALONE_DEFAULTED                       =     538
+        XML_DTD_XMLID_VALUE                                =     539
+        XML_DTD_XMLID_TYPE                                 =     540
+        XML_DTD_DUP_TOKEN                                  =     541
+        XML_HTML_STRUCURE_ERROR                            =     800
+        XML_HTML_UNKNOWN_TAG                               =     801
+        XML_RNGP_ANYNAME_ATTR_ANCESTOR                     =    1000
+        XML_RNGP_ATTR_CONFLICT                             =    1001
+        XML_RNGP_ATTRIBUTE_CHILDREN                        =    1002
+        XML_RNGP_ATTRIBUTE_CONTENT                         =    1003
+        XML_RNGP_ATTRIBUTE_EMPTY                           =    1004
+        XML_RNGP_ATTRIBUTE_NOOP                            =    1005
+        XML_RNGP_CHOICE_CONTENT                            =    1006
+        XML_RNGP_CHOICE_EMPTY                              =    1007
+        XML_RNGP_CREATE_FAILURE                            =    1008
+        XML_RNGP_DATA_CONTENT                              =    1009
+        XML_RNGP_DEF_CHOICE_AND_INTERLEAVE                 =    1010
+        XML_RNGP_DEFINE_CREATE_FAILED                      =    1011
+        XML_RNGP_DEFINE_EMPTY                              =    1012
+        XML_RNGP_DEFINE_MISSING                            =    1013
+        XML_RNGP_DEFINE_NAME_MISSING                       =    1014
+        XML_RNGP_ELEM_CONTENT_EMPTY                        =    1015
+        XML_RNGP_ELEM_CONTENT_ERROR                        =    1016
+        XML_RNGP_ELEMENT_EMPTY                             =    1017
+        XML_RNGP_ELEMENT_CONTENT                           =    1018
+        XML_RNGP_ELEMENT_NAME                              =    1019
+        XML_RNGP_ELEMENT_NO_CONTENT                        =    1020
+        XML_RNGP_ELEM_TEXT_CONFLICT                        =    1021
+        XML_RNGP_EMPTY                                     =    1022
+        XML_RNGP_EMPTY_CONSTRUCT                           =    1023
+        XML_RNGP_EMPTY_CONTENT                             =    1024
+        XML_RNGP_EMPTY_NOT_EMPTY                           =    1025
+        XML_RNGP_ERROR_TYPE_LIB                            =    1026
+        XML_RNGP_EXCEPT_EMPTY                              =    1027
+        XML_RNGP_EXCEPT_MISSING                            =    1028
+        XML_RNGP_EXCEPT_MULTIPLE                           =    1029
+        XML_RNGP_EXCEPT_NO_CONTENT                         =    1030
+        XML_RNGP_EXTERNALREF_EMTPY                         =    1031
+        XML_RNGP_EXTERNAL_REF_FAILURE                      =    1032
+        XML_RNGP_EXTERNALREF_RECURSE                       =    1033
+        XML_RNGP_FORBIDDEN_ATTRIBUTE                       =    1034
+        XML_RNGP_FOREIGN_ELEMENT                           =    1035
+        XML_RNGP_GRAMMAR_CONTENT                           =    1036
+        XML_RNGP_GRAMMAR_EMPTY                             =    1037
+        XML_RNGP_GRAMMAR_MISSING                           =    1038
+        XML_RNGP_GRAMMAR_NO_START                          =    1039
+        XML_RNGP_GROUP_ATTR_CONFLICT                       =    1040
+        XML_RNGP_HREF_ERROR                                =    1041
+        XML_RNGP_INCLUDE_EMPTY                             =    1042
+        XML_RNGP_INCLUDE_FAILURE                           =    1043
+        XML_RNGP_INCLUDE_RECURSE                           =    1044
+        XML_RNGP_INTERLEAVE_ADD                            =    1045
+        XML_RNGP_INTERLEAVE_CREATE_FAILED                  =    1046
+        XML_RNGP_INTERLEAVE_EMPTY                          =    1047
+        XML_RNGP_INTERLEAVE_NO_CONTENT                     =    1048
+        XML_RNGP_INVALID_DEFINE_NAME                       =    1049
+        XML_RNGP_INVALID_URI                               =    1050
+        XML_RNGP_INVALID_VALUE                             =    1051
+        XML_RNGP_MISSING_HREF                              =    1052
+        XML_RNGP_NAME_MISSING                              =    1053
+        XML_RNGP_NEED_COMBINE                              =    1054
+        XML_RNGP_NOTALLOWED_NOT_EMPTY                      =    1055
+        XML_RNGP_NSNAME_ATTR_ANCESTOR                      =    1056
+        XML_RNGP_NSNAME_NO_NS                              =    1057
+        XML_RNGP_PARAM_FORBIDDEN                           =    1058
+        XML_RNGP_PARAM_NAME_MISSING                        =    1059
+        XML_RNGP_PARENTREF_CREATE_FAILED                   =    1060
+        XML_RNGP_PARENTREF_NAME_INVALID                    =    1061
+        XML_RNGP_PARENTREF_NO_NAME                         =    1062
+        XML_RNGP_PARENTREF_NO_PARENT                       =    1063
+        XML_RNGP_PARENTREF_NOT_EMPTY                       =    1064
+        XML_RNGP_PARSE_ERROR                               =    1065
+        XML_RNGP_PAT_ANYNAME_EXCEPT_ANYNAME                =    1066
+        XML_RNGP_PAT_ATTR_ATTR                             =    1067
+        XML_RNGP_PAT_ATTR_ELEM                             =    1068
+        XML_RNGP_PAT_DATA_EXCEPT_ATTR                      =    1069
+        XML_RNGP_PAT_DATA_EXCEPT_ELEM                      =    1070
+        XML_RNGP_PAT_DATA_EXCEPT_EMPTY                     =    1071
+        XML_RNGP_PAT_DATA_EXCEPT_GROUP                     =    1072
+        XML_RNGP_PAT_DATA_EXCEPT_INTERLEAVE                =    1073
+        XML_RNGP_PAT_DATA_EXCEPT_LIST                      =    1074
+        XML_RNGP_PAT_DATA_EXCEPT_ONEMORE                   =    1075
+        XML_RNGP_PAT_DATA_EXCEPT_REF                       =    1076
+        XML_RNGP_PAT_DATA_EXCEPT_TEXT                      =    1077
+        XML_RNGP_PAT_LIST_ATTR                             =    1078
+        XML_RNGP_PAT_LIST_ELEM                             =    1079
+        XML_RNGP_PAT_LIST_INTERLEAVE                       =    1080
+        XML_RNGP_PAT_LIST_LIST                             =    1081
+        XML_RNGP_PAT_LIST_REF                              =    1082
+        XML_RNGP_PAT_LIST_TEXT                             =    1083
+        XML_RNGP_PAT_NSNAME_EXCEPT_ANYNAME                 =    1084
+        XML_RNGP_PAT_NSNAME_EXCEPT_NSNAME                  =    1085
+        XML_RNGP_PAT_ONEMORE_GROUP_ATTR                    =    1086
+        XML_RNGP_PAT_ONEMORE_INTERLEAVE_ATTR               =    1087
+        XML_RNGP_PAT_START_ATTR                            =    1088
+        XML_RNGP_PAT_START_DATA                            =    1089
+        XML_RNGP_PAT_START_EMPTY                           =    1090
+        XML_RNGP_PAT_START_GROUP                           =    1091
+        XML_RNGP_PAT_START_INTERLEAVE                      =    1092
+        XML_RNGP_PAT_START_LIST                            =    1093
+        XML_RNGP_PAT_START_ONEMORE                         =    1094
+        XML_RNGP_PAT_START_TEXT                            =    1095
+        XML_RNGP_PAT_START_VALUE                           =    1096
+        XML_RNGP_PREFIX_UNDEFINED                          =    1097
+        XML_RNGP_REF_CREATE_FAILED                         =    1098
+        XML_RNGP_REF_CYCLE                                 =    1099
+        XML_RNGP_REF_NAME_INVALID                          =    1100
+        XML_RNGP_REF_NO_DEF                                =    1101
+        XML_RNGP_REF_NO_NAME                               =    1102
+        XML_RNGP_REF_NOT_EMPTY                             =    1103
+        XML_RNGP_START_CHOICE_AND_INTERLEAVE               =    1104
+        XML_RNGP_START_CONTENT                             =    1105
+        XML_RNGP_START_EMPTY                               =    1106
+        XML_RNGP_START_MISSING                             =    1107
+        XML_RNGP_TEXT_EXPECTED                             =    1108
+        XML_RNGP_TEXT_HAS_CHILD                            =    1109
+        XML_RNGP_TYPE_MISSING                              =    1110
+        XML_RNGP_TYPE_NOT_FOUND                            =    1111
+        XML_RNGP_TYPE_VALUE                                =    1112
+        XML_RNGP_UNKNOWN_ATTRIBUTE                         =    1113
+        XML_RNGP_UNKNOWN_COMBINE                           =    1114
+        XML_RNGP_UNKNOWN_CONSTRUCT                         =    1115
+        XML_RNGP_UNKNOWN_TYPE_LIB                          =    1116
+        XML_RNGP_URI_FRAGMENT                              =    1117
+        XML_RNGP_URI_NOT_ABSOLUTE                          =    1118
+        XML_RNGP_VALUE_EMPTY                               =    1119
+        XML_RNGP_VALUE_NO_CONTENT                          =    1120
+        XML_RNGP_XMLNS_NAME                                =    1121
+        XML_RNGP_XML_NS                                    =    1122
+        XML_XPATH_EXPRESSION_OK                            =    1200
+        XML_XPATH_NUMBER_ERROR                             =    1201
+        XML_XPATH_UNFINISHED_LITERAL_ERROR                 =    1202
+        XML_XPATH_START_LITERAL_ERROR                      =    1203
+        XML_XPATH_VARIABLE_REF_ERROR                       =    1204
+        XML_XPATH_UNDEF_VARIABLE_ERROR                     =    1205
+        XML_XPATH_INVALID_PREDICATE_ERROR                  =    1206
+        XML_XPATH_EXPR_ERROR                               =    1207
+        XML_XPATH_UNCLOSED_ERROR                           =    1208
+        XML_XPATH_UNKNOWN_FUNC_ERROR                       =    1209
+        XML_XPATH_INVALID_OPERAND                          =    1210
+        XML_XPATH_INVALID_TYPE                             =    1211
+        XML_XPATH_INVALID_ARITY                            =    1212
+        XML_XPATH_INVALID_CTXT_SIZE                        =    1213
+        XML_XPATH_INVALID_CTXT_POSITION                    =    1214
+        XML_XPATH_MEMORY_ERROR                             =    1215
+        XML_XPTR_SYNTAX_ERROR                              =    1216
+        XML_XPTR_RESOURCE_ERROR                            =    1217
+        XML_XPTR_SUB_RESOURCE_ERROR                        =    1218
+        XML_XPATH_UNDEF_PREFIX_ERROR                       =    1219
+        XML_XPATH_ENCODING_ERROR                           =    1220
+        XML_XPATH_INVALID_CHAR_ERROR                       =    1221
+        XML_TREE_INVALID_HEX                               =    1300
+        XML_TREE_INVALID_DEC                               =    1301
+        XML_TREE_UNTERMINATED_ENTITY                       =    1302
+        XML_TREE_NOT_UTF8                                  =    1303
+        XML_SAVE_NOT_UTF8                                  =    1400
+        XML_SAVE_CHAR_INVALID                              =    1401
+        XML_SAVE_NO_DOCTYPE                                =    1402
+        XML_SAVE_UNKNOWN_ENCODING                          =    1403
+        XML_REGEXP_COMPILE_ERROR                           =    1450
+        XML_IO_UNKNOWN                                     =    1500
+        XML_IO_EACCES                                      =    1501
+        XML_IO_EAGAIN                                      =    1502
+        XML_IO_EBADF                                       =    1503
+        XML_IO_EBADMSG                                     =    1504
+        XML_IO_EBUSY                                       =    1505
+        XML_IO_ECANCELED                                   =    1506
+        XML_IO_ECHILD                                      =    1507
+        XML_IO_EDEADLK                                     =    1508
+        XML_IO_EDOM                                        =    1509
+        XML_IO_EEXIST                                      =    1510
+        XML_IO_EFAULT                                      =    1511
+        XML_IO_EFBIG                                       =    1512
+        XML_IO_EINPROGRESS                                 =    1513
+        XML_IO_EINTR                                       =    1514
+        XML_IO_EINVAL                                      =    1515
+        XML_IO_EIO                                         =    1516
+        XML_IO_EISDIR                                      =    1517
+        XML_IO_EMFILE                                      =    1518
+        XML_IO_EMLINK                                      =    1519
+        XML_IO_EMSGSIZE                                    =    1520
+        XML_IO_ENAMETOOLONG                                =    1521
+        XML_IO_ENFILE                                      =    1522
+        XML_IO_ENODEV                                      =    1523
+        XML_IO_ENOENT                                      =    1524
+        XML_IO_ENOEXEC                                     =    1525
+        XML_IO_ENOLCK                                      =    1526
+        XML_IO_ENOMEM                                      =    1527
+        XML_IO_ENOSPC                                      =    1528
+        XML_IO_ENOSYS                                      =    1529
+        XML_IO_ENOTDIR                                     =    1530
+        XML_IO_ENOTEMPTY                                   =    1531
+        XML_IO_ENOTSUP                                     =    1532
+        XML_IO_ENOTTY                                      =    1533
+        XML_IO_ENXIO                                       =    1534
+        XML_IO_EPERM                                       =    1535
+        XML_IO_EPIPE                                       =    1536
+        XML_IO_ERANGE                                      =    1537
+        XML_IO_EROFS                                       =    1538
+        XML_IO_ESPIPE                                      =    1539
+        XML_IO_ESRCH                                       =    1540
+        XML_IO_ETIMEDOUT                                   =    1541
+        XML_IO_EXDEV                                       =    1542
+        XML_IO_NETWORK_ATTEMPT                             =    1543
+        XML_IO_ENCODER                                     =    1544
+        XML_IO_FLUSH                                       =    1545
+        XML_IO_WRITE                                       =    1546
+        XML_IO_NO_INPUT                                    =    1547
+        XML_IO_BUFFER_FULL                                 =    1548
+        XML_IO_LOAD_ERROR                                  =    1549
+        XML_IO_ENOTSOCK                                    =    1550
+        XML_IO_EISCONN                                     =    1551
+        XML_IO_ECONNREFUSED                                =    1552
+        XML_IO_ENETUNREACH                                 =    1553
+        XML_IO_EADDRINUSE                                  =    1554
+        XML_IO_EALREADY                                    =    1555
+        XML_IO_EAFNOSUPPORT                                =    1556
+        XML_XINCLUDE_RECURSION                             =    1600
+        XML_XINCLUDE_PARSE_VALUE                           =    1601
+        XML_XINCLUDE_ENTITY_DEF_MISMATCH                   =    1602
+        XML_XINCLUDE_NO_HREF                               =    1603
+        XML_XINCLUDE_NO_FALLBACK                           =    1604
+        XML_XINCLUDE_HREF_URI                              =    1605
+        XML_XINCLUDE_TEXT_FRAGMENT                         =    1606
+        XML_XINCLUDE_TEXT_DOCUMENT                         =    1607
+        XML_XINCLUDE_INVALID_CHAR                          =    1608
+        XML_XINCLUDE_BUILD_FAILED                          =    1609
+        XML_XINCLUDE_UNKNOWN_ENCODING                      =    1610
+        XML_XINCLUDE_MULTIPLE_ROOT                         =    1611
+        XML_XINCLUDE_XPTR_FAILED                           =    1612
+        XML_XINCLUDE_XPTR_RESULT                           =    1613
+        XML_XINCLUDE_INCLUDE_IN_INCLUDE                    =    1614
+        XML_XINCLUDE_FALLBACKS_IN_INCLUDE                  =    1615
+        XML_XINCLUDE_FALLBACK_NOT_IN_INCLUDE               =    1616
+        XML_XINCLUDE_DEPRECATED_NS                         =    1617
+        XML_XINCLUDE_FRAGMENT_ID                           =    1618
+        XML_CATALOG_MISSING_ATTR                           =    1650
+        XML_CATALOG_ENTRY_BROKEN                           =    1651
+        XML_CATALOG_PREFER_VALUE                           =    1652
+        XML_CATALOG_NOT_CATALOG                            =    1653
+        XML_CATALOG_RECURSION                              =    1654
+        XML_SCHEMAP_PREFIX_UNDEFINED                       =    1700
+        XML_SCHEMAP_ATTRFORMDEFAULT_VALUE                  =    1701
+        XML_SCHEMAP_ATTRGRP_NONAME_NOREF                   =    1702
+        XML_SCHEMAP_ATTR_NONAME_NOREF                      =    1703
+        XML_SCHEMAP_COMPLEXTYPE_NONAME_NOREF               =    1704
+        XML_SCHEMAP_ELEMFORMDEFAULT_VALUE                  =    1705
+        XML_SCHEMAP_ELEM_NONAME_NOREF                      =    1706
+        XML_SCHEMAP_EXTENSION_NO_BASE                      =    1707
+        XML_SCHEMAP_FACET_NO_VALUE                         =    1708
+        XML_SCHEMAP_FAILED_BUILD_IMPORT                    =    1709
+        XML_SCHEMAP_GROUP_NONAME_NOREF                     =    1710
+        XML_SCHEMAP_IMPORT_NAMESPACE_NOT_URI               =    1711
+        XML_SCHEMAP_IMPORT_REDEFINE_NSNAME                 =    1712
+        XML_SCHEMAP_IMPORT_SCHEMA_NOT_URI                  =    1713
+        XML_SCHEMAP_INVALID_BOOLEAN                        =    1714
+        XML_SCHEMAP_INVALID_ENUM                           =    1715
+        XML_SCHEMAP_INVALID_FACET                          =    1716
+        XML_SCHEMAP_INVALID_FACET_VALUE                    =    1717
+        XML_SCHEMAP_INVALID_MAXOCCURS                      =    1718
+        XML_SCHEMAP_INVALID_MINOCCURS                      =    1719
+        XML_SCHEMAP_INVALID_REF_AND_SUBTYPE                =    1720
+        XML_SCHEMAP_INVALID_WHITE_SPACE                    =    1721
+        XML_SCHEMAP_NOATTR_NOREF                           =    1722
+        XML_SCHEMAP_NOTATION_NO_NAME                       =    1723
+        XML_SCHEMAP_NOTYPE_NOREF                           =    1724
+        XML_SCHEMAP_REF_AND_SUBTYPE                        =    1725
+        XML_SCHEMAP_RESTRICTION_NONAME_NOREF               =    1726
+        XML_SCHEMAP_SIMPLETYPE_NONAME                      =    1727
+        XML_SCHEMAP_TYPE_AND_SUBTYPE                       =    1728
+        XML_SCHEMAP_UNKNOWN_ALL_CHILD                      =    1729
+        XML_SCHEMAP_UNKNOWN_ANYATTRIBUTE_CHILD             =    1730
+        XML_SCHEMAP_UNKNOWN_ATTR_CHILD                     =    1731
+        XML_SCHEMAP_UNKNOWN_ATTRGRP_CHILD                  =    1732
+        XML_SCHEMAP_UNKNOWN_ATTRIBUTE_GROUP                =    1733
+        XML_SCHEMAP_UNKNOWN_BASE_TYPE                      =    1734
+        XML_SCHEMAP_UNKNOWN_CHOICE_CHILD                   =    1735
+        XML_SCHEMAP_UNKNOWN_COMPLEXCONTENT_CHILD           =    1736
+        XML_SCHEMAP_UNKNOWN_COMPLEXTYPE_CHILD              =    1737
+        XML_SCHEMAP_UNKNOWN_ELEM_CHILD                     =    1738
+        XML_SCHEMAP_UNKNOWN_EXTENSION_CHILD                =    1739
+        XML_SCHEMAP_UNKNOWN_FACET_CHILD                    =    1740
+        XML_SCHEMAP_UNKNOWN_FACET_TYPE                     =    1741
+        XML_SCHEMAP_UNKNOWN_GROUP_CHILD                    =    1742
+        XML_SCHEMAP_UNKNOWN_IMPORT_CHILD                   =    1743
+        XML_SCHEMAP_UNKNOWN_LIST_CHILD                     =    1744
+        XML_SCHEMAP_UNKNOWN_NOTATION_CHILD                 =    1745
+        XML_SCHEMAP_UNKNOWN_PROCESSCONTENT_CHILD           =    1746
+        XML_SCHEMAP_UNKNOWN_REF                            =    1747
+        XML_SCHEMAP_UNKNOWN_RESTRICTION_CHILD              =    1748
+        XML_SCHEMAP_UNKNOWN_SCHEMAS_CHILD                  =    1749
+        XML_SCHEMAP_UNKNOWN_SEQUENCE_CHILD                 =    1750
+        XML_SCHEMAP_UNKNOWN_SIMPLECONTENT_CHILD            =    1751
+        XML_SCHEMAP_UNKNOWN_SIMPLETYPE_CHILD               =    1752
+        XML_SCHEMAP_UNKNOWN_TYPE                           =    1753
+        XML_SCHEMAP_UNKNOWN_UNION_CHILD                    =    1754
+        XML_SCHEMAP_ELEM_DEFAULT_FIXED                     =    1755
+        XML_SCHEMAP_REGEXP_INVALID                         =    1756
+        XML_SCHEMAP_FAILED_LOAD                            =    1757
+        XML_SCHEMAP_NOTHING_TO_PARSE                       =    1758
+        XML_SCHEMAP_NOROOT                                 =    1759
+        XML_SCHEMAP_REDEFINED_GROUP                        =    1760
+        XML_SCHEMAP_REDEFINED_TYPE                         =    1761
+        XML_SCHEMAP_REDEFINED_ELEMENT                      =    1762
+        XML_SCHEMAP_REDEFINED_ATTRGROUP                    =    1763
+        XML_SCHEMAP_REDEFINED_ATTR                         =    1764
+        XML_SCHEMAP_REDEFINED_NOTATION                     =    1765
+        XML_SCHEMAP_FAILED_PARSE                           =    1766
+        XML_SCHEMAP_UNKNOWN_PREFIX                         =    1767
+        XML_SCHEMAP_DEF_AND_PREFIX                         =    1768
+        XML_SCHEMAP_UNKNOWN_INCLUDE_CHILD                  =    1769
+        XML_SCHEMAP_INCLUDE_SCHEMA_NOT_URI                 =    1770
+        XML_SCHEMAP_INCLUDE_SCHEMA_NO_URI                  =    1771
+        XML_SCHEMAP_NOT_SCHEMA                             =    1772
+        XML_SCHEMAP_UNKNOWN_MEMBER_TYPE                    =    1773
+        XML_SCHEMAP_INVALID_ATTR_USE                       =    1774
+        XML_SCHEMAP_RECURSIVE                              =    1775
+        XML_SCHEMAP_SUPERNUMEROUS_LIST_ITEM_TYPE           =    1776
+        XML_SCHEMAP_INVALID_ATTR_COMBINATION               =    1777
+        XML_SCHEMAP_INVALID_ATTR_INLINE_COMBINATION        =    1778
+        XML_SCHEMAP_MISSING_SIMPLETYPE_CHILD               =    1779
+        XML_SCHEMAP_INVALID_ATTR_NAME                      =    1780
+        XML_SCHEMAP_REF_AND_CONTENT                        =    1781
+        XML_SCHEMAP_CT_PROPS_CORRECT_1                     =    1782
+        XML_SCHEMAP_CT_PROPS_CORRECT_2                     =    1783
+        XML_SCHEMAP_CT_PROPS_CORRECT_3                     =    1784
+        XML_SCHEMAP_CT_PROPS_CORRECT_4                     =    1785
+        XML_SCHEMAP_CT_PROPS_CORRECT_5                     =    1786
+        XML_SCHEMAP_DERIVATION_OK_RESTRICTION_1            =    1787
+        XML_SCHEMAP_DERIVATION_OK_RESTRICTION_2_1_1        =    1788
+        XML_SCHEMAP_DERIVATION_OK_RESTRICTION_2_1_2        =    1789
+        XML_SCHEMAP_DERIVATION_OK_RESTRICTION_2_2          =    1790
+        XML_SCHEMAP_DERIVATION_OK_RESTRICTION_3            =    1791
+        XML_SCHEMAP_WILDCARD_INVALID_NS_MEMBER             =    1792
+        XML_SCHEMAP_INTERSECTION_NOT_EXPRESSIBLE           =    1793
+        XML_SCHEMAP_UNION_NOT_EXPRESSIBLE                  =    1794
+        XML_SCHEMAP_SRC_IMPORT_3_1                         =    1795
+        XML_SCHEMAP_SRC_IMPORT_3_2                         =    1796
+        XML_SCHEMAP_DERIVATION_OK_RESTRICTION_4_1          =    1797
+        XML_SCHEMAP_DERIVATION_OK_RESTRICTION_4_2          =    1798
+        XML_SCHEMAP_DERIVATION_OK_RESTRICTION_4_3          =    1799
+        XML_SCHEMAP_COS_CT_EXTENDS_1_3                     =    1800
+        XML_SCHEMAV_NOROOT                                 =    1801
+        XML_SCHEMAV_UNDECLAREDELEM                         =    1802
+        XML_SCHEMAV_NOTTOPLEVEL                            =    1803
+        XML_SCHEMAV_MISSING                                =    1804
+        XML_SCHEMAV_WRONGELEM                              =    1805
+        XML_SCHEMAV_NOTYPE                                 =    1806
+        XML_SCHEMAV_NOROLLBACK                             =    1807
+        XML_SCHEMAV_ISABSTRACT                             =    1808
+        XML_SCHEMAV_NOTEMPTY                               =    1809
+        XML_SCHEMAV_ELEMCONT                               =    1810
+        XML_SCHEMAV_HAVEDEFAULT                            =    1811
+        XML_SCHEMAV_NOTNILLABLE                            =    1812
+        XML_SCHEMAV_EXTRACONTENT                           =    1813
+        XML_SCHEMAV_INVALIDATTR                            =    1814
+        XML_SCHEMAV_INVALIDELEM                            =    1815
+        XML_SCHEMAV_NOTDETERMINIST                         =    1816
+        XML_SCHEMAV_CONSTRUCT                              =    1817
+        XML_SCHEMAV_INTERNAL                               =    1818
+        XML_SCHEMAV_NOTSIMPLE                              =    1819
+        XML_SCHEMAV_ATTRUNKNOWN                            =    1820
+        XML_SCHEMAV_ATTRINVALID                            =    1821
+        XML_SCHEMAV_VALUE                                  =    1822
+        XML_SCHEMAV_FACET                                  =    1823
+        XML_SCHEMAV_CVC_DATATYPE_VALID_1_2_1               =    1824
+        XML_SCHEMAV_CVC_DATATYPE_VALID_1_2_2               =    1825
+        XML_SCHEMAV_CVC_DATATYPE_VALID_1_2_3               =    1826
+        XML_SCHEMAV_CVC_TYPE_3_1_1                         =    1827
+        XML_SCHEMAV_CVC_TYPE_3_1_2                         =    1828
+        XML_SCHEMAV_CVC_FACET_VALID                        =    1829
+        XML_SCHEMAV_CVC_LENGTH_VALID                       =    1830
+        XML_SCHEMAV_CVC_MINLENGTH_VALID                    =    1831
+        XML_SCHEMAV_CVC_MAXLENGTH_VALID                    =    1832
+        XML_SCHEMAV_CVC_MININCLUSIVE_VALID                 =    1833
+        XML_SCHEMAV_CVC_MAXINCLUSIVE_VALID                 =    1834
+        XML_SCHEMAV_CVC_MINEXCLUSIVE_VALID                 =    1835
+        XML_SCHEMAV_CVC_MAXEXCLUSIVE_VALID                 =    1836
+        XML_SCHEMAV_CVC_TOTALDIGITS_VALID                  =    1837
+        XML_SCHEMAV_CVC_FRACTIONDIGITS_VALID               =    1838
+        XML_SCHEMAV_CVC_PATTERN_VALID                      =    1839
+        XML_SCHEMAV_CVC_ENUMERATION_VALID                  =    1840
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_2_1                   =    1841
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_2_2                   =    1842
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_2_3                   =    1843
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_2_4                   =    1844
+        XML_SCHEMAV_CVC_ELT_1                              =    1845
+        XML_SCHEMAV_CVC_ELT_2                              =    1846
+        XML_SCHEMAV_CVC_ELT_3_1                            =    1847
+        XML_SCHEMAV_CVC_ELT_3_2_1                          =    1848
+        XML_SCHEMAV_CVC_ELT_3_2_2                          =    1849
+        XML_SCHEMAV_CVC_ELT_4_1                            =    1850
+        XML_SCHEMAV_CVC_ELT_4_2                            =    1851
+        XML_SCHEMAV_CVC_ELT_4_3                            =    1852
+        XML_SCHEMAV_CVC_ELT_5_1_1                          =    1853
+        XML_SCHEMAV_CVC_ELT_5_1_2                          =    1854
+        XML_SCHEMAV_CVC_ELT_5_2_1                          =    1855
+        XML_SCHEMAV_CVC_ELT_5_2_2_1                        =    1856
+        XML_SCHEMAV_CVC_ELT_5_2_2_2_1                      =    1857
+        XML_SCHEMAV_CVC_ELT_5_2_2_2_2                      =    1858
+        XML_SCHEMAV_CVC_ELT_6                              =    1859
+        XML_SCHEMAV_CVC_ELT_7                              =    1860
+        XML_SCHEMAV_CVC_ATTRIBUTE_1                        =    1861
+        XML_SCHEMAV_CVC_ATTRIBUTE_2                        =    1862
+        XML_SCHEMAV_CVC_ATTRIBUTE_3                        =    1863
+        XML_SCHEMAV_CVC_ATTRIBUTE_4                        =    1864
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_3_1                   =    1865
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_3_2_1                 =    1866
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_3_2_2                 =    1867
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_4                     =    1868
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_5_1                   =    1869
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_5_2                   =    1870
+        XML_SCHEMAV_ELEMENT_CONTENT                        =    1871
+        XML_SCHEMAV_DOCUMENT_ELEMENT_MISSING               =    1872
+        XML_SCHEMAV_CVC_COMPLEX_TYPE_1                     =    1873
+        XML_SCHEMAV_CVC_AU                                 =    1874
+        XML_SCHEMAV_CVC_TYPE_1                             =    1875
+        XML_SCHEMAV_CVC_TYPE_2                             =    1876
+        XML_SCHEMAV_CVC_IDC                                =    1877
+        XML_SCHEMAV_CVC_WILDCARD                           =    1878
+        XML_SCHEMAV_MISC                                   =    1879
+        XML_XPTR_UNKNOWN_SCHEME                            =    1900
+        XML_XPTR_CHILDSEQ_START                            =    1901
+        XML_XPTR_EVAL_FAILED                               =    1902
+        XML_XPTR_EXTRA_OBJECTS                             =    1903
+        XML_C14N_CREATE_CTXT                               =    1950
+        XML_C14N_REQUIRES_UTF8                             =    1951
+        XML_C14N_CREATE_STACK                              =    1952
+        XML_C14N_INVALID_NODE                              =    1953
+        XML_C14N_UNKNOW_NODE                               =    1954
+        XML_C14N_RELATIVE_NAMESPACE                        =    1955
+        XML_FTP_PASV_ANSWER                                =    2000
+        XML_FTP_EPSV_ANSWER                                =    2001
+        XML_FTP_ACCNT                                      =    2002
+        XML_FTP_URL_SYNTAX                                 =    2003
+        XML_HTTP_URL_SYNTAX                                =    2020
+        XML_HTTP_USE_IP                                    =    2021
+        XML_HTTP_UNKNOWN_HOST                              =    2022
+        XML_SCHEMAP_SRC_SIMPLE_TYPE_1                      =    3000
+        XML_SCHEMAP_SRC_SIMPLE_TYPE_2                      =    3001
+        XML_SCHEMAP_SRC_SIMPLE_TYPE_3                      =    3002
+        XML_SCHEMAP_SRC_SIMPLE_TYPE_4                      =    3003
+        XML_SCHEMAP_SRC_RESOLVE                            =    3004
+        XML_SCHEMAP_SRC_RESTRICTION_BASE_OR_SIMPLETYPE     =    3005
+        XML_SCHEMAP_SRC_LIST_ITEMTYPE_OR_SIMPLETYPE        =    3006
+        XML_SCHEMAP_SRC_UNION_MEMBERTYPES_OR_SIMPLETYPES   =    3007
+        XML_SCHEMAP_ST_PROPS_CORRECT_1                     =    3008
+        XML_SCHEMAP_ST_PROPS_CORRECT_2                     =    3009
+        XML_SCHEMAP_ST_PROPS_CORRECT_3                     =    3010
+        XML_SCHEMAP_COS_ST_RESTRICTS_1_1                   =    3011
+        XML_SCHEMAP_COS_ST_RESTRICTS_1_2                   =    3012
+        XML_SCHEMAP_COS_ST_RESTRICTS_1_3_1                 =    3013
+        XML_SCHEMAP_COS_ST_RESTRICTS_1_3_2                 =    3014
+        XML_SCHEMAP_COS_ST_RESTRICTS_2_1                   =    3015
+        XML_SCHEMAP_COS_ST_RESTRICTS_2_3_1_1               =    3016
+        XML_SCHEMAP_COS_ST_RESTRICTS_2_3_1_2               =    3017
+        XML_SCHEMAP_COS_ST_RESTRICTS_2_3_2_1               =    3018
+        XML_SCHEMAP_COS_ST_RESTRICTS_2_3_2_2               =    3019
+        XML_SCHEMAP_COS_ST_RESTRICTS_2_3_2_3               =    3020
+        XML_SCHEMAP_COS_ST_RESTRICTS_2_3_2_4               =    3021
+        XML_SCHEMAP_COS_ST_RESTRICTS_2_3_2_5               =    3022
+        XML_SCHEMAP_COS_ST_RESTRICTS_3_1                   =    3023
+        XML_SCHEMAP_COS_ST_RESTRICTS_3_3_1                 =    3024
+        XML_SCHEMAP_COS_ST_RESTRICTS_3_3_1_2               =    3025
+        XML_SCHEMAP_COS_ST_RESTRICTS_3_3_2_2               =    3026
+        XML_SCHEMAP_COS_ST_RESTRICTS_3_3_2_1               =    3027
+        XML_SCHEMAP_COS_ST_RESTRICTS_3_3_2_3               =    3028
+        XML_SCHEMAP_COS_ST_RESTRICTS_3_3_2_4               =    3029
+        XML_SCHEMAP_COS_ST_RESTRICTS_3_3_2_5               =    3030
+        XML_SCHEMAP_COS_ST_DERIVED_OK_2_1                  =    3031
+        XML_SCHEMAP_COS_ST_DERIVED_OK_2_2                  =    3032
+        XML_SCHEMAP_S4S_ELEM_NOT_ALLOWED                   =    3033
+        XML_SCHEMAP_S4S_ELEM_MISSING                       =    3034
+        XML_SCHEMAP_S4S_ATTR_NOT_ALLOWED                   =    3035
+        XML_SCHEMAP_S4S_ATTR_MISSING                       =    3036
+        XML_SCHEMAP_S4S_ATTR_INVALID_VALUE                 =    3037
+        XML_SCHEMAP_SRC_ELEMENT_1                          =    3038
+        XML_SCHEMAP_SRC_ELEMENT_2_1                        =    3039
+        XML_SCHEMAP_SRC_ELEMENT_2_2                        =    3040
+        XML_SCHEMAP_SRC_ELEMENT_3                          =    3041
+        XML_SCHEMAP_P_PROPS_CORRECT_1                      =    3042
+        XML_SCHEMAP_P_PROPS_CORRECT_2_1                    =    3043
+        XML_SCHEMAP_P_PROPS_CORRECT_2_2                    =    3044
+        XML_SCHEMAP_E_PROPS_CORRECT_2                      =    3045
+        XML_SCHEMAP_E_PROPS_CORRECT_3                      =    3046
+        XML_SCHEMAP_E_PROPS_CORRECT_4                      =    3047
+        XML_SCHEMAP_E_PROPS_CORRECT_5                      =    3048
+        XML_SCHEMAP_E_PROPS_CORRECT_6                      =    3049
+        XML_SCHEMAP_SRC_INCLUDE                            =    3050
+        XML_SCHEMAP_SRC_ATTRIBUTE_1                        =    3051
+        XML_SCHEMAP_SRC_ATTRIBUTE_2                        =    3052
+        XML_SCHEMAP_SRC_ATTRIBUTE_3_1                      =    3053
+        XML_SCHEMAP_SRC_ATTRIBUTE_3_2                      =    3054
+        XML_SCHEMAP_SRC_ATTRIBUTE_4                        =    3055
+        XML_SCHEMAP_NO_XMLNS                               =    3056
+        XML_SCHEMAP_NO_XSI                                 =    3057
+        XML_SCHEMAP_COS_VALID_DEFAULT_1                    =    3058
+        XML_SCHEMAP_COS_VALID_DEFAULT_2_1                  =    3059
+        XML_SCHEMAP_COS_VALID_DEFAULT_2_2_1                =    3060
+        XML_SCHEMAP_COS_VALID_DEFAULT_2_2_2                =    3061
+        XML_SCHEMAP_CVC_SIMPLE_TYPE                        =    3062
+        XML_SCHEMAP_COS_CT_EXTENDS_1_1                     =    3063
+        XML_SCHEMAP_SRC_IMPORT_1_1                         =    3064
+        XML_SCHEMAP_SRC_IMPORT_1_2                         =    3065
+        XML_SCHEMAP_SRC_IMPORT_2                           =    3066
+        XML_SCHEMAP_SRC_IMPORT_2_1                         =    3067
+        XML_SCHEMAP_SRC_IMPORT_2_2                         =    3068
+        XML_SCHEMAP_INTERNAL                               =    3069 # 3069 non-W3C
+        XML_SCHEMAP_NOT_DETERMINISTIC                      =    3070 # 3070 non-W3C
+        XML_SCHEMAP_SRC_ATTRIBUTE_GROUP_1                  =    3071
+        XML_SCHEMAP_SRC_ATTRIBUTE_GROUP_2                  =    3072
+        XML_SCHEMAP_SRC_ATTRIBUTE_GROUP_3                  =    3073
+        XML_SCHEMAP_MG_PROPS_CORRECT_1                     =    3074
+        XML_SCHEMAP_MG_PROPS_CORRECT_2                     =    3075
+        XML_SCHEMAP_SRC_CT_1                               =    3076
+        XML_SCHEMAP_DERIVATION_OK_RESTRICTION_2_1_3        =    3077
+        XML_SCHEMAP_AU_PROPS_CORRECT_2                     =    3078
+        XML_SCHEMAP_A_PROPS_CORRECT_2                      =    3079
+        XML_SCHEMAP_C_PROPS_CORRECT                        =    3080
+        XML_SCHEMAP_SRC_REDEFINE                           =    3081
+        XML_SCHEMAP_SRC_IMPORT                             =    3082
+        XML_SCHEMAP_WARN_SKIP_SCHEMA                       =    3083
+        XML_SCHEMAP_WARN_UNLOCATED_SCHEMA                  =    3084
+        XML_SCHEMAP_WARN_ATTR_REDECL_PROH                  =    3085
+        XML_SCHEMAP_WARN_ATTR_POINTLESS_PROH               =    3086 # 3085
+        XML_SCHEMAP_AG_PROPS_CORRECT                       =    3087 # 3086
+        XML_SCHEMAP_COS_CT_EXTENDS_1_2                     =    3088 # 3087
+        XML_SCHEMAP_AU_PROPS_CORRECT                       =    3089 # 3088
+        XML_SCHEMAP_A_PROPS_CORRECT_3                      =    3090 # 3089
+        XML_SCHEMAP_COS_ALL_LIMITED                        =    3091 # 3090
+        XML_SCHEMATRONV_ASSERT                             =    4000
+        XML_SCHEMATRONV_REPORT                             =    4001
+        XML_MODULE_OPEN                                    =    4900
+        XML_MODULE_CLOSE                                   =    4901
+        XML_CHECK_FOUND_ELEMENT                            =    5000
+        XML_CHECK_FOUND_ATTRIBUTE                          =    5001
+        XML_CHECK_FOUND_TEXT                               =    5002
+        XML_CHECK_FOUND_CDATA                              =    5003
+        XML_CHECK_FOUND_ENTITYREF                          =    5004
+        XML_CHECK_FOUND_ENTITY                             =    5005
+        XML_CHECK_FOUND_PI                                 =    5006
+        XML_CHECK_FOUND_COMMENT                            =    5007
+        XML_CHECK_FOUND_DOCTYPE                            =    5008
+        XML_CHECK_FOUND_FRAGMENT                           =    5009
+        XML_CHECK_FOUND_NOTATION                           =    5010
+        XML_CHECK_UNKNOWN_NODE                             =    5011
+        XML_CHECK_ENTITY_TYPE                              =    5012
+        XML_CHECK_NO_PARENT                                =    5013
+        XML_CHECK_NO_DOC                                   =    5014
+        XML_CHECK_NO_NAME                                  =    5015
+        XML_CHECK_NO_ELEM                                  =    5016
+        XML_CHECK_WRONG_DOC                                =    5017
+        XML_CHECK_NO_PREV                                  =    5018
+        XML_CHECK_WRONG_PREV                               =    5019
+        XML_CHECK_NO_NEXT                                  =    5020
+        XML_CHECK_WRONG_NEXT                               =    5021
+        XML_CHECK_NOT_DTD                                  =    5022
+        XML_CHECK_NOT_ATTR                                 =    5023
+        XML_CHECK_NOT_ATTR_DECL                            =    5024
+        XML_CHECK_NOT_ELEM_DECL                            =    5025
+        XML_CHECK_NOT_ENTITY_DECL                          =    5026
+        XML_CHECK_NOT_NS_DECL                              =    5027
+        XML_CHECK_NO_HREF                                  =    5028
+        XML_CHECK_WRONG_PARENT                             =    5029
+        XML_CHECK_NS_SCOPE                                 =    5030
+        XML_CHECK_NS_ANCESTOR                              =    5031
+        XML_CHECK_NOT_UTF8                                 =    5032
+        XML_CHECK_NO_DICT                                  =    5033
+        XML_CHECK_NOT_NCNAME                               =    5034
+        XML_CHECK_OUTSIDE_DICT                             =    5035
+        XML_CHECK_WRONG_NAME                               =    5036
+        XML_CHECK_NAME_NOT_NULL                            =    5037
+        XML_I18N_NO_NAME                                   =    6000
+        XML_I18N_NO_HANDLER                                =    6001
+        XML_I18N_EXCESS_HANDLER                            =    6002
+        XML_I18N_CONV_FAILED                               =    6003
+        XML_I18N_NO_OUTPUT                                 =    6004
+        XML_BUF_OVERFLOW                                   =    7000
+
+    ctypedef enum xmlRelaxNGValidErr:  # explicit values 0 (XML_RELAXNG_OK) through 39; part of the generated constants section
+        XML_RELAXNG_OK                                     =       0
+        XML_RELAXNG_ERR_MEMORY                             =       1
+        XML_RELAXNG_ERR_TYPE                               =       2
+        XML_RELAXNG_ERR_TYPEVAL                            =       3
+        XML_RELAXNG_ERR_DUPID                              =       4
+        XML_RELAXNG_ERR_TYPECMP                            =       5
+        XML_RELAXNG_ERR_NOSTATE                            =       6
+        XML_RELAXNG_ERR_NODEFINE                           =       7
+        XML_RELAXNG_ERR_LISTEXTRA                          =       8
+        XML_RELAXNG_ERR_LISTEMPTY                          =       9
+        XML_RELAXNG_ERR_INTERNODATA                        =      10
+        XML_RELAXNG_ERR_INTERSEQ                           =      11
+        XML_RELAXNG_ERR_INTEREXTRA                         =      12
+        XML_RELAXNG_ERR_ELEMNAME                           =      13
+        XML_RELAXNG_ERR_ATTRNAME                           =      14
+        XML_RELAXNG_ERR_ELEMNONS                           =      15
+        XML_RELAXNG_ERR_ATTRNONS                           =      16
+        XML_RELAXNG_ERR_ELEMWRONGNS                        =      17
+        XML_RELAXNG_ERR_ATTRWRONGNS                        =      18
+        XML_RELAXNG_ERR_ELEMEXTRANS                        =      19
+        XML_RELAXNG_ERR_ATTREXTRANS                        =      20
+        XML_RELAXNG_ERR_ELEMNOTEMPTY                       =      21
+        XML_RELAXNG_ERR_NOELEM                             =      22
+        XML_RELAXNG_ERR_NOTELEM                            =      23
+        XML_RELAXNG_ERR_ATTRVALID                          =      24
+        XML_RELAXNG_ERR_CONTENTVALID                       =      25
+        XML_RELAXNG_ERR_EXTRACONTENT                       =      26
+        XML_RELAXNG_ERR_INVALIDATTR                        =      27
+        XML_RELAXNG_ERR_DATAELEM                           =      28
+        XML_RELAXNG_ERR_VALELEM                            =      29
+        XML_RELAXNG_ERR_LISTELEM                           =      30
+        XML_RELAXNG_ERR_DATATYPE                           =      31
+        XML_RELAXNG_ERR_VALUE                              =      32
+        XML_RELAXNG_ERR_LIST                               =      33
+        XML_RELAXNG_ERR_NOGRAMMAR                          =      34
+        XML_RELAXNG_ERR_EXTRADATA                          =      35
+        XML_RELAXNG_ERR_LACKDATA                           =      36
+        XML_RELAXNG_ERR_INTERNAL                           =      37
+        XML_RELAXNG_ERR_ELEMWRONG                          =      38
+        XML_RELAXNG_ERR_TEXTWRONG                          =      39
+# --- END: GENERATED CONSTANTS ---
+
+cdef extern from "libxml/xmlerror.h":  # error record struct, error callback types and their setters
+    ctypedef struct xmlError:  # fields of the C error record made visible to Cython code
+        int domain  # declared as plain int here, not as an enum type
+        int code  # declared as plain int here, not as an enum type
+        char* message
+        xmlErrorLevel level
+        char* file
+        char* str1
+        char* str2
+        char* str3
+        int line
+        int int1
+        int int2
+
+    ctypedef void (*xmlGenericErrorFunc)(void* ctxt, char* msg, ...) nogil  # varargs callback: context pointer plus message
+    ctypedef void (*xmlStructuredErrorFunc)(void* userData,
+                                            xmlError* error) nogil  # callback receiving a user pointer and an xmlError*
+
+    cdef void xmlSetGenericErrorFunc(
+        void* ctxt, xmlGenericErrorFunc func) nogil  # takes a context pointer and a generic callback
+    cdef void xmlSetStructuredErrorFunc(
+        void* ctxt, xmlStructuredErrorFunc func) nogil  # takes a context pointer and a structured callback
+
+cdef extern from "libxml/globals.h":  # C variables (not functions) declared for access from Cython
+    cdef xmlStructuredErrorFunc xmlStructuredError  # variable of the structured error callback type
+    cdef void* xmlStructuredErrorContext  # presumably the pointer handed to that callback — TODO confirm
diff --git a/lib/lxml/includes/xmlparser.pxd b/lib/lxml/includes/xmlparser.pxd
new file mode 100644
index 00000000..9b0ded41
--- /dev/null
+++ b/lib/lxml/includes/xmlparser.pxd
@@ -0,0 +1,218 @@
+from libc.string cimport const_char
+
+from lxml.includes.tree cimport xmlDoc, xmlNode, xmlDict, xmlDtd, const_xmlChar
+from lxml.includes.tree cimport xmlInputReadCallback, xmlInputCloseCallback
+from lxml.includes.xmlerror cimport xmlError, xmlStructuredErrorFunc
+
+
+cdef extern from "libxml/parser.h":  # SAX callback function-pointer types; every callback takes a void* ctx first
+    ctypedef void (*startElementNsSAX2Func)(void* ctx,  # element start with localname/prefix/URI split out
+                                            const_xmlChar* localname,
+                                            const_xmlChar* prefix,
+                                            const_xmlChar* URI,
+                                            int nb_namespaces,
+                                            const_xmlChar** namespaces,
+                                            int nb_attributes,
+                                            int nb_defaulted,
+                                            const_xmlChar** attributes)
+
+    ctypedef void (*endElementNsSAX2Func)(void* ctx,  # element end with localname/prefix/URI split out
+                                          const_xmlChar* localname,
+                                          const_xmlChar* prefix,
+                                          const_xmlChar* URI)
+
+    ctypedef void (*startElementSAXFunc)(void* ctx, const_xmlChar* name, const_xmlChar** atts)  # element start, single name
+
+    ctypedef void (*endElementSAXFunc)(void* ctx, const_xmlChar* name)  # element end, single name
+
+    ctypedef void (*charactersSAXFunc)(void* ctx, const_xmlChar* ch, int len)  # text passed as pointer plus length
+
+    ctypedef void (*cdataBlockSAXFunc)(void* ctx, const_xmlChar* value, int len)  # CDATA passed as pointer plus length
+
+    ctypedef void (*commentSAXFunc)(void* ctx, const_xmlChar* value)  # comment content
+
+    ctypedef void (*processingInstructionSAXFunc)(void* ctx,  # processing instruction: target and data
+                                                  const_xmlChar* target,
+                                                  const_xmlChar* data)
+
+    ctypedef void (*internalSubsetSAXFunc)(void* ctx,  # internal subset: name, external ID, system ID
+                                            const_xmlChar* name,
+                                            const_xmlChar* externalID,
+                                            const_xmlChar* systemID)
+
+    ctypedef void (*endDocumentSAXFunc)(void* ctx)  # document end, no extra arguments
+
+    ctypedef void (*startDocumentSAXFunc)(void* ctx)  # document start, no extra arguments
+
+    ctypedef void (*referenceSAXFunc)(void * ctx, const_xmlChar* name)  # reference identified by name
+
+    cdef int XML_SAX2_MAGIC  # integer constant; presumably the marker stored in xmlSAXHandler.initialized — TODO confirm
+
+cdef extern from "libxml/tree.h":  # parser input and SAX handler structs, declared via tree.h in this file
+    ctypedef struct xmlParserInput:  # line counter, length and three pointers (base/cur/end) into the input
+        int line
+        int length
+        const_xmlChar* base
+        const_xmlChar* cur
+        const_xmlChar* end
+
+    ctypedef struct xmlParserInputBuffer:  # opaque context pointer plus read/close callbacks
+        void* context
+        xmlInputReadCallback  readcallback
+        xmlInputCloseCallback closecallback
+
+    ctypedef struct xmlSAXHandlerV1:
+        # same as xmlSAXHandler, but without namespaces
+        pass
+
+    ctypedef struct xmlSAXHandler:  # one slot per SAX callback type declared in this file, plus bookkeeping fields
+        internalSubsetSAXFunc           internalSubset
+        startElementNsSAX2Func          startElementNs
+        endElementNsSAX2Func            endElementNs
+        startElementSAXFunc             startElement
+        endElementSAXFunc               endElement
+        charactersSAXFunc               characters
+        cdataBlockSAXFunc               cdataBlock
+        referenceSAXFunc                reference
+        commentSAXFunc                  comment
+        processingInstructionSAXFunc	processingInstruction
+        startDocumentSAXFunc            startDocument
+        endDocumentSAXFunc              endDocument
+        int                             initialized  # presumably compared against XML_SAX2_MAGIC — TODO confirm
+        xmlStructuredErrorFunc          serror  # structured error callback slot
+        void*                           _private  # untyped pointer slot
+
+cdef extern from "libxml/xmlIO.h":  # input buffer allocation
+    cdef xmlParserInputBuffer* xmlAllocParserInputBuffer(int enc) nogil  # returns a buffer pointer; enc is passed as a plain int
+
+cdef extern from "libxml/parser.h":
+
+    cdef xmlDict* xmlDictCreate() nogil  # NOTE(review): xmlDict API is declared under parser.h here; presumably reached via its includes — confirm
+    cdef xmlDict* xmlDictCreateSub(xmlDict* subdict) nogil  # takes an existing xmlDict* and returns an xmlDict*
+    cdef void xmlDictFree(xmlDict* sub) nogil  # no return value
+    cdef int xmlDictReference(xmlDict* dict) nogil  # int result; meaning not visible from this declaration
+    
+    cdef int XML_COMPLETE_ATTRS # SAX option for adding DTD default attributes
+
+    ctypedef struct xmlParserCtxt:  # parser context fields visible to Cython; flag-like fields are typed as bint
+        xmlDoc* myDoc
+        xmlDict* dict
+        int dictNames
+        void* _private  # untyped pointer slot
+        bint wellFormed
+        bint recovery
+        int options  # presumably a bit mask of xmlParserOption values — TODO confirm
+        bint disableSAX
+        int errNo
+        bint replaceEntities
+        int loadsubset  # != 0 if enabled, int value == why
+        bint validate
+        xmlError lastError  # embedded by value, not a pointer
+        xmlNode* node
+        xmlSAXHandler* sax  # pointer to the SAX callback table
+        void* userData
+        int* spaceTab
+        int spaceMax
+        bint html
+        bint progressive
+        int inSubset
+        int charset
+        xmlParserInput* input
+
+    ctypedef enum xmlParserOption:  # each value is a distinct power of two (1 .. 4194304)
+        XML_PARSE_RECOVER = 1 # recover on errors
+        XML_PARSE_NOENT = 2 # substitute entities
+        XML_PARSE_DTDLOAD = 4 # load the external subset
+        XML_PARSE_DTDATTR = 8 # default DTD attributes
+        XML_PARSE_DTDVALID = 16 # validate with the DTD
+        XML_PARSE_NOERROR = 32 # suppress error reports
+        XML_PARSE_NOWARNING = 64 # suppress warning reports
+        XML_PARSE_PEDANTIC = 128 # pedantic error reporting
+        XML_PARSE_NOBLANKS = 256 # remove blank nodes
+        XML_PARSE_SAX1 = 512 # use the SAX1 interface internally
+        XML_PARSE_XINCLUDE = 1024 # implement XInclude substitution
+        XML_PARSE_NONET = 2048 # forbid network access
+        XML_PARSE_NODICT = 4096 # do not reuse the context dictionary
+        XML_PARSE_NSCLEAN = 8192 # remove redundant namespace declarations
+        XML_PARSE_NOCDATA = 16384 # merge CDATA as text nodes
+        XML_PARSE_NOXINCNODE = 32768 # do not generate XINCLUDE START/END nodes
+        # libxml2 2.6.21+ only:
+        XML_PARSE_COMPACT = 65536 # compact small text nodes
+        # libxml2 2.7.0+ only:
+        XML_PARSE_OLD10 = 131072 # parse using XML-1.0 before update 5
+        XML_PARSE_NOBASEFIX = 262144 # do not fixup XINCLUDE xml:base uris
+        XML_PARSE_HUGE = 524288 # relax any hardcoded limit from the parser
+        # libxml2 2.7.3+ only:
+        XML_PARSE_OLDSAX = 1048576 # parse using SAX2 interface before 2.7.0
+        # libxml2 2.8.0+ only:
+        XML_PARSE_IGNORE_ENC = 2097152 # ignore internal document encoding hint
+        # libxml2 2.9.0+ only:
+        XML_PARSE_BIG_LINES = 4194304 # store big line numbers in text PSVI field
+
+    cdef void xmlInitParser() nogil
+    cdef void xmlCleanupParser() nogil
+
+    cdef int xmlLineNumbersDefault(int onoff) nogil
+    cdef xmlParserCtxt* xmlNewParserCtxt() nogil
+    cdef xmlParserInput* xmlNewIOInputStream(xmlParserCtxt* ctxt,
+                                             xmlParserInputBuffer* input,
+                                             int enc) nogil
+    cdef int xmlCtxtUseOptions(xmlParserCtxt* ctxt, int options) nogil
+    cdef void xmlFreeParserCtxt(xmlParserCtxt* ctxt) nogil
+    cdef void xmlCtxtReset(xmlParserCtxt* ctxt) nogil
+    cdef void xmlClearParserCtxt(xmlParserCtxt* ctxt) nogil
+    cdef int xmlParseChunk(xmlParserCtxt* ctxt,
+                           char* chunk, int size, int terminate) nogil
+    cdef xmlDoc* xmlCtxtReadDoc(xmlParserCtxt* ctxt,
+                                char* cur, char* URL, char* encoding,
+                                int options) nogil
+    cdef xmlDoc* xmlCtxtReadFile(xmlParserCtxt* ctxt,
+                                 char* filename, char* encoding,
+                                 int options) nogil
+    cdef xmlDoc* xmlCtxtReadIO(xmlParserCtxt* ctxt, 
+                               xmlInputReadCallback ioread, 
+                               xmlInputCloseCallback ioclose, 
+                               void* ioctx,
+                               char* URL, char* encoding,
+                               int options) nogil
+    cdef xmlDoc* xmlCtxtReadMemory(xmlParserCtxt* ctxt,
+                                   char* buffer, int size,
+                                   char* filename, const_char* encoding,
+                                   int options) nogil
+
+# iterparse:
+
+    cdef xmlParserCtxt* xmlCreatePushParserCtxt(xmlSAXHandler* sax,
+                                                void* user_data,
+                                                char* chunk,
+                                                int size,
+                                                char* filename) nogil
+
+    cdef int xmlCtxtResetPush(xmlParserCtxt* ctxt,
+                              char* chunk,
+                              int size,
+                              char* filename,
+                              char* encoding) nogil
+
+# entity loaders:
+
+    ctypedef xmlParserInput* (*xmlExternalEntityLoader)(
+        const_char * URL, const_char * ID, xmlParserCtxt* context) nogil
+    cdef xmlExternalEntityLoader xmlGetExternalEntityLoader() nogil
+    cdef void xmlSetExternalEntityLoader(xmlExternalEntityLoader f) nogil
+
+# DTDs:
+
+    cdef xmlDtd* xmlParseDTD(const_xmlChar* ExternalID, const_xmlChar* SystemID) nogil
+    cdef xmlDtd* xmlIOParseDTD(xmlSAXHandler* sax,
+                               xmlParserInputBuffer* input,
+                               int enc) nogil
+
+cdef extern from "libxml/parserInternals.h":  # parser input stream helpers
+    cdef xmlParserInput* xmlNewInputStream(xmlParserCtxt* ctxt)  # NOTE(review): only declaration in this block without 'nogil'
+    cdef xmlParserInput* xmlNewStringInputStream(xmlParserCtxt* ctxt, 
+                                                 char* buffer) nogil
+    cdef xmlParserInput* xmlNewInputFromFile(xmlParserCtxt* ctxt, 
+                                             char* filename) nogil
+    cdef void xmlFreeInputStream(xmlParserInput* input) nogil
+    cdef int xmlSwitchEncoding(xmlParserCtxt* ctxt, int enc) nogil  # enc: plain int here (presumably an encoding id - confirm)
diff --git a/lib/lxml/includes/xmlschema.pxd b/lib/lxml/includes/xmlschema.pxd
new file mode 100644
index 00000000..8e93cc57
--- /dev/null
+++ b/lib/lxml/includes/xmlschema.pxd
@@ -0,0 +1,35 @@
+from lxml.includes.tree cimport xmlDoc
+from lxml.includes.xmlparser cimport xmlSAXHandler
+from lxml.includes.xmlerror cimport xmlStructuredErrorFunc
+
+cdef extern from "libxml/xmlschemas.h":  # XML Schema parsing and validation declarations
+    ctypedef struct xmlSchema  # opaque here: no fields declared
+    ctypedef struct xmlSchemaParserCtxt  # opaque here: no fields declared
+
+    ctypedef struct xmlSchemaSAXPlugStruct  # opaque here: no fields declared
+    ctypedef struct xmlSchemaValidCtxt  # opaque here: no fields declared
+
+    ctypedef enum xmlSchemaValidOption:
+        XML_SCHEMA_VAL_VC_I_CREATE = 1
+
+    cdef xmlSchemaValidCtxt* xmlSchemaNewValidCtxt(xmlSchema* schema) nogil
+    cdef void xmlSchemaSetParserStructuredErrors(xmlSchemaParserCtxt* ctxt,
+        xmlStructuredErrorFunc serror, void *ctx)  # declared without 'nogil'
+    cdef void xmlSchemaSetValidStructuredErrors(xmlSchemaValidCtxt* ctxt,
+        xmlStructuredErrorFunc serror, void *ctx)  # declared without 'nogil'
+
+    cdef int xmlSchemaValidateDoc(xmlSchemaValidCtxt* ctxt, xmlDoc* doc) nogil
+    cdef xmlSchema* xmlSchemaParse(xmlSchemaParserCtxt* ctxt) nogil
+    cdef xmlSchemaParserCtxt* xmlSchemaNewParserCtxt(char* URL) nogil
+    cdef xmlSchemaParserCtxt* xmlSchemaNewDocParserCtxt(xmlDoc* doc) nogil
+    cdef void xmlSchemaFree(xmlSchema* schema) nogil
+    cdef void xmlSchemaFreeParserCtxt(xmlSchemaParserCtxt* ctxt) nogil
+    cdef void xmlSchemaFreeValidCtxt(xmlSchemaValidCtxt* ctxt) nogil
+    cdef int xmlSchemaSetValidOptions(xmlSchemaValidCtxt* ctxt,
+                                      int options) nogil
+
+    cdef xmlSchemaSAXPlugStruct* xmlSchemaSAXPlug(xmlSchemaValidCtxt* ctxt,
+                                                  xmlSAXHandler** sax,
+                                                  void** data) nogil
+    cdef int xmlSchemaSAXUnplug(xmlSchemaSAXPlugStruct* sax_plug)  # declared without 'nogil'
+    cdef int xmlSchemaIsValid(xmlSchemaValidCtxt* ctxt)  # declared without 'nogil'
diff --git a/lib/lxml/includes/xpath.pxd b/lib/lxml/includes/xpath.pxd
new file mode 100644
index 00000000..d01735b6
--- /dev/null
+++ b/lib/lxml/includes/xpath.pxd
@@ -0,0 +1,135 @@
+from lxml.includes cimport tree
+from lxml.includes cimport xmlerror
+
+from libc.string cimport const_char
+from lxml.includes.tree cimport xmlChar, const_xmlChar
+
+cdef extern from "libxml/xpath.h":  # XPath object model, contexts and evaluation entry points
+    ctypedef enum xmlXPathObjectType:  # type tag stored in xmlXPathObject.type
+        XPATH_UNDEFINED = 0
+        XPATH_NODESET = 1
+        XPATH_BOOLEAN = 2
+        XPATH_NUMBER = 3
+        XPATH_STRING = 4
+        XPATH_POINT = 5
+        XPATH_RANGE = 6
+        XPATH_LOCATIONSET = 7
+        XPATH_USERS = 8
+        XPATH_XSLT_TREE = 9
+
+    ctypedef enum xmlXPathError:  # XPATH_* and XPTR_* codes share one numbering (0..22)
+        XPATH_EXPRESSION_OK = 0
+        XPATH_NUMBER_ERROR = 1
+        XPATH_UNFINISHED_LITERAL_ERROR = 2
+        XPATH_START_LITERAL_ERROR = 3
+        XPATH_VARIABLE_REF_ERROR = 4
+        XPATH_UNDEF_VARIABLE_ERROR = 5
+        XPATH_INVALID_PREDICATE_ERROR = 6
+        XPATH_EXPR_ERROR = 7
+        XPATH_UNCLOSED_ERROR = 8
+        XPATH_UNKNOWN_FUNC_ERROR = 9
+        XPATH_INVALID_OPERAND = 10
+        XPATH_INVALID_TYPE = 11
+        XPATH_INVALID_ARITY = 12
+        XPATH_INVALID_CTXT_SIZE = 13
+        XPATH_INVALID_CTXT_POSITION = 14
+        XPATH_MEMORY_ERROR = 15
+        XPTR_SYNTAX_ERROR = 16
+        XPTR_RESOURCE_ERROR = 17
+        XPTR_SUB_RESOURCE_ERROR = 18
+        XPATH_UNDEF_PREFIX_ERROR = 19
+        XPATH_ENCODING_ERROR = 20
+        XPATH_INVALID_CHAR_ERROR = 21
+        XPATH_INVALID_CTXT = 22
+
+    ctypedef struct xmlNodeSet:
+        int nodeNr  # presumably the number of entries used in nodeTab - confirm
+        int nodeMax  # presumably the allocated size of nodeTab - confirm
+        tree.xmlNode** nodeTab
+        
+    ctypedef struct xmlXPathObject:  # presumably 'type' tells which *val field is meaningful - confirm
+        xmlXPathObjectType type
+        xmlNodeSet* nodesetval
+        bint boolval
+        double floatval
+        xmlChar* stringval
+
+    ctypedef struct xmlXPathContext:  # only the fields listed below are declared for Cython code
+        tree.xmlDoc* doc
+        tree.xmlNode* node
+        tree.xmlDict* dict
+        tree.xmlHashTable* nsHash
+        const_xmlChar* function
+        const_xmlChar* functionURI
+        xmlerror.xmlStructuredErrorFunc error
+        xmlerror.xmlError lastError
+        void* userData
+
+    ctypedef struct xmlXPathParserContext:
+        xmlXPathContext* context
+        xmlXPathObject* value
+        tree.xmlNode* ancestor
+        int error  # plain int here (presumably an xmlXPathError code - confirm)
+
+    ctypedef struct xmlXPathCompExpr  # opaque here: no fields declared
+
+    ctypedef void (*xmlXPathFunction)(xmlXPathParserContext* ctxt, int nargs) nogil
+    ctypedef xmlXPathFunction (*xmlXPathFuncLookupFunc)(void* ctxt,
+                                                        const_xmlChar* name,
+                                                        const_xmlChar* ns_uri) nogil
+    
+    cdef xmlXPathContext* xmlXPathNewContext(tree.xmlDoc* doc) nogil
+    cdef xmlXPathObject* xmlXPathEvalExpression(const_xmlChar* str,
+                                                xmlXPathContext* ctxt) nogil
+    cdef xmlXPathObject* xmlXPathCompiledEval(xmlXPathCompExpr* comp,
+                                              xmlXPathContext* ctxt) nogil
+    cdef xmlXPathCompExpr* xmlXPathCompile(const_xmlChar* str) nogil
+    cdef xmlXPathCompExpr* xmlXPathCtxtCompile(xmlXPathContext* ctxt,
+                                               const_xmlChar* str) nogil
+    cdef void xmlXPathFreeContext(xmlXPathContext* ctxt) nogil
+    cdef void xmlXPathFreeCompExpr(xmlXPathCompExpr* comp) nogil
+    cdef void xmlXPathFreeObject(xmlXPathObject* obj) nogil
+    cdef int xmlXPathRegisterNs(xmlXPathContext* ctxt,
+                                const_xmlChar* prefix, const_xmlChar* ns_uri) nogil
+    
+    cdef xmlNodeSet* xmlXPathNodeSetCreate(tree.xmlNode* val) nogil
+    cdef void xmlXPathFreeNodeSet(xmlNodeSet* val) nogil
+
+
+cdef extern from "libxml/xpathInternals.h":  # function/variable registration and XPath object helpers
+    cdef int xmlXPathRegisterFunc(xmlXPathContext* ctxt,
+                                  const_xmlChar* name,
+                                  xmlXPathFunction f) nogil
+    cdef int xmlXPathRegisterFuncNS(xmlXPathContext* ctxt,
+                                    const_xmlChar* name,
+                                    const_xmlChar* ns_uri,
+                                    xmlXPathFunction f) nogil
+    cdef void xmlXPathRegisterFuncLookup(xmlXPathContext *ctxt,
+                                         xmlXPathFuncLookupFunc f,
+                                         void *funcCtxt) nogil
+    cdef int xmlXPathRegisterVariable(xmlXPathContext *ctxt, 
+                                      const_xmlChar* name,
+                                      xmlXPathObject* value) nogil
+    cdef int xmlXPathRegisterVariableNS(xmlXPathContext *ctxt, 
+                                        const_xmlChar* name,
+                                        const_xmlChar* ns_uri,
+                                        xmlXPathObject* value) nogil
+    cdef void xmlXPathRegisteredVariablesCleanup(xmlXPathContext *ctxt) nogil
+    cdef void xmlXPathRegisteredNsCleanup(xmlXPathContext *ctxt) nogil
+    cdef xmlXPathObject* valuePop (xmlXPathParserContext *ctxt) nogil  # presumably pops from the context's value stack - confirm
+    cdef int valuePush(xmlXPathParserContext* ctxt, xmlXPathObject *value) nogil  # presumably the matching push - confirm
+    
+    cdef xmlXPathObject* xmlXPathNewCString(const_char *val) nogil
+    cdef xmlXPathObject* xmlXPathWrapCString(const_char * val) nogil
+    cdef xmlXPathObject* xmlXPathNewString(const_xmlChar *val) nogil
+    cdef xmlXPathObject* xmlXPathWrapString(const_xmlChar * val) nogil
+    cdef xmlXPathObject* xmlXPathNewFloat(double val) nogil
+    cdef xmlXPathObject* xmlXPathNewBoolean(int val) nogil
+    cdef xmlXPathObject* xmlXPathNewNodeSet(tree.xmlNode* val) nogil
+    cdef xmlXPathObject* xmlXPathNewValueTree(tree.xmlNode* val) nogil
+    cdef void xmlXPathNodeSetAdd(xmlNodeSet* cur,
+                                  tree.xmlNode* val) nogil
+    cdef void xmlXPathNodeSetAddUnique(xmlNodeSet* cur,
+                                        tree.xmlNode* val) nogil
+    cdef xmlXPathObject* xmlXPathWrapNodeSet(xmlNodeSet* val) nogil
+    cdef void xmlXPathErr(xmlXPathParserContext* ctxt, int error) nogil  # error: plain int (presumably an xmlXPathError code - confirm)
diff --git a/lib/lxml/includes/xslt.pxd b/lib/lxml/includes/xslt.pxd
new file mode 100644
index 00000000..3ca35d7f
--- /dev/null
+++ b/lib/lxml/includes/xslt.pxd
@@ -0,0 +1,176 @@
+from lxml.includes.tree cimport xmlDoc, xmlNode, xmlDict, xmlChar, const_xmlChar
+from lxml.includes.xpath cimport xmlXPathContext, xmlXPathFunction
+
+from libc.string cimport const_char
+
+cdef extern from "libxslt/xslt.h":  # global int variables exported by the header
+    cdef int xsltLibxsltVersion  # presumably the version of the loaded library - confirm
+    cdef int xsltMaxDepth
+
+cdef extern from "libxslt/xsltconfig.h":  # build configuration header
+    cdef int LIBXSLT_VERSION  # presumably the compile-time version macro - confirm
+
+cdef extern from "libxslt/xsltInternals.h":  # stylesheet and transform context structures
+    ctypedef enum xsltTransformState:  # values are not set here; the trailing numbers are notes
+        XSLT_STATE_OK       # 0
+        XSLT_STATE_ERROR    # 1
+        XSLT_STATE_STOPPED  # 2
+
+    ctypedef struct xsltDocument:
+        xmlDoc* doc
+
+    ctypedef struct xsltStylesheet:  # only the fields listed below are declared for Cython code
+        xmlChar* encoding
+        xmlDoc* doc
+        int errors
+
+    ctypedef struct xsltTransformContext:  # only the fields listed below are declared for Cython code
+        xsltStylesheet* style
+        xmlXPathContext* xpathCtxt
+        xsltDocument* document
+        void* _private
+        xmlDict* dict
+        int profile
+        xmlNode* node
+        xmlDoc* output
+        xmlNode* insert
+        xmlNode* inst
+        xsltTransformState state
+
+    ctypedef struct xsltStackElem  # opaque here: no fields declared
+
+    ctypedef struct xsltTemplate  # opaque here: no fields declared
+
+    cdef xsltStylesheet* xsltParseStylesheetDoc(xmlDoc* doc) nogil
+    cdef void xsltFreeStylesheet(xsltStylesheet* sheet) nogil
+
+cdef extern from "libxslt/extensions.h":  # registration of extension functions, prefixes and elements
+    ctypedef void (*xsltTransformFunction)(xsltTransformContext* ctxt,
+                                           xmlNode* context_node,
+                                           xmlNode* inst,
+                                           void* precomp_unused) nogil  # last argument is typed as a bare void* here
+
+    cdef int xsltRegisterExtFunction(xsltTransformContext* ctxt,
+                                     const_xmlChar* name,
+                                     const_xmlChar* URI,
+                                     xmlXPathFunction function) nogil
+    cdef int xsltRegisterExtModuleFunction(const_xmlChar* name, const_xmlChar* URI,
+                                           xmlXPathFunction function) nogil
+    cdef int xsltUnregisterExtModuleFunction(const_xmlChar* name, const_xmlChar* URI)  # declared without 'nogil'
+    cdef xmlXPathFunction xsltExtModuleFunctionLookup(
+        const_xmlChar* name, const_xmlChar* URI) nogil
+    cdef int xsltRegisterExtPrefix(xsltStylesheet* style, 
+                                   const_xmlChar* prefix, const_xmlChar* URI) nogil
+    cdef int xsltRegisterExtElement(xsltTransformContext* ctxt,
+                                    const_xmlChar* name, const_xmlChar* URI,
+                                    xsltTransformFunction function) nogil
+
+cdef extern from "libxslt/documents.h":  # document loader hook
+    ctypedef enum xsltLoadType:  # passed to the loader callback as its 'type' argument
+        XSLT_LOAD_START
+        XSLT_LOAD_STYLESHEET
+        XSLT_LOAD_DOCUMENT
+
+    ctypedef xmlDoc* (*xsltDocLoaderFunc)(const_xmlChar* URI, xmlDict* dict,
+                                          int options,
+                                          void* ctxt,
+                                          xsltLoadType type) nogil
+    cdef xsltDocLoaderFunc xsltDocDefaultLoader  # a variable holding a loader function, not a function
+    cdef void xsltSetLoaderFunc(xsltDocLoaderFunc f) nogil
+
+cdef extern from "libxslt/transform.h":  # stylesheet application and transform context lifecycle
+    cdef xmlDoc* xsltApplyStylesheet(xsltStylesheet* style, xmlDoc* doc,
+                                     const_char** params) nogil
+    cdef xmlDoc* xsltApplyStylesheetUser(xsltStylesheet* style, xmlDoc* doc,
+                                         const_char** params, const_char* output,
+                                         void* profile,
+                                         xsltTransformContext* context) nogil  # 'profile' is typed as a bare void* here
+    cdef void xsltProcessOneNode(xsltTransformContext* ctxt,
+                                 xmlNode* contextNode,
+                                 xsltStackElem* params) nogil
+    cdef xsltTransformContext* xsltNewTransformContext(xsltStylesheet* style,
+                                                       xmlDoc* doc) nogil
+    cdef void xsltFreeTransformContext(xsltTransformContext* context) nogil
+    cdef void xsltApplyOneTemplate(xsltTransformContext* ctxt,
+                                   xmlNode* contextNode, xmlNode* list,
+                                   xsltTemplate* templ,
+                                   xsltStackElem* params) nogil
+
+cdef extern from "libxslt/xsltutils.h":  # result serialisation and error reporting hooks
+    cdef int xsltSaveResultToString(xmlChar** doc_txt_ptr,
+                                    int* doc_txt_len,
+                                    xmlDoc* result,
+                                    xsltStylesheet* style) nogil  # text and length are returned through the two pointer arguments
+    
+    cdef void xsltSetGenericErrorFunc(
+        void* ctxt, void (*handler)(void* ctxt, char* msg, ...)) nogil  # NOTE(review): handler type has no 'nogil', unlike the one below
+    cdef void xsltSetTransformErrorFunc(
+        xsltTransformContext*, void* ctxt,
+        void (*handler)(void* ctxt, char* msg, ...) nogil) nogil
+    cdef void xsltTransformError(xsltTransformContext* ctxt, 
+                                 xsltStylesheet* style, 
+                                 xmlNode* node, char* msg, ...)  # variadic; declared without 'nogil'
+    cdef void xsltSetCtxtParseOptions(
+        xsltTransformContext* ctxt, int options)  # declared without 'nogil'
+
+cdef extern from "libxslt/security.h":  # security preferences for transformations
+    ctypedef struct xsltSecurityPrefs  # opaque here: no fields declared
+    ctypedef enum xsltSecurityOption:  # selects which preference a check function applies to
+        XSLT_SECPREF_READ_FILE = 1
+        XSLT_SECPREF_WRITE_FILE = 2
+        XSLT_SECPREF_CREATE_DIRECTORY = 3
+        XSLT_SECPREF_READ_NETWORK = 4
+        XSLT_SECPREF_WRITE_NETWORK = 5
+
+    ctypedef int (*xsltSecurityCheck)(xsltSecurityPrefs* sec,
+                                      xsltTransformContext* ctxt,
+                                      char* value) nogil
+
+    cdef xsltSecurityPrefs* xsltNewSecurityPrefs() nogil
+    cdef void xsltFreeSecurityPrefs(xsltSecurityPrefs* sec) nogil
+    cdef int xsltSecurityForbid(xsltSecurityPrefs* sec,
+                                xsltTransformContext* ctxt,
+                                char* value) nogil  # same signature as xsltSecurityCheck
+    cdef int xsltSecurityAllow(xsltSecurityPrefs* sec,
+                                xsltTransformContext* ctxt,
+                                char* value) nogil  # same signature as xsltSecurityCheck
+    cdef int xsltSetSecurityPrefs(xsltSecurityPrefs* sec,
+                                  xsltSecurityOption option,
+                                  xsltSecurityCheck func) nogil
+    cdef xsltSecurityCheck xsltGetSecurityPrefs(
+        xsltSecurityPrefs* sec,
+        xsltSecurityOption option) nogil
+    cdef int xsltSetCtxtSecurityPrefs(xsltSecurityPrefs* sec,
+                                      xsltTransformContext* ctxt) nogil
+    cdef xmlDoc* xsltGetProfileInformation(xsltTransformContext* ctxt) nogil  # NOTE(review): not security-related by name; confirm the declaring header
+
+cdef extern from "libxslt/variables.h":  # user parameter helpers; both declared without 'nogil'
+    cdef int xsltQuoteUserParams(xsltTransformContext* ctxt,
+                                 const_char** params)
+    cdef int xsltQuoteOneUserParam(xsltTransformContext* ctxt,
+                                   const_xmlChar* name,
+                                   const_xmlChar* value)
+
+cdef extern from "libxslt/extra.h":  # namespace constants and registration of the extras
+    const_xmlChar* XSLT_LIBXSLT_NAMESPACE
+    const_xmlChar* XSLT_XALAN_NAMESPACE
+    const_xmlChar* XSLT_SAXON_NAMESPACE
+    const_xmlChar* XSLT_XT_NAMESPACE
+
+    cdef xmlXPathFunction xsltFunctionNodeSet  # declared as a value of the XPath function pointer type
+    cdef void xsltRegisterAllExtras() nogil
+
+cdef extern from "libexslt/exslt.h":  # EXSLT registration functions and namespace constants
+    cdef void exsltRegisterAll() nogil
+
+    # libexslt 1.1.25+
+    const_xmlChar* EXSLT_DATE_NAMESPACE
+    const_xmlChar* EXSLT_SETS_NAMESPACE
+    const_xmlChar* EXSLT_MATH_NAMESPACE
+    const_xmlChar* EXSLT_STRINGS_NAMESPACE
+
+    cdef int exsltDateXpathCtxtRegister(xmlXPathContext* ctxt, const_xmlChar* prefix)  # these four are declared without 'nogil'
+    cdef int exsltSetsXpathCtxtRegister(xmlXPathContext* ctxt, const_xmlChar* prefix)
+    cdef int exsltMathXpathCtxtRegister(xmlXPathContext* ctxt, const_xmlChar* prefix)
+    cdef int exsltStrXpathCtxtRegister(xmlXPathContext* ctxt, const_xmlChar* prefix)
+
diff --git a/lib/lxml/isoschematron/__init__.py b/lib/lxml/isoschematron/__init__.py
new file mode 100644
index 00000000..f4b091ea
--- /dev/null
+++ b/lib/lxml/isoschematron/__init__.py
@@ -0,0 +1,316 @@
+"""The ``lxml.isoschematron`` package implements ISO Schematron support on top
+of the pure-xslt 'skeleton' implementation.
+"""
+
+import sys
+import os.path
+from lxml import etree as _etree # due to validator __init__ signature
+
+
+# compat aliases (borrowed from lxml.html): bind each name only if it is missing
+try:
+    bytes
+except NameError:
+    # Python < 2.6: no 'bytes' name, alias it to str
+    bytes = str
+try:
+    unicode
+except NameError:
+    # Python 3: no 'unicode' name, alias it to str
+    unicode = str
+try:
+    basestring
+except NameError:
+    # Python 3: no 'basestring' name, alias it to str
+    basestring = str
+
+
+__all__ = ['extract_xsd', 'extract_rng', 'iso_dsdl_include',
+           'iso_abstract_expand', 'iso_svrl_for_xslt1',
+           'svrl_validation_errors', 'schematron_schema_valid',
+           'stylesheet_params', 'Schematron'] 
+
+
+# namespace URIs used by this module
+#FIXME: Maybe lxml should provide a dedicated place for common namespace
+#FIXME: definitions?
+XML_SCHEMA_NS = "http://www.w3.org/2001/XMLSchema"
+RELAXNG_NS = "http://relaxng.org/ns/structure/1.0"
+SCHEMATRON_NS = "http://purl.oclc.org/dsdl/schematron"
+SVRL_NS = "http://purl.oclc.org/dsdl/svrl"
+
+
+# helpers: root tags in '{namespace}name' form and the bundled resources dir
+_schematron_root = '{%s}schema' % SCHEMATRON_NS
+_xml_schema_root = '{%s}schema' % XML_SCHEMA_NS
+_resources_dir = os.path.join(os.path.dirname(__file__), 'resources')
+
+
+# the iso-schematron skeleton steps as XSLT objects, parsed at import time
+extract_xsd = _etree.XSLT(_etree.parse(
+    os.path.join(_resources_dir, 'xsl', 'XSD2Schtrn.xsl')))
+extract_rng = _etree.XSLT(_etree.parse(
+    os.path.join(_resources_dir, 'xsl', 'RNG2Schtrn.xsl')))
+iso_dsdl_include = _etree.XSLT(_etree.parse(
+    os.path.join(_resources_dir, 'xsl', 'iso-schematron-xslt1',
+                 'iso_dsdl_include.xsl')))
+iso_abstract_expand = _etree.XSLT(_etree.parse(
+    os.path.join(_resources_dir, 'xsl', 'iso-schematron-xslt1',
+                 'iso_abstract_expand.xsl')))
+iso_svrl_for_xslt1 = _etree.XSLT(_etree.parse(
+    os.path.join(_resources_dir,
+                 'xsl', 'iso-schematron-xslt1', 'iso_svrl_for_xslt1.xsl')))
+
+
+# svrl result accessor: selects svrl:failed-assert elements only
+svrl_validation_errors = _etree.XPath(
+    '//svrl:failed-assert', namespaces={'svrl': SVRL_NS})
+
+
+# RelaxNG validator for schematron schemas, loaded at import time
+schematron_schema_valid = _etree.RelaxNG(_etree.parse(
+    os.path.join(_resources_dir, 'rng', 'iso-schematron.rng')))
+
+
+def stylesheet_params(**kwargs):
+    """Convert keyword args to a dictionary of stylesheet parameters.
+    XSL stylesheet parameters must be XPath expressions, i.e.:
+
+    * string expressions, like "'5'"
+    * simple (number) expressions, like "5"
+    * valid XPath expressions, like "/a/b/text()"
+
+    This function converts native Python keyword arguments to stylesheet
+    parameters following these rules:
+    If an arg is a string wrap it with XSLT.strparam().
+    If an arg is an XPath object use its path string.
+    If arg is None raise TypeError.
+    Else convert arg to string.
+    """
+    result = {}
+    for key, val in kwargs.items():
+        if isinstance(val, basestring):
+            val = _etree.XSLT.strparam(val)
+        elif val is None:
+            raise TypeError('None not allowed as a stylesheet parameter')
+        elif not isinstance(val, _etree.XPath):
+            val = unicode(val)
+        result[key] = val
+    return result
+
+
+# helper function for use in Schematron __init__
+def _stylesheet_param_dict(paramsDict, kwargsDict):
+    """Return a copy of paramsDict, updated with kwargsDict entries, wrapped as
+    stylesheet arguments.
+    kwargsDict entries with a value of None are ignored.
+    """
+    # beware of changing mutable default arg
+    paramsDict = dict(paramsDict)
+    for k, v in kwargsDict.items():
+        if v is not None: # None values do not override
+            paramsDict[k] = v
+    paramsDict = stylesheet_params(**paramsDict)
+    return paramsDict
+    
+
+class Schematron(_etree._Validator):
+    """An ISO Schematron validator.
+
+    Pass a root Element or an ElementTree to turn it into a validator.
+    Alternatively, pass a filename as keyword argument 'file' to parse from
+    the file system.
+    Built on the Schematron language 'reference' skeleton pure-xslt
+    implementation, the validator is created as an XSLT 1.0 stylesheet using
+    these steps:
+
+     0) (Extract from XML Schema or RelaxNG schema)
+     1) Process inclusions
+     2) Process abstract patterns
+     3) Compile the schematron schema to XSLT
+
+    The ``include`` and ``expand`` keyword arguments can be used to switch off
+    steps 1) and 2).
+    To set parameters for steps 1), 2) and 3) hand parameter dictionaries to the
+    keyword arguments ``include_params``, ``expand_params`` or
+    ``compile_params``.
+    For convenience, the compile-step parameter ``phase`` is also exposed as a
+    keyword argument ``phase``. This takes precedence if the parameter is also
+    given in the parameter dictionary.
+    If ``store_schematron`` is set to True, the (included-and-expanded)
+    schematron document tree is stored and available through the ``schematron``
+    property.
+    If ``store_xslt`` is set to True, the validation XSLT document tree will be
+    stored and can be retrieved through the ``validator_xslt`` property.
+    With ``store_report`` set to True (default: False), the resulting validation
+    report document gets stored and can be accessed as the ``validation_report``
+    property.
+
+    Schematron is a less well known, but very powerful schema language.  The main
+    idea is to use the capabilities of XPath to put restrictions on the structure
+    and the content of XML documents.  Here is a simple example::
+
+      >>> from lxml import isoschematron
+      >>> schematron = isoschematron.Schematron(etree.XML('''
+      ... <schema xmlns="http://purl.oclc.org/dsdl/schematron" >
+      ...   <pattern id="id_only_attribute">
+      ...     <title>id is the only permitted attribute name</title>
+      ...     <rule context="*">
+      ...       <report test="@*[not(name()='id')]">Attribute
+      ...         <name path="@*[not(name()='id')]"/> is forbidden<name/>
+      ...       </report>
+      ...     </rule>
+      ...   </pattern>
+      ... </schema>
+      ... '''))
+
+      >>> xml = etree.XML('''
+      ... <AAA name="aaa">
+      ...   <BBB id="bbb"/>
+      ...   <CCC color="ccc"/>
+      ... </AAA>
+      ... ''')
+
+      >>> schematron.validate(xml)
+      0
+
+      >>> xml = etree.XML('''
+      ... <AAA id="aaa">
+      ...   <BBB id="bbb"/>
+      ...   <CCC/>
+      ... </AAA>
+      ... ''')
+
+      >>> schematron.validate(xml)
+      1
+    """
+
+    # libxml2 error categorization for validation errors
+    _domain = _etree.ErrorDomains.SCHEMATRONV
+    _level = _etree.ErrorLevels.ERROR
+    _error_type = _etree.ErrorTypes.SCHEMATRONV_ASSERT
+
+    def _extract(self, element):
+        """Extract embedded schematron schema from non-schematron host schema.
+        This method will only be called by __init__ if the given schema document
+        is not a schematron schema by itself.
+        Must return a schematron schema document tree or None.
+        """
+        schematron = None
+        if element.tag == _xml_schema_root:
+            schematron = self._extract_xsd(element)
+        elif element.nsmap[element.prefix] == RELAXNG_NS:
+            # RelaxNG does not have a single unique root element
+            schematron = self._extract_rng(element)
+        return schematron
+    
+    # customization points
+    # etree.XSLT objects that provide the extract, include, expand, compile
+    # steps
+    _extract_xsd = extract_xsd
+    _extract_rng = extract_rng
+    _include = iso_dsdl_include
+    _expand = iso_abstract_expand
+    _compile = iso_svrl_for_xslt1
+    # etree.XPath object that determines input document validity when applied to
+    # the svrl result report; must return a list of result elements (empty if
+    # valid)
+    _validation_errors = svrl_validation_errors
+    
+    def __init__(self, etree=None, file=None, include=True, expand=True,
+                 include_params={}, expand_params={}, compile_params={},
+                 store_schematron=False, store_xslt=False, store_report=False,
+                 phase=None):
+        super(Schematron, self).__init__()
+
+        self._store_report = store_report
+        self._schematron = None
+        self._validator_xslt = None
+        self._validation_report = None
+
+        # parse schema document, may be a schematron schema or an XML Schema or
+        # a RelaxNG schema with embedded schematron rules
+        try:
+            if etree is not None:
+                if isinstance(etree, _etree._Element):
+                    root = etree
+                else:
+                    root = etree.getroot()
+            elif file is not None:
+                root = _etree.parse(file).getroot()
+        except Exception:
+            raise _etree.SchematronParseError(
+                "No tree or file given: %s" % sys.exc_info()[1])
+        if root is None:
+             raise ValueError("Empty tree")
+        if root.tag == _schematron_root:
+            schematron = root
+        else:
+            schematron = self._extract(root)
+        if schematron is None:
+            raise _etree.SchematronParseError(
+                "Document is not a schematron schema or schematron-extractable")
+        # perform the iso-schematron skeleton implementation steps to get a
+        # validating xslt
+        if include:
+            schematron = self._include(schematron, **include_params)
+        if expand:
+            schematron = self._expand(schematron, **expand_params)
+        if not schematron_schema_valid(schematron):
+            raise _etree.SchematronParseError(
+                "invalid schematron schema: %s" %
+                schematron_schema_valid.error_log)
+        if store_schematron:
+            self._schematron = schematron
+        # add new compile keyword args here if exposing them
+        compile_kwargs = {'phase': phase}
+        compile_params = _stylesheet_param_dict(compile_params, compile_kwargs)
+        validator_xslt = self._compile(schematron, **compile_params)
+        if store_xslt:
+            self._validator_xslt = validator_xslt
+        self._validator = _etree.XSLT(validator_xslt)
+        
+    def __call__(self, etree):
+        """Validate doc using Schematron.
+
+        Returns true if document is valid, false if not.
+        """
+        self._clear_error_log()
+        result = self._validator(etree)
+        if self._store_report:
+            self._validation_report = result
+        errors = self._validation_errors(result)
+        if errors:
+            if isinstance(etree, _etree._Element):
+                fname = etree.getroottree().docinfo.URL or '<file>'
+            else:
+                fname = etree.docinfo.URL or '<file>'
+            for error in errors:
+                # Does svrl report the line number, anywhere? Don't think so.
+                self._append_log_message(
+                    domain=self._domain, type=self._error_type,
+                    level=self._level, line=0, message=_etree.tounicode(error),
+                    filename=fname)
+            return False
+        return True
+
+    def schematron(self):
+        """ISO-schematron schema document (None if object has been initialized
+        with store_schematron=False).
+        """
+        return self._schematron
+    schematron = property(schematron, doc=schematron.__doc__)
+
+    def validator_xslt(self):
+        """ISO-schematron skeleton implementation XSLT validator document (None
+        if object has been initialized with store_xslt=False). 
+        """
+        return self._validator_xslt
+    validator_xslt = property(validator_xslt, doc=validator_xslt.__doc__)
+
+    def validation_report(self):
+        """ISO-schematron validation result report (None if result-storing has
+        been turned off).
+        """
+        return self._validation_report
+    validation_report = property(validation_report, doc=validation_report.__doc__)
diff --git a/lib/lxml/isoschematron/resources/rng/iso-schematron.rng b/lib/lxml/isoschematron/resources/rng/iso-schematron.rng
new file mode 100644
index 00000000..d822f0d6
--- /dev/null
+++ b/lib/lxml/isoschematron/resources/rng/iso-schematron.rng
@@ -0,0 +1,622 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+         (c) International Organization for Standardization 2005. 
+        Permission to copy in any form is granted for use with conforming 
+        SGML systems and applications as defined in ISO 8879, 
+        provided this notice is included in all copies.
+-->
+<grammar ns="http://purl.oclc.org/dsdl/schematron" xmlns="http://relaxng.org/ns/structure/1.0" datatypeLibrary="http://www.w3.org/2001/XMLSchema-datatypes">
+  <start>
+    <ref name="schema"/>
+  </start>
+  <!-- Element declarations -->
+  <define name="schema">
+    <element name="schema">
+      <optional>
+        <attribute name="id">
+          <data type="ID"/>
+        </attribute>
+      </optional>
+      <ref name="rich"/>
+      <optional>
+        <attribute name="schemaVersion">
+          <ref name="non-empty-string"/>
+        </attribute>
+      </optional>
+      <optional>
+        <attribute name="defaultPhase">
+          <data type="IDREF"/>
+        </attribute>
+      </optional>
+      <optional>
+        <attribute name="queryBinding">
+          <ref name="non-empty-string"/>
+        </attribute>
+      </optional>
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <ref name="inclusion"/>
+        </zeroOrMore>
+        <group>
+          <optional>
+            <ref name="title"/>
+          </optional>
+          <zeroOrMore>
+            <ref name="ns"/>
+          </zeroOrMore>
+          <zeroOrMore>
+            <ref name="p"/>
+          </zeroOrMore>
+          <zeroOrMore>
+            <ref name="let"/>
+          </zeroOrMore>
+          <zeroOrMore>
+            <ref name="phase"/>
+          </zeroOrMore>
+          <oneOrMore>
+            <ref name="pattern"/>
+          </oneOrMore>
+          <zeroOrMore>
+            <ref name="p"/>
+          </zeroOrMore>
+          <optional>
+            <ref name="diagnostics"/>
+          </optional>
+        </group>
+      </interleave>
+    </element>
+  </define>
+  <define name="active">
+    <element name="active">
+      <attribute name="pattern">
+        <data type="IDREF"/>
+      </attribute>
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <choice>
+            <text/>
+            <ref name="dir"/>
+            <ref name="emph"/>
+            <ref name="span"/>
+          </choice>
+        </zeroOrMore>
+      </interleave>
+    </element>
+  </define>
+  <define name="assert">
+    <element name="assert">
+      <attribute name="test">
+        <ref name="exprValue"/>
+      </attribute>
+      <optional>
+        <attribute name="flag">
+          <ref name="flagValue"/>
+        </attribute>
+      </optional>
+      <optional>
+        <attribute name="id">
+          <data type="ID"/>
+        </attribute>
+      </optional>
+      <optional>
+        <attribute name="diagnostics">
+          <data type="IDREFS"/>
+        </attribute>
+      </optional>
+      <ref name="rich"/>
+      <ref name="linkable"/>
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <choice>
+            <text/>
+            <ref name="name"/>
+            <ref name="value-of"/>
+            <ref name="emph"/>
+            <ref name="dir"/>
+            <ref name="span"/>
+          </choice>
+        </zeroOrMore>
+      </interleave>
+    </element>
+  </define>
+  <define name="diagnostic">
+    <element name="diagnostic">
+      <attribute name="id">
+        <data type="ID"/>
+      </attribute>
+      <ref name="rich"/>
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <choice>
+            <text/>
+            <ref name="value-of"/>
+            <ref name="emph"/>
+            <ref name="dir"/>
+            <ref name="span"/>
+          </choice>
+        </zeroOrMore>
+      </interleave>
+    </element>
+  </define>
+  <define name="diagnostics">
+    <element name="diagnostics">
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <ref name="inclusion"/>
+        </zeroOrMore>
+        <zeroOrMore>
+          <ref name="diagnostic"/>
+        </zeroOrMore>
+      </interleave>
+    </element>
+  </define>
+  <define name="dir">
+    <element name="dir">
+      <optional>
+        <attribute name="value">
+          <choice>
+            <value>ltr</value>
+            <value>rtl</value>
+          </choice>
+        </attribute>
+      </optional>
+      <interleave>
+        <ref name="foreign"/>
+        <text/>
+      </interleave>
+    </element>
+  </define>
+  <define name="emph">
+    <element name="emph">
+      <text/>
+    </element>
+  </define>
+  <define name="extends">
+    <element name="extends">
+      <attribute name="rule">
+        <data type="IDREF"/>
+      </attribute>
+      <ref name="foreign-empty"/>
+    </element>
+  </define>
+  <define name="let">
+    <element name="let">
+      <attribute name="name">
+        <ref name="nameValue"/>
+      </attribute>
+      <attribute name="value">
+        <data type="string" datatypeLibrary=""/>
+      </attribute>
+    </element>
+  </define>
+  <define name="name">
+    <element name="name">
+      <optional>
+        <attribute name="path">
+          <ref name="pathValue"/>
+        </attribute>
+      </optional>
+      <ref name="foreign-empty"/>
+    </element>
+  </define>
+  <define name="ns">
+    <element name="ns">
+      <attribute name="uri">
+        <ref name="uriValue"/>
+      </attribute>
+      <attribute name="prefix">
+        <ref name="nameValue"/>
+      </attribute>
+      <ref name="foreign-empty"/>
+    </element>
+  </define>
+  <define name="p">
+    <element name="p">
+      <optional>
+        <attribute name="id">
+          <data type="ID"/>
+        </attribute>
+      </optional>
+      <optional>
+        <attribute name="class">
+          <ref name="classValue"/>
+        </attribute>
+      </optional>
+      <optional>
+        <attribute name="icon">
+          <ref name="uriValue"/>
+        </attribute>
+      </optional>
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <choice>
+            <text/>
+            <ref name="dir"/>
+            <ref name="emph"/>
+            <ref name="span"/>
+          </choice>
+        </zeroOrMore>
+      </interleave>
+    </element>
+  </define>
+  <define name="param">
+    <element name="param">
+      <attribute name="name">
+        <ref name="nameValue"/>
+      </attribute>
+      <attribute name="value">
+        <ref name="non-empty-string"/>
+      </attribute>
+    </element>
+  </define>
+  <define name="pattern">
+    <element name="pattern">
+      <ref name="rich"/>
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <ref name="inclusion"/>
+        </zeroOrMore>
+        <choice>
+          <group>
+            <attribute name="abstract">
+              <value>true</value>
+            </attribute>
+            <attribute name="id">
+              <data type="ID"/>
+            </attribute>
+            <optional>
+              <ref name="title"/>
+            </optional>
+            <group>
+              <zeroOrMore>
+                <ref name="p"/>
+              </zeroOrMore>
+              <zeroOrMore>
+                <ref name="let"/>
+              </zeroOrMore>
+              <zeroOrMore>
+                <ref name="rule"/>
+              </zeroOrMore>
+            </group>
+          </group>
+          <group>
+            <optional>
+              <attribute name="abstract">
+                <value>false</value>
+              </attribute>
+            </optional>
+            <optional>
+              <attribute name="id">
+                <data type="ID"/>
+              </attribute>
+            </optional>
+            <optional>
+              <ref name="title"/>
+            </optional>
+            <group>
+              <zeroOrMore>
+                <ref name="p"/>
+              </zeroOrMore>
+              <zeroOrMore>
+                <ref name="let"/>
+              </zeroOrMore>
+              <zeroOrMore>
+                <ref name="rule"/>
+              </zeroOrMore>
+            </group>
+          </group>
+          <group>
+            <optional>
+              <attribute name="abstract">
+                <value>false</value>
+              </attribute>
+            </optional>
+            <attribute name="is-a">
+              <data type="IDREF"/>
+            </attribute>
+            <optional>
+              <attribute name="id">
+                <data type="ID"/>
+              </attribute>
+            </optional>
+            <optional>
+              <ref name="title"/>
+            </optional>
+            <group>
+              <zeroOrMore>
+                <ref name="p"/>
+              </zeroOrMore>
+              <zeroOrMore>
+                <ref name="param"/>
+              </zeroOrMore>
+            </group>
+          </group>
+        </choice>
+      </interleave>
+    </element>
+  </define>
+  <define name="phase">
+    <element name="phase">
+      <attribute name="id">
+        <data type="ID"/>
+      </attribute>
+      <ref name="rich"/>
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <ref name="inclusion"/>
+        </zeroOrMore>
+        <group>
+          <zeroOrMore>
+            <ref name="p"/>
+          </zeroOrMore>
+          <zeroOrMore>
+            <ref name="let"/>
+          </zeroOrMore>
+          <zeroOrMore>
+            <ref name="active"/>
+          </zeroOrMore>
+        </group>
+      </interleave>
+    </element>
+  </define>
+  <define name="report">
+    <element name="report">
+      <attribute name="test">
+        <ref name="exprValue"/>
+      </attribute>
+      <optional>
+        <attribute name="flag">
+          <ref name="flagValue"/>
+        </attribute>
+      </optional>
+      <optional>
+        <attribute name="id">
+          <data type="ID"/>
+        </attribute>
+      </optional>
+      <optional>
+        <attribute name="diagnostics">
+          <data type="IDREFS"/>
+        </attribute>
+      </optional>
+      <ref name="rich"/>
+      <ref name="linkable"/>
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <choice>
+            <text/>
+            <ref name="name"/>
+            <ref name="value-of"/>
+            <ref name="emph"/>
+            <ref name="dir"/>
+            <ref name="span"/>
+          </choice>
+        </zeroOrMore>
+      </interleave>
+    </element>
+  </define>
+  <define name="rule">
+    <element name="rule">
+      <optional>
+        <attribute name="flag">
+          <ref name="flagValue"/>
+        </attribute>
+      </optional>
+      <ref name="rich"/>
+      <ref name="linkable"/>
+      <interleave>
+        <ref name="foreign"/>
+        <zeroOrMore>
+          <ref name="inclusion"/>
+        </zeroOrMore>
+        <choice>
+          <group>
+            <attribute name="abstract">
+              <value>true</value>
+            </attribute>
+            <attribute name="id">
+              <data type="ID"/>
+            </attribute>
+            <zeroOrMore>
+              <ref name="let"/>
+            </zeroOrMore>
+            <oneOrMore>
+              <choice>
+                <ref name="assert"/>
+                <ref name="report"/>
+                <ref name="extends"/>
+              </choice>
+            </oneOrMore>
+          </group>
+          <group>
+            <attribute name="context">
+              <ref name="pathValue"/>
+            </attribute>
+            <optional>
+              <attribute name="id">
+                <data type="ID"/>
+              </attribute>
+            </optional>
+            <optional>
+              <attribute name="abstract">
+                <value>false</value>
+              </attribute>
+            </optional>
+            <zeroOrMore>
+              <ref name="let"/>
+            </zeroOrMore>
+            <oneOrMore>
+              <choice>
+                <ref name="assert"/>
+                <ref name="report"/>
+                <ref name="extends"/>
+              </choice>
+            </oneOrMore>
+          </group>
+        </choice>
+      </interleave>
+    </element>
+  </define>
+  <define name="span">
+    <element name="span">
+      <attribute name="class">
+        <ref name="classValue"/>
+      </attribute>
+      <interleave>
+        <ref name="foreign"/>
+        <text/>
+      </interleave>
+    </element>
+  </define>
+  <define name="title">
+    <element name="title">
+      <zeroOrMore>
+        <choice>
+          <text/>
+          <ref name="dir"/>
+        </choice>
+      </zeroOrMore>
+    </element>
+  </define>
+  <define name="value-of">
+    <element name="value-of">
+      <attribute name="select">
+        <ref name="pathValue"/>
+      </attribute>
+      <ref name="foreign-empty"/>
+    </element>
+  </define>
+  <!-- common declarations -->
+  <define name="inclusion">
+    <element name="include">
+      <attribute name="href">
+        <ref name="uriValue"/>
+      </attribute>
+    </element>
+  </define>
+  <define name="rich">
+    <optional>
+      <attribute name="icon">
+        <ref name="uriValue"/>
+      </attribute>
+    </optional>
+    <optional>
+      <attribute name="see">
+        <ref name="uriValue"/>
+      </attribute>
+    </optional>
+    <optional>
+      <attribute name="fpi">
+        <ref name="fpiValue"/>
+      </attribute>
+    </optional>
+    <optional>
+      <attribute name="xml:lang">
+        <ref name="langValue"/>
+      </attribute>
+    </optional>
+    <optional>
+      <attribute name="xml:space">
+        <choice>
+          <value>preserve</value>
+          <value>default</value>
+        </choice>
+      </attribute>
+    </optional>
+  </define>
+  <define name="linkable">
+    <optional>
+      <attribute name="role">
+        <ref name="roleValue"/>
+      </attribute>
+    </optional>
+    <optional>
+      <attribute name="subject">
+        <ref name="pathValue"/>
+      </attribute>
+    </optional>
+  </define>
+  <define name="foreign">
+    <ref name="foreign-attributes"/>
+    <zeroOrMore>
+      <ref name="foreign-element"/>
+    </zeroOrMore>
+  </define>
+  <define name="foreign-empty">
+    <ref name="foreign-attributes"/>
+  </define>
+  <define name="foreign-attributes">
+    <zeroOrMore>
+      <attribute>
+        <anyName>
+          <except>
+            <nsName ns=""/>
+            <nsName ns="http://www.w3.org/XML/1998/namespace"/>
+          </except>
+        </anyName>
+      </attribute>
+    </zeroOrMore>
+  </define>
+  <define name="foreign-element">
+    <element>
+      <anyName>
+        <except>
+          <nsName/>
+        </except>
+      </anyName>
+      <zeroOrMore>
+        <choice>
+          <attribute>
+            <anyName/>
+          </attribute>
+          <ref name="foreign-element"/>
+          <ref name="schema"/>
+          <text/>
+        </choice>
+      </zeroOrMore>
+    </element>
+  </define>
+  <!-- Data types -->
+  <define name="uriValue">
+    <data type="anyURI"/>
+  </define>
+  <define name="pathValue">
+    <data type="string" datatypeLibrary=""/>
+  </define>
+  <define name="exprValue">
+    <data type="string" datatypeLibrary=""/>
+  </define>
+  <define name="fpiValue">
+    <data type="string" datatypeLibrary=""/>
+  </define>
+  <define name="langValue">
+    <data type="language"/>
+  </define>
+  <define name="roleValue">
+    <data type="string" datatypeLibrary=""/>
+  </define>
+  <define name="flagValue">
+    <data type="string" datatypeLibrary=""/>
+  </define>
+  <define name="nameValue">
+    <data type="string" datatypeLibrary=""/>
+  </define>
+  <!-- In the default query language binding, xsd:NCNAME -->
+  <define name="classValue">
+    <data type="string" datatypeLibrary=""/>
+  </define>
+  <define name="non-empty-string">
+    <data type="token">
+      <param name="minLength">1</param>
+    </data>
+  </define>
+</grammar>
diff --git a/lib/lxml/isoschematron/resources/xsl/RNG2Schtrn.xsl b/lib/lxml/isoschematron/resources/xsl/RNG2Schtrn.xsl
new file mode 100644
index 00000000..21a5d2a0
--- /dev/null
+++ b/lib/lxml/isoschematron/resources/xsl/RNG2Schtrn.xsl
@@ -0,0 +1,75 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+	Stylesheet for extracting Schematron information from a RELAX-NG schema.
+	Based on the stylesheet for extracting Schematron information from W3C XML Schema.
+	Created by Eddie Robertsson 2002/06/01
+        2009/12/10      hj: changed Schematron namespace to ISO URI (Holger Joukl)
+-->
+<xsl:transform version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform" 
+xmlns:sch="http://purl.oclc.org/dsdl/schematron" xmlns:rng="http://relaxng.org/ns/structure/1.0">
+	<!-- Set the output to be XML with an XML declaration and use indentation -->
+	<xsl:output method="xml" omit-xml-declaration="no" indent="yes" standalone="yes"/>
+	<!-- -->
+	<!-- match schema and call recursive template to extract included schemas -->
+	<!-- -->
+	<xsl:template match="/rng:grammar | /rng:element">
+		<!-- entry point for a RELAX NG schema whose document element is rng:grammar or rng:element: call the schema gathering template ... -->
+		<xsl:call-template name="gatherSchema">
+			<!-- ... with current node as the $schemas parameter ... -->
+			<xsl:with-param name="schemas" select="."/>
+			<!-- ... and the documents referenced by rng:include/@href and rng:externalRef/@href as the $includes parameter -->
+			<xsl:with-param name="includes" select="document(/rng:grammar/rng:include/@href
+| //rng:externalRef/@href)"/>
+		</xsl:call-template>
+	</xsl:template>
+	<!-- -->
+	<!-- gather all included schemas into a single parameter variable -->
+	<!-- -->
+	<xsl:template name="gatherSchema">
+		<xsl:param name="schemas"/>
+		<xsl:param name="includes"/>
+		<xsl:choose>
+			<xsl:when test="count($schemas) &lt; count($schemas | $includes)">
+				<!-- the union is larger than $schemas, i.e. $includes contains something new, so recurse ... -->
+				<xsl:call-template name="gatherSchema">
+					<!-- ... with current $includes added to the $schemas parameter ... -->
+					<xsl:with-param name="schemas" select="$schemas | $includes"/>
+					<!-- ... and the documents referenced from the current $includes as the new $includes parameter -->
+					<xsl:with-param name="includes" select="document($includes/rng:grammar/rng:include/@href
+| $includes//rng:externalRef/@href)"/>
+				</xsl:call-template>
+			</xsl:when>
+			<xsl:otherwise>
+				<!-- nothing new was found: we have the complete set of included schemas, so now let's output the embedded schematron -->
+				<xsl:call-template name="output">
+					<xsl:with-param name="schemas" select="$schemas"/>
+				</xsl:call-template>
+			</xsl:otherwise>
+		</xsl:choose>
+	</xsl:template>
+	<!-- -->
+	<!-- output the schematron information -->
+	<!-- -->
+	<xsl:template name="output">
+		<xsl:param name="schemas"/>
+		<!-- $schemas: node-set with the main schema plus every gathered include; one merged sch:schema is written from it -->
+		<sch:schema>
+			<!-- get header-type elements - eg title and especially ns -->
+			<!-- title (just one): the parentheses make [1] pick the first sch:title of the whole node-set; an unparenthesized //sch:title[1] selects every sch:title that is first within its own parent -->
+			<xsl:copy-of select="($schemas//sch:title)[1]"/>
+			<!-- get remaining schematron schema children -->
+			<!-- get namespace elements, dropping duplicates: only the first sch:ns found for each @prefix is copied -->
+			<xsl:for-each select="$schemas//sch:ns">
+				<xsl:if test="generate-id(.) = generate-id($schemas//sch:ns[@prefix = current()/@prefix][1])">
+					<xsl:copy-of select="."/>
+				</xsl:if>
+			</xsl:for-each>
+			<xsl:copy-of select="$schemas//sch:phase"/>
+			<xsl:copy-of select="$schemas//sch:pattern"/>
+			<sch:diagnostics>
+				<xsl:copy-of select="$schemas//sch:diagnostics/*"/>
+			</sch:diagnostics>
+		</sch:schema>
+	</xsl:template>
+	<!-- -->
+</xsl:transform>
diff --git a/lib/lxml/isoschematron/resources/xsl/XSD2Schtrn.xsl b/lib/lxml/isoschematron/resources/xsl/XSD2Schtrn.xsl
new file mode 100644
index 00000000..17f23dec
--- /dev/null
+++ b/lib/lxml/isoschematron/resources/xsl/XSD2Schtrn.xsl
@@ -0,0 +1,77 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+        based on an original transform by Eddie Robertsson
+        2001/04/21      fn: added support for included schemas
+        2001/06/27      er: changed XML Schema prefix from xsd: to xs: and changed to the Rec namespace
+        2009/12/10      hj: changed Schematron namespace to ISO URI (Holger Joukl)
+-->
+<xsl:transform version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform" 
+xmlns:sch="http://purl.oclc.org/dsdl/schematron" xmlns:xs="http://www.w3.org/2001/XMLSchema">
+        <!-- Set the output to be XML with an XML declaration and use indentation -->
+        <xsl:output method="xml" omit-xml-declaration="no" indent="yes" standalone="yes"/>
+        <!-- -->
+        <!-- match schema and call recursive template to extract included schemas -->
+        <!-- -->
+        <xsl:template match="xs:schema">
+                <!-- entry point for a W3C XML Schema: call the schema gathering template ... -->
+                <xsl:call-template name="gatherSchema">
+                        <!-- ... with the current document root as the $schemas parameter ... -->
+                        <xsl:with-param name="schemas" select="/"/>
+                        <!-- ... and the documents referenced by xs:include, xs:import and xs:redefine (@schemaLocation) as the $includes parameter -->
+                        <xsl:with-param name="includes" 
+						select="document(/xs:schema/xs:*[self::xs:include or self::xs:import or self::xs:redefine]/@schemaLocation)"/>
+                </xsl:call-template>
+        </xsl:template>
+        <!-- -->
+        <!-- gather all included schemas into a single parameter variable -->
+        <!-- -->
+        <xsl:template name="gatherSchema">
+                <xsl:param name="schemas"/>
+                <xsl:param name="includes"/>
+                <xsl:choose>
+                        <xsl:when test="count($schemas) &lt; count($schemas | $includes)">
+                                <!-- the union is larger than $schemas, i.e. $includes contains something new, so recurse ... -->
+                                <xsl:call-template name="gatherSchema">
+                                        <!-- ... with current $includes added to the $schemas parameter ... -->
+                                        <xsl:with-param name="schemas" select="$schemas | $includes"/>
+                                        <!-- ... and the documents referenced from the current $includes as the new $includes parameter -->
+                                        <xsl:with-param name="includes" 
+										select="document($includes/xs:schema/xs:*[self::xs:include or self::xs:import or self::xs:redefine]/@schemaLocation)"/>
+                                </xsl:call-template>
+                        </xsl:when>
+                        <xsl:otherwise>
+                                <!-- nothing new was found: we have the complete set of included schemas, 
+								so now let's output the embedded schematron -->
+                                <xsl:call-template name="output">
+                                        <xsl:with-param name="schemas" select="$schemas"/>
+                                </xsl:call-template>
+                        </xsl:otherwise>
+                </xsl:choose>
+        </xsl:template>
+        <!-- -->
+        <!-- output the schematron information -->
+        <!-- -->
+        <xsl:template name="output">
+                <xsl:param name="schemas"/>
+                <!-- $schemas: node-set with the main schema plus every gathered include; one merged sch:schema is written from it -->
+                <sch:schema>
+                        <!-- get header-type elements - eg title and especially ns -->
+                        <!-- title (just one): the parentheses make [1] pick the first embedded sch:title of the whole node-set; an unparenthesized .../sch:title[1] selects the first sch:title of every xs:appinfo -->
+                        <xsl:copy-of select="($schemas//xs:appinfo/sch:title)[1]"/>
+                        <!-- get remaining schematron schema children -->
+                        <!-- get namespace elements, dropping duplicates: only the first sch:ns found for each @prefix is copied -->
+                        <xsl:for-each select="$schemas//xs:appinfo/sch:ns">
+                                <xsl:if test="generate-id(.) = 
+								generate-id($schemas//xs:appinfo/sch:ns[@prefix = current()/@prefix][1])">
+                                        <xsl:copy-of select="."/>
+                                </xsl:if>
+                        </xsl:for-each>
+                        <xsl:copy-of select="$schemas//xs:appinfo/sch:phase"/>
+                        <xsl:copy-of select="$schemas//xs:appinfo/sch:pattern"/>
+                        <sch:diagnostics>
+                                <xsl:copy-of select="$schemas//xs:appinfo/sch:diagnostics/*"/>
+                        </sch:diagnostics>
+                </sch:schema>
+        </xsl:template>
+        <!-- -->
+</xsl:transform>
diff --git a/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_abstract_expand.xsl b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_abstract_expand.xsl
new file mode 100644
index 00000000..057c7c1f
--- /dev/null
+++ b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_abstract_expand.xsl
@@ -0,0 +1,296 @@
+<?xml version="1.0" encoding="UTF-8"?><?xar XSLT?>
+
+<!-- 
+     OVERVIEW - iso_abstract_expand.xsl
+     
+	    This is a preprocessor for ISO Schematron, which implements abstract patterns. 
+	    It also 
+	       	* extracts a particular schema using an ID, where there are multiple 
+	    schemas, such as when they are embedded in the same NVDL script 
+	    	* experimentally, allows parameter recognition and substitution inside
+	    	text as well as @context, @test, & @select.
+		
+		
+		This should be used after iso-dsdl-include.xsl and before the skeleton or
+		meta-stylesheet (e.g. iso-svrl.xsl) . It only requires XSLT 1.
+		 
+		Each kind of inclusion can be turned off (or on) on the command line.
+		 
+-->
+<!-- 
+  VERSION INFORMATION
+  2008-09-18 RJ
+  		* move out param test from iso:schema template  to work with XSLT 1. (Noah Fontes)
+  		
+  2008-07-29 RJ 
+  		* Create.  Pull out as distinct XSL in its own namespace from old iso_pre_pro.xsl
+  		* Put everything in private namespace
+  		* Rewrite replace_substring named template so that copyright is clear
+  	
+  2008-07-24 RJ
+       * correct abstract patterns to use the correct names: param/@name and
+     param/@value
+    
+  2007-01-12  RJ 
+     * Use ISO namespace
+     * Use pattern/@id not  pattern/@name 
+     * Add Oliver Becker's suggestions from old Schematron-love-in list for <copy> 
+     * Add XT -ism?
+  2003 RJ
+     * Original written for old namespace
+     * http://www.topologi.com/resources/iso-pre-pro.xsl
+-->	
+<!--
+ LEGAL INFORMATION
+ 
+ Copyright (c) 2000-2008 Rick Jelliffe and Academia Sinica Computing Center, Taiwan
+
+ This software is provided 'as-is', without any express or implied warranty. 
+ In no event will the authors be held liable for any damages arising from 
+ the use of this software.
+
+ Permission is granted to anyone to use this software for any purpose, 
+ including commercial applications, and to alter it and redistribute it freely,
+ subject to the following restrictions:
+
+ 1. The origin of this software must not be misrepresented; you must not claim
+ that you wrote the original software. If you use this software in a product, 
+ an acknowledgment in the product documentation would be appreciated but is 
+ not required.
+
+ 2. Altered source versions must be plainly marked as such, and must not be 
+ misrepresented as being the original software.
+
+ 3. This notice may not be removed or altered from any source distribution.
+-->
+<xslt:stylesheet version="1.0" xmlns:xslt="http://www.w3.org/1999/XSL/Transform" 
+	xmlns:xsl="http://www.w3.org/1999/XSL/Transform" 
+    xmlns:iso="http://purl.oclc.org/dsdl/schematron"  
+    xmlns:nvdl="http://purl.oclc.org/dsdl/nvdl"  
+    
+  
+    xmlns:iae="http://www.schematron.com/namespace/iae" 
+     
+      >
+	
+	<xslt:param name="schema-id"></xslt:param>
+	
+	
+	<!-- Driver: process the document root in the iae:go mode, so that only templates declared with mode="iae:go" (and the built-in rules) handle the document -->
+	<xsl:template match="/">
+  		<xsl:apply-templates select="." mode="iae:go" />
+	</xsl:template> 
+	
+	
+	<!-- ================================================================================== -->
+	<!-- Normal processing rules                                                            -->
+	<!-- ================================================================================== -->
+	<!-- Output only the selected schema: copied when $schema-id is empty or equals its @id, dropped otherwise. Altered from the original source: mode="iae:go" added, because the driver processes the document in that mode and the mode-less template was never applied (so $schema-id had no effect) --> 
+	<xslt:template match="iso:schema" mode="iae:go" >
+	    <xsl:if test="string-length($schema-id) =0 or @id= $schema-id ">
+	    	<xslt:copy>
+				<xslt:copy-of select="@*" />
+				<xslt:apply-templates  mode="iae:go" /> 
+			</xslt:copy>
+		</xsl:if>
+	</xslt:template>
+	
+ 
+	<!-- Strip out any foreign elements above the Schematron schema: an element that is not in the
+		iso namespace and has no iso ancestor is not copied itself, only its children are processed. -->
+	<xslt:template match="*[not(ancestor-or-self::iso:*)]"     mode="iae:go"  >
+	   <xslt:apply-templates  mode="iae:go" />
+	</xslt:template>
+	   
+	
+	<!-- ================================================================================== -->
+	<!-- Handle Schematron abstract pattern preprocessing                                   -->
+	<!-- abstract-to-real calls
+			do-pattern calls 
+				macro-expand calls 
+					multi-macro-expand
+						replace-substring                                                   -->
+	<!-- ================================================================================== -->
+	
+	<!--
+		Abstract patterns allow you to say, for example
+		
+		<pattern name="htmlTable" is-a="table">
+			<param name="row" value="html:tr"/>
+			<param name="cell" value="html:td" />
+			<param name="table" value="html:table" />
+		</pattern>
+		
+		For a good introduction, see Uche Ogbuji's article for IBM DeveloperWorks
+		"Discover the flexibility of Schematron abstract patterns"
+		  http://www-128.ibm.com/developerworks/xml/library/x-stron.html
+		However, note that ISO Schematron uses @name and @value attributes on
+		the iso:param element, and @id not @name on the pattern element.
+		
+	-->
+	
+	<!-- Suppress declarations of abstract patterns: only a marker comment naming the pattern's @id is output in their place -->
+	<xslt:template match="iso:pattern[@abstract='true']"  mode="iae:go"  >
+		<xslt:comment>Suppressed abstract pattern <xslt:value-of select="@id"/> was here</xslt:comment>	
+	</xslt:template> 
+	
+	
+	<!-- Expand uses of abstract patterns: a pattern with @is-a is replaced by a marker comment followed by the output of iae:abstract-to-real -->
+	<xslt:template match="iso:pattern[@is-a]"  mode="iae:go" >
+			
+		<xslt:comment>Start pattern based on abstract <xslt:value-of select="@is-a"/></xslt:comment>
+		
+		<xslt:call-template name="iae:abstract-to-real" >
+			<xslt:with-param name="caller" select="@id" />
+			<xslt:with-param name="is-a" select="@is-a" />
+		</xslt:call-template>
+			
+	</xslt:template>
+	 
+	 
+	
+	<!-- Fallback (priority -1): copy every other element with its attributes and process its children in the same mode -->
+	<xslt:template match="*" priority="-1"  mode="iae:go" >
+	    <xslt:copy>
+			<xslt:copy-of select="@*" />
+			<xslt:apply-templates mode="iae:go"/> 
+		</xslt:copy>
+	</xslt:template>
+	
+	<!-- Templates for macro expansion of abstract patterns -->
+	<!-- Sets up the initial conditions for the recursive call: starts iae:multi-macro-expand on $text at paramNumber 1, passing $caller through -->
+	<xslt:template name="iae:macro-expand">
+		<xslt:param name="caller"/>
+		<xslt:param name="text" />
+		<xslt:call-template name="iae:multi-macro-expand">
+			<xslt:with-param name="caller" select="$caller"/>
+			<xslt:with-param name="text" select="$text"/>
+			<xslt:with-param name="paramNumber" select="1"/>
+		</xslt:call-template>
+		
+	</xslt:template>
+	
+	<!-- Template to replace the current parameter and then
+	   recurse to replace subsequent parameters. -->
+	<!-- $caller: @id of the pattern whose iso:param children are used; $text: string to expand; $paramNumber: position of the iso:param handled in this step -->
+	<xslt:template name="iae:multi-macro-expand">
+		<xslt:param name="caller"/>
+		<xslt:param name="text" />
+		<xslt:param name="paramNumber" />
+
+		
+		<xslt:choose>
+			<xslt:when test="//iso:pattern[@id=$caller]/iso:param[ $paramNumber]">
+				<!-- the calling pattern has a param at this position: recurse for the next position with the substituted text -->
+				<xslt:call-template name="iae:multi-macro-expand">
+					<xslt:with-param name="caller" select="$caller"/>	
+					<xslt:with-param name="paramNumber" select="$paramNumber + 1"/>		
+					<xslt:with-param name="text" >
+						<xslt:call-template name="iae:replace-substring">
+							<xslt:with-param name="original" select="$text"/>
+							<xslt:with-param name="substring"
+							select="concat('$', //iso:pattern[@id=$caller]/iso:param[ $paramNumber ]/@name)"/>
+							<xslt:with-param name="replacement"
+								select="//iso:pattern[@id=$caller]/iso:param[ $paramNumber ]/@value"/>			
+						</xslt:call-template>
+					</xslt:with-param>						
+				</xslt:call-template>
+			</xslt:when>
+			<xslt:otherwise><xslt:value-of select="$text" /></xslt:otherwise>		
+			<!-- no param at this position: the recursion ends and $text is output as it is -->
+		</xslt:choose>
+	</xslt:template>
+	
+	
+	<!-- generate the real pattern from an abstract pattern + parameters-->
+	<xslt:template name="iae:abstract-to-real">
+		<xslt:param name="caller"/>
+		<xslt:param name="is-a"/>
+		<!-- Copy the pattern whose id equals $is-a; its id becomes $caller, or a generated id if $caller is empty -->
+		<xslt:for-each select="//iso:pattern[@id = $is-a]">
+			<xslt:copy>
+				<xslt:attribute name="id">
+					<xslt:choose>
+						<xslt:when test="string-length($caller) != 0">
+							<xslt:value-of select="$caller"/>
+						</xslt:when>
+						<xslt:otherwise>
+							<xslt:value-of select="concat(generate-id(.), $is-a)"/>
+						</xslt:otherwise>
+					</xslt:choose>
+				</xslt:attribute>
+				<xslt:apply-templates select="text() | *" mode="iae:do-pattern">
+					<xslt:with-param name="caller"><xslt:value-of select="$caller"/></xslt:with-param>
+				</xslt:apply-templates>
+			</xslt:copy>
+		</xslt:for-each>
+	</xslt:template>
+		
+	
+	<!-- Generate a non-abstract pattern -->
+	<xslt:template match="*" mode="iae:do-pattern">
+		<xslt:param name="caller"/>
+		<xslt:copy>
+			<!-- test, context and select attributes get the caller's parameter values substituted -->
+			<xslt:for-each select="@*[name()='test' or name()='context' or name()='select']">
+				<xslt:attribute name="{name()}">
+					<xslt:call-template name="iae:macro-expand">
+						<xslt:with-param name="caller"><xslt:value-of select="$caller"/></xslt:with-param>
+						<xslt:with-param name="text"><xslt:value-of select="."/></xslt:with-param>
+					</xslt:call-template>
+				</xslt:attribute>
+			</xslt:for-each>
+			<xslt:copy-of select="@*[not(name()='test' or name()='context' or name()='select')]"/>
+			<xsl:for-each select="node()">
+				<xsl:choose>
+					<!-- Non-text children are processed recursively in this same mode -->
+					<xsl:when test="not(self::text())">
+						<xslt:apply-templates select="." mode="iae:do-pattern">
+							<xslt:with-param name="caller"><xslt:value-of select="$caller"/></xslt:with-param>
+						</xslt:apply-templates>
+					</xsl:when>
+					<!-- Experiment: text is macro-expanded too, allowing parameterized assertions without extra iso:value-of calls -->
+					<xsl:otherwise>
+						<xslt:call-template name="iae:macro-expand">
+							<xslt:with-param name="caller"><xslt:value-of select="$caller"/></xslt:with-param>
+							<xslt:with-param name="text"><xslt:value-of select="."/></xslt:with-param>
+						</xslt:call-template>
+					</xsl:otherwise>
+				</xsl:choose>
+			</xsl:for-each>
+		</xslt:copy>
+	</xslt:template>
+	
+	<!-- UTILITIES --> 
+	<!-- Simple version of replace-substring function -->
+	<xslt:template name="iae:replace-substring">
+		<xslt:param name="original"/>
+		<xslt:param name="substring"/>
+		<xslt:param name="replacement" select="''"/>
+		<!-- Emits $original with every occurrence of $substring swapped for $replacement -->
+		<xsl:choose>
+			<!-- $original tests false (e.g. an empty string): emit nothing -->
+			<xsl:when test="not($original)"/>
+			<!-- an empty search string cannot be replaced: emit the input as is -->
+			<xsl:when test="not(string($substring))">
+				<xsl:value-of select="$original"/>
+			</xsl:when>
+			<xsl:when test="contains($original, $substring)">
+				<!-- text before the first occurrence, then the replacement -->
+				<xsl:value-of select="substring-before($original, $substring)"/>
+				<xsl:value-of select="$replacement"/>
+				<!-- the remainder may hold further occurrences: recurse on it -->
+				<xsl:call-template name="iae:replace-substring">
+					<xsl:with-param name="original" select="substring-after($original, $substring)"/>
+					<xsl:with-param name="substring" select="$substring"/>
+					<xsl:with-param name="replacement" select="$replacement"/>
+				</xsl:call-template>
+			</xsl:when>
+			<!-- no occurrence left: emit the input as is -->
+			<xsl:otherwise>
+				<xsl:value-of select="$original"/>
+			</xsl:otherwise>
+		</xsl:choose>
+	</xslt:template>
+
+</xslt:stylesheet>
\ No newline at end of file
diff --git a/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_dsdl_include.xsl b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_dsdl_include.xsl
new file mode 100644
index 00000000..44e5573b
--- /dev/null
+++ b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_dsdl_include.xsl
@@ -0,0 +1,1160 @@
+<?xml version="1.0" encoding="UTF-8"?><?xar XSLT?>
+
+<!-- 
+     OVERVIEW : iso_dsdl_include.xsl
+     
+	    This is an inclusion preprocessor for the non-smart text inclusions
+	    of ISO DSDL. It handles 
+	    	<relax:extRef> for ISO RELAX NG
+	    	<sch:include>  for ISO Schematron and Schematron 1.n
+	    	<sch:extends>  for 2009 draft ISO Schematron
+	    	<xi:xinclude>  simple W3C XIncludes for ISO NVRL and DSRL 
+	    	<crdl:ref>     for draft ISO CRDL
+	    	<dtll:include> for draft ISO DTLL
+	    	<* @xlink:href> for simple W3C XLink 1.1 embedded links
+	    	
+		 
+		This should be the first in any chain of processing. It only requires
+		XSLT 1. Each kind of inclusion can be turned off (or on) on the command line.
+		
+		Ids in fragment identifiers or xpointers will be sought in the following
+		order:
+		    * @xml:id
+		    * id() for typed schemas (e.g. from DTD) [NOTE: XInclude does not support this]
+		    * untyped @id 
+		    
+	The proposed behaviour for the update to ISO Schematron has been implemented. If an
+	include points to an element with the same name as the parent, then that element's
+	contents will be included. This supports the merge style of inclusion.    
+	
+	When an inclusion is made, it is preceded by a PI with target DSDL_INCLUDE_START
+	and the href and closed by a PI with target DSDL_INCLUDE_END and the href. This is
+	to allow better location of problems, though only to the file level. 
+	
+	Limitations:
+	* No rebasing: relative paths will be interpreted based on the initial document's
+	path, not the including document. (Severe limitation!)
+	* No checking for circular references
+	* Not full xpointers: only ID matching
+	* <relax:include> not implemented 
+	* XInclude handling of xml:base and xml:lang not implemented   
+-->
+<!-- 
+  VERSION INFORMATION
+	2009-02-25 
+	* Update DSDL namespace to use schematron.com
+	* Tested with SAXON9, Xalan 2.7.1, IE7, 
+	* IE does not like multiple variables in same template with same name: rename.   
+	2008-09-18
+	* Remove new behaviour for include, because it conflicts with existing usage [KH]
+	* Add extends[@href] element with that merge functionality
+	* Generate PIs to notate source of inclusions for potential better diagnostics
+	
+	2008-09-16
+	* Fix for XSLT1
+	
+	2008-08-28
+	* New behaviour for schematron includes: if the pointed to element is the same as the current,
+	include the children.
+	
+	2008-08-20
+	* Fix bug: in XSLT1 cannot do $document/id('x') but need to use for-each
+	
+	2008-08-04
+	* Add support for inclusions in old namespace  
+	
+	2008-08-03
+	* Fix wrong param name include-relaxng & include-crdl (KH, PH)
+	* Allow inclusion of XSLT and XHTML (KH)
+	* Fix inclusion of fragments (KH)
+	
+	2008-07-25
+	* Add selectable input parameter
+	
+	2008-07-24  
+	* RJ New
+-->
+<!--
+	LEGAL INFORMATION
+	
+	Copyright (c) 2008 Rick Jelliffe 
+	
+	This software is provided 'as-is', without any express or implied warranty. 
+	In no event will the authors be held liable for any damages arising from 
+	the use of this software.
+	
+	Permission is granted to anyone to use this software for any purpose, 
+	including commercial applications, and to alter it and redistribute it freely,
+	subject to the following restrictions:
+	
+	1. The origin of this software must not be misrepresented; you must not claim
+	that you wrote the original software. If you use this software in a product, 
+	an acknowledgment in the product documentation would be appreciated but is 
+	not required.
+	
+	2. Altered source versions must be plainly marked as such, and must not be 
+	misrepresented as being the original software.
+	
+	3. This notice may not be removed or altered from any source distribution.
+-->
+<xslt:stylesheet version="1.0"
+	xmlns:xslt="http://www.w3.org/1999/XSL/Transform"
+	xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+	xmlns:iso="http://purl.oclc.org/dsdl/schematron"
+	xmlns:nvdl="http://purl.oclc.org/dsdl/nvdl"
+	xmlns:xhtml="http://www.w3.org/1999/xhtml"
+	xmlns:schold="http://www.ascc.net/xml/schematron"
+	xmlns:crdl="http://purl.oclc.org/dsdl/crepdl/ns/structure/1.0"
+	xmlns:xi="http://www.w3.org/2001/XInclude"
+	xmlns:dtll="http://www.jenitennison.com/datatypes"
+	xmlns:dsdl="http://www.schematron.com/namespace/dsdl"
+	xmlns:relax="http://relaxng.org/ns/structure/1.0"
+	xmlns:xlink="http://www.w3.org/1999/xlink">
+	<!-- Note: The URL for the dsdl namespace is not official -->
+	<!-- Switches, one per kind of inclusion, settable from the command line. A template expands -->
+	<!-- its references only when its switch equals 'true' (e.g. include-relaxng for relax:extRef). -->
+	<xsl:param name="include-schematron">true</xsl:param>
+	<xsl:param name="include-crdl">true</xsl:param>
+	<xsl:param name="include-xinclude">true</xsl:param>
+	<xsl:param name="include-dtll">true</xsl:param>
+	<xsl:param name="include-relaxng">true</xsl:param>
+	<xsl:param name="include-xlink">true</xsl:param>
+
+	<xslt:template match="/">
+		<xslt:apply-templates mode="dsdl:go" select="."/>
+	</xslt:template>
+
+	<!-- output everything else unchanged -->
+	<xsl:template mode="dsdl:go" match="node()" priority="-1">
+		<xsl:copy>
+			<xsl:copy-of select="@*"/>
+			<xsl:apply-templates select="node()" mode="dsdl:go"/>
+		</xsl:copy>
+	</xsl:template>
+
+
+
+	<!-- =========================================================== -->
+	<!-- ISO/IEC 19757 - DSDL Document Schema Definition Languages   -->
+	<!-- Part 2 - Regular grammar-based validation - RELAX NG        -->
+	<!-- This only implements relax:extRef not relax:include which   -->
+	<!-- is complex.                                                 -->
+	<!-- =========================================================== -->
+	<xslt:template match="relax:extRef" mode="dsdl:go">
+		<!-- Replaces relax:extRef by the schema, or schema fragment, that @href points to. -->
+		<!-- The output is bracketed by DSDL_INCLUDE_START and DSDL_INCLUDE_END PIs carrying the href. -->
+		<!-- Insert subschema -->
+
+		<xsl:variable name="document-uri"
+			select="substring-before(concat(@href,'#'), '#')" />
+		<xsl:variable name="fragment-id"
+			select="substring-after(@href, '#')" />
+
+		<xsl:processing-instruction name="DSDL_INCLUDE_START">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+		<xsl:choose>
+			<xsl:when test="not( $include-relaxng = 'true' )">
+				<xslt:copy>
+					<xslt:copy-of select="@*" />
+					<xslt:apply-templates mode="dsdl:go" />
+				</xslt:copy>
+			</xsl:when>
+			<xsl:otherwise>
+
+				<xsl:choose>
+
+					<xsl:when
+						test="string-length( $document-uri ) = 0 and string-length( $fragment-id ) = 0">
+						<xsl:message>
+							Error: Impossible URL in RELAX NG extRef
+							include
+						</xsl:message>
+					</xsl:when>
+
+					<!-- this case is when there is an embedded schema in the same document elsewhere -->
+					<xslt:when
+						test="string-length( $document-uri ) = 0">
+						<xslt:apply-templates mode="dsdl:go"
+							select="//*[@xml:id= $fragment-id ] | id( $fragment-id) | //*[@id= $fragment-id ]" />
+					</xslt:when>
+
+					<xsl:when
+						test="string-length( $fragment-id ) &gt; 0">
+						<xsl:variable name="theDocument_1"
+							select="document( $document-uri,/ )" />
+
+						<xsl:if test="not($theDocument_1)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- for-each makes id() search the external document; the context node is then that document, so @href is unavailable -->
+						<xsl:for-each select="$theDocument_1">
+							<xsl:variable name="theFragment_1"
+								select="$theDocument_1//*[@xml:id= $fragment-id ]
+									| id( $fragment-id)
+									| $theDocument_1//*[@id= $fragment-id ]" />
+							<xsl:if test="not($theFragment_1)">
+								<xsl:message terminate="no">
+									<xsl:text>Unable to locate id attribute: </xsl:text>
+									<xsl:value-of select="concat($document-uri, '#', $fragment-id)" />
+								</xsl:message>
+							</xsl:if>
+							<xsl:apply-templates
+								select=" $theFragment_1[1]" mode="dsdl:go" />
+						</xsl:for-each>
+					</xsl:when>
+
+					<xsl:otherwise>
+						<xsl:variable name="theDocument_2"
+							select="document( $document-uri,/ )" />
+						<xsl:variable name="theFragment_2"
+							select="$theDocument_2/*" />
+						<xsl:if test="not($theDocument_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+
+						<xsl:if test="not($theFragment_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to locate id attribute: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<xsl:apply-templates select="$theFragment_2 "
+							mode="dsdl:go" />
+					</xsl:otherwise>
+				</xsl:choose>
+
+			</xsl:otherwise>
+		</xsl:choose>
+
+		<xsl:processing-instruction name="DSDL_INCLUDE_END">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+	</xslt:template>
+
+
+
+	<!-- =========================================================== -->
+	<!-- ISO/IEC 19757 - DSDL Document Schema Definition Languages   -->
+	<!-- Part 3 - Rule-based validation - Schematron                 -->
+	<!-- =========================================================== -->
+
+
+	<!-- Extend the URI syntax to allow # references -->
+	<!-- Add experimental support for simple containers like  /xxx:xxx/iso:pattern to allow better includes -->
+	<xsl:template match="iso:include" mode="dsdl:go">
+		<!-- Replaces iso:include by the iso: element that @href refers to, bracketed by DSDL_INCLUDE_START/END PIs. -->
+		<xsl:variable name="document-uri"
+			select="substring-before(concat(@href,'#'), '#')" />
+		<xsl:variable name="fragment-id"
+			select="substring-after(@href, '#')" />
+
+
+		<xsl:processing-instruction name="DSDL_INCLUDE_START">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+
+		<xsl:choose>
+			<xsl:when test="not( $include-schematron = 'true' )">
+				<xslt:copy>
+					<xslt:copy-of select="@*" />
+					<xslt:apply-templates mode="dsdl:go" />
+				</xslt:copy>
+			</xsl:when>
+			<xsl:otherwise>
+
+				<xsl:choose>
+
+					<xsl:when
+						test="string-length( $document-uri ) = 0 and string-length( $fragment-id ) = 0">
+						<xsl:message>
+							Error: Impossible URL in Schematron include
+						</xsl:message>
+					</xsl:when>
+
+					<!-- this case is when there is an embedded schema in the same document elsewhere -->
+					<xslt:when
+						test="string-length( $document-uri ) = 0">
+						<xslt:apply-templates mode="dsdl:go"
+							select="//iso:*[@xml:id= $fragment-id ]
+								| id( $fragment-id)
+								| //iso:*[@id= $fragment-id ]" />
+					</xslt:when>
+
+					<!-- case where there is a fragment in another document (should be an iso: element) -->
+					<!-- There are three cases for includes with fragment:
+						0) No href file or no matching id - error!
+						1) REMOVED
+						
+						2) The linked-to element is sch:schema however the parent of the include
+						is not a schema. In this case, it is an error. (Actually, it should
+						be an error for other kinds of containment problems, but we won't
+						check for them in this version.)
+						
+						3) Otherwise, include the pointed-to element
+					-->
+
+					<xsl:when
+						test="string-length( $fragment-id ) &gt; 0">
+						<xsl:variable name="theDocument_1"
+							select="document( $document-uri,/ )" />
+						<!-- Inside the for-each below the context node is the external document, not this include element -->
+
+						<!-- case 0 -->
+						<xsl:if test="not($theDocument_1)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- use for-each to rebase id() to external document -->
+						<xsl:for-each select="$theDocument_1">
+							<xsl:variable name="theFragment_1"
+								select=" $theDocument_1//iso:*[@xml:id= $fragment-id ] |
+									id($fragment-id) |
+									$theDocument_1//iso:*[@id= $fragment-id ]" />
+
+
+							<xsl:choose>
+								<!-- case 0: @href is not reachable from here, so the href is rebuilt from its two parts -->
+								<xsl:when test="not($theFragment_1)">
+									<xsl:message terminate="no">
+										<xsl:text>Unable to locate id attribute: </xsl:text>
+										<xsl:value-of select="concat($document-uri, '#', $fragment-id)" />
+									</xsl:message>
+								</xsl:when>
+
+
+								<!-- case 1 REMOVED -->
+
+								<!-- case 2 -->
+								<xsl:when
+									test=" $theFragment_1/self::iso:schema ">
+									<xsl:message>
+										Schema error: Use include to
+										include fragments, not a whole
+										schema
+									</xsl:message>
+								</xsl:when>
+
+								<!-- case 3 -->
+								<xsl:otherwise>
+									<xsl:apply-templates
+										select=" $theFragment_1[1]" mode="dsdl:go" />
+								</xsl:otherwise>
+							</xsl:choose>
+						</xsl:for-each>
+					</xsl:when>
+
+					<!-- Case where there is no ID so we include the whole document -->
+					<!-- Experimental addition: include fragments of children -->
+					<xsl:otherwise>
+						<xsl:variable name="theDocument_2"
+							select="document( $document-uri,/ )" />
+						<xsl:variable name="theFragment_2"
+							select="$theDocument_2/iso:*" />
+						<xsl:variable name="theContainedFragments"
+							select="$theDocument_2/*/iso:* | $theDocument_2/*/xsl:* | $theDocument_2/*/xhtml:*" />
+						<xsl:if test="not($theDocument_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+
+						<!-- There are three cases for includes:
+							0) No text specified- error!
+							
+							1) REMOVED
+							
+							2) The linked-to element is sch:schema however the parent of the include
+							is not a schema. In this case, it is an error. (Actually, it should
+							be an error for other kinds of containment problems, but we won't
+							check for them in this version.)
+							
+							3) Otherwise, include the pointed-to element
+						-->
+						<xsl:choose>
+							<!-- case 0 -->
+							<xsl:when
+								test="not($theFragment_2) and not ($theContainedFragments)">
+								<xsl:message terminate="no">
+									<xsl:text>Unable to locate id attribute: </xsl:text>
+									<xsl:value-of select="@href" />
+								</xsl:message>
+							</xsl:when>
+
+							<!-- case 1 removed -->
+
+							<!-- case 2 -->
+							<xsl:when
+								test=" $theFragment_2/self::iso:schema or $theContainedFragments/self::iso:schema">
+								<xsl:message>
+									Schema error: Use include to include
+									fragments, not a whole schema
+								</xsl:message>
+							</xsl:when>
+
+							<!-- If this were XSLT 2, we could use  
+								if ($theFragment) then $theFragment else $theContainedFragments
+								here (thanks to KN)
+							-->
+							<!-- case 3 -->
+							<xsl:otherwise>
+								<xsl:apply-templates
+									select="$theFragment_2 " mode="dsdl:go" />
+							</xsl:otherwise>
+						</xsl:choose>
+					</xsl:otherwise>
+				</xsl:choose>
+			</xsl:otherwise>
+		</xsl:choose>
+
+		<xsl:processing-instruction name="DSDL_INCLUDE_END">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+	</xsl:template>
+
+
+	<!-- WARNING   sch:extends[@href] is experimental and non standard  -->
+	<!-- Basically, it adds the children of the selected element, not the element itself.  -->
+	<xsl:template match="iso:extends[@href]" mode="dsdl:go">
+		<!-- Replaces iso:extends by the children of the element that @href refers to, bracketed by DSDL_INCLUDE_START/END PIs. -->
+		<xsl:variable name="document-uri"
+			select="substring-before(concat(@href,'#'), '#')" />
+		<xsl:variable name="fragment-id"
+			select="substring-after(@href, '#')" />
+
+
+		<xsl:processing-instruction name="DSDL_INCLUDE_START">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+
+		<xsl:choose>
+			<xsl:when test="not( $include-schematron = 'true' )">
+				<xslt:copy>
+					<xslt:copy-of select="@*" />
+					<xslt:apply-templates mode="dsdl:go" />
+				</xslt:copy>
+			</xsl:when>
+			<xsl:otherwise>
+
+				<xsl:choose>
+
+					<xsl:when
+						test="string-length( $document-uri ) = 0 and string-length( $fragment-id ) = 0">
+						<xsl:message>
+							Error: Impossible URL in Schematron include
+						</xsl:message>
+					</xsl:when>
+
+					<!-- this case is when there is an embedded schema in the same document elsewhere -->
+					<xslt:when
+						test="string-length( $document-uri ) = 0">
+						<xslt:apply-templates mode="dsdl:go"
+							select="//iso:*[@xml:id= $fragment-id ]/*
+								| id( $fragment-id)/*
+								| //iso:*[@id= $fragment-id ]/*" />
+					</xslt:when>
+
+					<!-- case where there is a fragment in another document (should be an iso: element) -->
+					<!-- There are three cases for includes with fragment:
+						0) No href file or no matching id - error!
+						1) REMOVED
+						
+						2) REMOVED
+						
+						3) Otherwise, include the children of the pointed-to element
+					-->
+
+					<xsl:when
+						test="string-length( $fragment-id ) &gt; 0">
+						<xsl:variable name="theDocument_1"
+							select="document( $document-uri,/ )" />
+						<!-- Inside the for-each below the context node is the external document, not this extends element -->
+
+						<!-- case 0 -->
+						<xsl:if test="not($theDocument_1)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- use for-each to rebase id() to external document -->
+						<xsl:for-each select="$theDocument_1">
+							<xsl:variable name="theFragment_1"
+								select=" $theDocument_1//iso:*[@xml:id= $fragment-id ] |
+									id($fragment-id) |
+									$theDocument_1//iso:*[@id= $fragment-id ]" />
+
+
+							<xsl:choose>
+								<!-- case 0: @href is not reachable from here, so the href is rebuilt from its two parts -->
+								<xsl:when test="not($theFragment_1)">
+									<xsl:message terminate="no">
+										<xsl:text>Unable to locate id attribute: </xsl:text>
+										<xsl:value-of select="concat($document-uri, '#', $fragment-id)" />
+									</xsl:message>
+								</xsl:when>
+
+
+								<!-- case 1 REMOVED -->
+
+								<!-- case 2 REMOVED -->
+
+
+								<!-- case 3 -->
+								<xsl:otherwise>
+
+									<xsl:apply-templates
+										select=" $theFragment_1[1]/*" mode="dsdl:go" />
+								</xsl:otherwise>
+							</xsl:choose>
+						</xsl:for-each>
+					</xsl:when>
+
+					<!-- Case where there is no ID so we include the whole document -->
+					<!-- Experimental addition: include fragments of children -->
+					<xsl:otherwise>
+						<xsl:variable name="theDocument_2"
+							select="document( $document-uri,/ )" />
+						<xsl:variable name="theFragment_2"
+							select="$theDocument_2/iso:*" />
+						<xsl:variable name="theContainedFragments"
+							select="$theDocument_2/*/iso:* | $theDocument_2/*/xsl:* | $theDocument_2/*/xhtml:*" />
+						<xsl:if test="not($theDocument_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+
+						<!-- There are three cases for includes:
+							0) No text specified- error!
+							
+							1) REMOVED
+							
+							2) REMOVED
+							
+							3) Otherwise, include the children of the pointed-to element
+						-->
+						<xsl:choose>
+							<!-- case 0 -->
+							<xsl:when
+								test="not($theFragment_2) and not ($theContainedFragments)">
+								<xsl:message terminate="no">
+									<xsl:text>Unable to locate id attribute: </xsl:text>
+									<xsl:value-of select="@href" />
+								</xsl:message>
+							</xsl:when>
+
+							<!-- case 1 removed -->
+
+							<!-- case 2 removed -->
+
+							<!-- If this were XSLT 2, we could use  
+								if ($theFragment) then $theFragment else $theContainedFragments
+								here (thanks to KN)
+							-->
+							<!-- case 3 -->
+							<xsl:otherwise>
+								<xsl:apply-templates
+									select="$theFragment_2/* " mode="dsdl:go" />
+							</xsl:otherwise>
+						</xsl:choose>
+					</xsl:otherwise>
+				</xsl:choose>
+			</xsl:otherwise>
+		</xsl:choose>
+
+		<xsl:processing-instruction name="DSDL_INCLUDE_END">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+	</xsl:template>
+
+
+
+	<!-- =========================================================== -->
+	<!-- Handle Schematron 1.6 inclusions: clone of ISO code above   -->
+	<!-- =========================================================== -->
+
+
+	<!-- Extend the URI syntax to allow # references -->
+	<!-- Add experimental support for simple containers like  /xxx:xxx/schold:pattern to allow better includes -->
+	<xsl:template match="schold:include" mode="dsdl:go">
+		<xsl:variable name="document-uri"
+			select="substring-before(concat(@href,'#'), '#')" />
+		<xsl:variable name="fragment-id"
+			select="substring-after(@href, '#')" />
+		<!-- Replaces schold:include by the schold: element that @href refers to, bracketed by DSDL_INCLUDE_START/END PIs. -->
+		<xsl:processing-instruction name="DSDL_INCLUDE_START">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+
+		<xsl:choose>
+			<xsl:when test="not( $include-schematron = 'true' )">
+				<xslt:copy>
+					<xslt:copy-of select="@*" />
+					<xslt:apply-templates mode="dsdl:go" />
+				</xslt:copy>
+			</xsl:when>
+			<xsl:otherwise>
+				<xsl:choose>
+
+					<xsl:when
+						test="string-length( $document-uri ) = 0 and string-length( $fragment-id ) = 0">
+						<xsl:message>
+							Error: Impossible URL in Schematron include
+						</xsl:message>
+					</xsl:when>
+
+					<!-- this case is when there is an embedded schema in the same document elsewhere -->
+					<xslt:when
+						test="string-length( $document-uri ) = 0">
+						<xslt:apply-templates mode="dsdl:go"
+							select="//schold:*[@xml:id= $fragment-id ]
+								| id( $fragment-id)
+								| //schold:*[@id= $fragment-id ]" />
+					</xslt:when>
+
+					<!-- case where there is a fragment in another document (should be a schold: element) -->
+					<xsl:when
+						test="string-length( $fragment-id ) &gt; 0">
+						<xsl:variable name="theDocument_1"
+							select="document( $document-uri,/ )" />
+						<xsl:if test="not($theDocument_1)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- for-each rebases id() to $theDocument_1; the context node is then that document, so @href is unavailable -->
+						<xsl:for-each select="$theDocument_1">
+							<xsl:variable name="theFragment_1"
+								select=" $theDocument_1//schold:*[@xml:id= $fragment-id ] |
+									id($fragment-id) |
+									$theDocument_1//schold:*[@id= $fragment-id ]" />
+							<xsl:if
+								test=" $theFragment_1/self::schold:schema ">
+								<xsl:message>
+									Schema error: Use include to include
+									fragments, not a whole schema
+								</xsl:message>
+							</xsl:if>
+							<xsl:if test="not($theFragment_1)">
+								<xsl:message terminate="no">
+									<xsl:text>Unable to locate id attribute: </xsl:text>
+									<xsl:value-of select="concat($document-uri, '#', $fragment-id)" />
+								</xsl:message>
+							</xsl:if>
+							<xsl:apply-templates
+								select=" $theFragment_1[1]" mode="dsdl:go" />
+						</xsl:for-each>
+					</xsl:when>
+
+					<!-- Case where there is no ID so we include the whole document (its schold: root element) -->
+					<!-- Experimental addition: include fragments of children -->
+					<xsl:otherwise>
+						<xsl:variable name="theDocument_2"
+							select="document( $document-uri,/ )" />
+						<xsl:variable name="theFragment_2"
+							select="$theDocument_2/schold:*" />
+						<xsl:variable name="theContainedFragments"
+							select="$theDocument_2/*/schold:* | $theDocument_2/*/xsl:* | $theDocument_2/*/xhtml:*" />
+						<xsl:if test="not($theDocument_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+
+						<xsl:if
+							test=" $theFragment_2/self::schold:schema or $theContainedFragments/self::schold:schema">
+							<xsl:message>
+								Schema error: Use include to include
+								fragments, not a whole schema
+							</xsl:message>
+						</xsl:if>
+						<xsl:if
+							test="not($theFragment_2) and not ($theContainedFragments)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to locate id attribute: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- If this were XSLT 2, we could use  
+							if ($theFragment) then $theFragment else $theContainedFragments
+							here (thanks to KN)
+						-->
+						<xsl:choose>
+							<xsl:when test=" $theFragment_2 ">
+								<xsl:apply-templates
+									select="$theFragment_2 " mode="dsdl:go" />
+							</xsl:when>
+							<xsl:otherwise>
+								<!-- WARNING!  EXPERIMENTAL! Use at your own risk. This may be discontinued! -->
+								<xsl:apply-templates
+									select="  $theContainedFragments " mode="dsdl:go" />
+							</xsl:otherwise>
+						</xsl:choose>
+					</xsl:otherwise>
+				</xsl:choose>
+
+			</xsl:otherwise>
+		</xsl:choose>
+
+		<xsl:processing-instruction name="DSDL_INCLUDE_END">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+	</xsl:template>
+	<!-- =========================================================== -->
+	<!-- ISO/IEC 19757 - DSDL Document Schema Definition Languages   -->
+	<!-- Part 5 - DataType Library Language - DTLL                   -->
+	<!-- Committee Draft  Experimental support only                  -->
+	<!-- The <include> element may well be replaced by XInclude in   -->
+	<!-- any final version.                                          -->
+	<!-- =========================================================== -->
+	<xslt:template match="dtll:include" mode="dsdl:go">
+		<!-- Insert subschema -->
+		<!-- Replaces dtll:include by the document, or fragment, that @href points to, bracketed by DSDL_INCLUDE_START/END PIs. -->
+		<xsl:variable name="document-uri"
+			select="substring-before(concat(@href,'#'), '#')" />
+		<xsl:variable name="fragment-id"
+			select="substring-after(@href, '#')" />
+		<xsl:processing-instruction name="DSDL_INCLUDE_START">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+		<xsl:choose>
+			<xsl:when test="not( $include-dtll = 'true' )">
+				<xslt:copy>
+					<xslt:copy-of select="@*" />
+					<xslt:apply-templates mode="dsdl:go" />
+				</xslt:copy>
+			</xsl:when>
+			<xsl:otherwise>
+				<xsl:choose>
+
+					<xsl:when
+						test="string-length( $document-uri ) = 0 and string-length( $fragment-id ) = 0">
+						<xsl:message>
+							Error: Impossible URL in DTLL include
+						</xsl:message>
+					</xsl:when>
+
+					<!-- this case is when there is an embedded schema in the same document elsewhere -->
+					<xslt:when
+						test="string-length( $document-uri ) = 0">
+						<xslt:apply-templates mode="dsdl:go"
+							select="//*[@xml:id= $fragment-id ] | id( $fragment-id)
+								| //*[@id= $fragment-id ]" />
+					</xslt:when>
+
+					<xsl:when
+						test="string-length( $fragment-id ) &gt; 0">
+						<xsl:variable name="theDocument_1"
+							select="document( $document-uri,/ )" />
+						<xsl:if test="not($theDocument_1)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- for-each rebases id() to $theDocument_1; the context node is then that document, so @href is unavailable -->
+						<xsl:for-each select="$theDocument_1">
+							<xsl:variable name="theFragment_1"
+								select="$theDocument_1//*[@xml:id= $fragment-id ]
+									| id( $fragment-id )
+									| $theDocument_1//*[@id= $fragment-id ]" />
+							<xsl:if test="not($theFragment_1)">
+								<xsl:message terminate="no">
+									<xsl:text>Unable to locate id attribute: </xsl:text>
+									<xsl:value-of select="concat($document-uri, '#', $fragment-id)" />
+								</xsl:message>
+							</xsl:if>
+							<xsl:apply-templates
+								select=" $theFragment_1[1]" mode="dsdl:go" />
+						</xsl:for-each>
+					</xsl:when>
+
+					<xsl:otherwise>
+						<xsl:variable name="theDocument_2"
+							select="document( $document-uri,/ )" />
+						<xsl:variable name="theFragment_2"
+							select="$theDocument_2/*" />
+
+						<xsl:if test="not($theDocument_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+
+						<xsl:if test="not($theFragment_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to locate id attribute: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<xsl:apply-templates select="$theFragment_2 "
+							mode="dsdl:go" />
+					</xsl:otherwise>
+				</xsl:choose>
+
+			</xsl:otherwise>
+		</xsl:choose>
+		<xsl:processing-instruction name="DSDL_INCLUDE_END">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+	</xslt:template>
+
+	<!-- =========================================================== -->
+	<!-- ISO/IEC 19757 - DSDL Document Schema Definition Languages   -->
+	<!-- Part 7 - Character Repertoire Description Language - CRDL   -->
+	<!-- Final Committee Draft 2008-01-11 Experimental support only  -->
+	<!-- =========================================================== -->
+	<xslt:template match="crdl:ref" mode="dsdl:go">
+		<!-- Insert subschema: @href is split at its first '#' into a document URI and a fragment id; -->
+		<!-- whatever the branches below emit is bracketed by DSDL_INCLUDE_START / DSDL_INCLUDE_END PIs carrying @href. -->
+		<xsl:variable name="document-uri"
+			select="substring-before(concat(@href,'#'), '#')" />
+		<xsl:variable name="fragment-id"
+			select="substring-after(@href, '#')" />
+		<xsl:processing-instruction name="DSDL_INCLUDE_START">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+		<xsl:choose>
+			<xsl:when test="not( $include-crdl = 'true' )">
+				<xslt:copy>
+					<xslt:copy-of select="@*" />
+					<xslt:apply-templates mode="dsdl:go" />
+				</xslt:copy>
+			</xsl:when>
+			<xsl:otherwise>
+				<xsl:choose>
+					<!-- Neither a document URI nor a fragment id: only a (non-terminating) message is produced. -->
+					<xsl:when
+						test="string-length( $document-uri ) = 0 and string-length( $fragment-id ) = 0">
+						<xsl:message>
+							Error: Impossible URL in CRDL include
+						</xsl:message>
+					</xsl:when>
+
+					<!-- this case is when there is an embedded schema in the same document elsewhere -->
+					<xslt:when
+						test="string-length( $document-uri ) = 0">
+						<!-- Same-document lookup by xml:id, by id() (IDs as known to the XPath processor), or by a plain id attribute. -->
+						<xslt:apply-templates mode="dsdl:go"
+							select="//*[@xml:id= $fragment-id ] | id( $fragment-id)
+              	| //*[@id= $fragment-id ]" />
+					</xslt:when>
+					<!-- Document URI plus fragment id: look the fragment up inside the external document. -->
+					<xsl:when
+						test="string-length( $fragment-id ) &gt; 0">
+						<xsl:variable name="theDocument_1"
+							select="document( $document-uri,/ )" />
+						<xsl:if test="not($theDocument_1)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- use for-each to rebase id() to $theDocument -->
+						<xsl:for-each select="$theDocument_1">
+							<xsl:variable name="theFragment_1"
+								select="$theDocument_1//*[@xml:id= $fragment-id ]
+               | id( $fragment-id )
+               | $theDocument_1//*[@id= $fragment-id ]" />
+							<!-- NOTE(review): every match is applied below, whereas the DTLL and XLink templates apply only $theFragment_1[1]; confirm this is intended. -->
+							<xsl:if test="not($theFragment_1)">
+								<xsl:message terminate="no">
+									<xsl:text>Unable to locate id attribute: </xsl:text>
+									<xsl:value-of select="@href" />
+								</xsl:message>
+							</xsl:if>
+							<xsl:apply-templates select=" $theFragment_1 "
+								mode="dsdl:go" />
+						</xsl:for-each>
+					</xsl:when>
+					<!-- Document URI without a fragment id: the element children of the document node (its root element) are included. -->
+					<xsl:otherwise>
+						<xsl:variable name="theDocument_2"
+							select="document( $document-uri,/ )" />
+						<xsl:variable name="theFragment_2"
+							select="$theDocument_2/*" />
+
+						<xsl:if test="not($theDocument_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<xsl:if test="not($theFragment_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to locate id attribute: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- NOTE(review): no id is involved in this branch; the message above fires whenever $theFragment_2 is empty, including when the document did not open. -->
+						<xsl:apply-templates select="$theFragment_2"
+							mode="dsdl:go" />
+					</xsl:otherwise>
+				</xsl:choose>
+
+			</xsl:otherwise>
+		</xsl:choose>
+		<xsl:processing-instruction name="DSDL_INCLUDE_END">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+	</xslt:template>
+
+
+	<!-- =========================================================== -->
+	<!-- ISO/IEC 19757 - DSDL Document Schema Definition Languages   -->
+	<!-- Part 4 - Namespace-based Validation Dispatching Language - NVDL -->
+	<!-- Note: This does not include schemas referenced for          -->
+	<!-- validation, it merely handles any simple XIncludes          -->
+	<!-- =========================================================== -->
+	<!-- ISO/IEC 19757 - DSDL Document Schema Definition Languages   -->
+	<!-- Part 8 - Document Schema Renaming Language - DSRL           -->
+	<!-- Note: Final? Committee Draft   Experimental support only    -->
+	<!-- =========================================================== -->
+	<!-- XInclude support for id based references only, with 1 level -->
+	<!-- of fallback.                                                -->
+	<!-- =========================================================== -->
+
+	<xslt:template mode="dsdl:go"
+		match="xi:include[@href][not(@parseType) or @parseType ='xml'][not(@parse) or @parse ='xml']">
+		<!-- Simple inclusions only here: XML includes addressed by @href and/or a bare-id @xpointer. -->
+		<!-- XInclude spells the attribute "parse"; the older "parseType" test is kept alongside it so that spelling behaves as before. -->
+		<xsl:processing-instruction name="DSDL_INCLUDE_START">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+		<xsl:choose>
+			<xsl:when test="not( $include-xinclude = 'true' )">
+				<xslt:copy>
+					<xslt:copy-of select="@*" />
+					<xslt:apply-templates mode="dsdl:go" />
+				</xslt:copy>
+			</xsl:when>
+			<xsl:otherwise>
+				<xsl:choose>
+
+					<xsl:when test="contains( @href, '#')">
+						<xsl:message terminate="yes">
+							Fatal error: Xinclude href contains fragment
+							identifier #
+						</xsl:message>
+					</xsl:when>
+
+					<xsl:when test="contains( @xpointer, '(')">
+						<xsl:message terminate="yes">
+							Fatal error: Sorry, this software only
+							supports simple ids in XInclude xpointers
+						</xsl:message>
+					</xsl:when>
+
+					<xsl:when
+						test="string-length( @href ) = 0 and string-length( @xpointer ) = 0">
+
+						<xsl:message terminate="yes">
+							Fatal Error: Impossible URL in XInclude
+							include
+						</xsl:message>
+					</xsl:when>
+
+					<!-- this case is when there is an embedded schema in the same document elsewhere -->
+					<xslt:when test="string-length( @href ) = 0">
+
+						<xslt:apply-templates mode="dsdl:go"
+							select="//*[@xml:id= current()/@xpointer  ] | id( @xpointer)
+              	| //*[@id= current()/@xpointer  ]" />
+					</xslt:when>
+					<!-- External document plus a bare-id xpointer -->
+					<xsl:when
+						test="string-length( @xpointer ) &gt; 0">
+						<xsl:variable name="theDocument_1"
+							select="document( @href,/ )" />
+						<xsl:variable name="theFragment_1"
+							select="$theDocument_1//*[@xml:id= current()/@xpointer  ]
+              | $theDocument_1//*[@id= current()/@xpointer  ]" />
+						<!-- removed
+							| $theDocument_1/id( @xpointer)
+							because it requires rebasing in XSLT1 and that would mess up the use of current()
+						-->
+
+						<!-- Allow one level of fallback, to another XInclude -->
+						<xsl:if test="not($theDocument_1)">
+							<xsl:choose>
+								<xsl:when test="xi:fallback">
+									<xsl:variable name="theDocument_2"
+										select="document( xi:fallback[1]/xi:include[not(@parseType)
+                    	 or @parseType='xml'][not(@parse) or @parse='xml']/@href,/ )" />
+									<xsl:variable name="theFragment_2"
+										select="$theDocument_2//*[@xml:id= current()/xi:fallback[1]/xi:include/@xpointer  ]
+              				| $theDocument_2//*[@id= current()/xi:fallback[1]/xi:include/@xpointer  ]" />
+									<!-- removed
+										| $theDocument_2/id( xi:fallback[1]/xi:include/@xpointer)
+										because id() would need rebasing in XSLT1 and that would mess up use of current()
+									-->
+
+									<xsl:if
+										test="not($theDocument_2)">
+										<xsl:message terminate="no">
+											<xsl:text>Unable to open referenced included file and fallback
+									file: </xsl:text>
+											<xsl:value-of
+												select="@href" />
+										</xsl:message>
+									</xsl:if>
+									<!-- Emit the fallback fragment; $theFragment_1 is empty here because the primary document did not load. -->
+									<xsl:apply-templates select="$theFragment_2"
+										mode="dsdl:go" />
+								</xsl:when>
+								<xsl:otherwise>
+									<xsl:message terminate="no">
+										<xsl:text>Unable to open referenced included file: </xsl:text>
+										<xsl:value-of select="@href" />
+									</xsl:message>
+								</xsl:otherwise>
+							</xsl:choose>
+						</xsl:if>
+						<xsl:apply-templates select=" $theFragment_1"
+							mode="dsdl:go" />
+					</xsl:when>
+
+					<!-- Document but no fragment specified -->
+					<xsl:otherwise>
+						<xsl:variable name="theDocument_3"
+							select="document( @href,/ )" />
+						<xsl:variable name="theFragment_3"
+							select="$theDocument_3/*" />
+
+						<xsl:if test="not($theDocument_3)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@href" />
+							</xsl:message>
+						</xsl:if>
+
+						<xsl:apply-templates select="$theFragment_3 "
+							mode="dsdl:go" />
+					</xsl:otherwise>
+				</xsl:choose>
+
+			</xsl:otherwise>
+		</xsl:choose>
+		<xsl:processing-instruction name="DSDL_INCLUDE_END">
+			<xsl:value-of select="@href" />
+		</xsl:processing-instruction>
+	</xslt:template>
+
+	<!-- =========================================================== -->
+	<!-- W3C XLink 1.1 embedded simple links                        -->
+	<!-- =========================================================== -->
+	<xslt:template
+		match="*[@xlink:href][not(parent::*[@xlink:type='complex'])]
+	           [not(@xlink:type) or (@xlink:type='simple')]
+	           [@xlink:show='embed']
+	           [not(@xlink:actuate) or (@xlink:actuate='onLoad')]"
+		mode="dsdl:go" priority="1">
+		<!-- Embeds the target of a simple XLink (show='embed', actuate absent or 'onLoad'); @xlink:href is split at its first '#' into a document URI and a fragment id. -->
+		<xsl:variable name="document-uri"
+			select="substring-before(concat(@xlink:href,'#'), '#')" />
+		<xsl:variable name="fragment-id"
+			select="substring-after(@xlink:href, '#')" />
+		<xsl:processing-instruction name="DSDL_INCLUDE_START">
+			<xsl:value-of select="@xlink:href" />
+		</xsl:processing-instruction>
+		<xsl:choose>
+			<xsl:when test="not( $include-xlink = 'true' )">
+				<xslt:copy>
+					<xslt:copy-of select="@*" />
+					<xslt:apply-templates mode="dsdl:go" />
+				</xslt:copy>
+			</xsl:when>
+			<xsl:otherwise>
+				<xsl:choose>
+					<!-- Neither a document URI nor a fragment id: only a (non-terminating) message is produced. -->
+					<xsl:when
+						test="string-length( $document-uri ) = 0 and string-length( $fragment-id ) = 0">
+						<xsl:message>
+							Error: Impossible URL in XLink embedding
+							link
+						</xsl:message>
+					</xsl:when>
+
+					<!-- this case is when there is an embedded schema in the same document elsewhere -->
+					<xslt:when
+						test="string-length( $document-uri ) = 0">
+						<xslt:apply-templates mode="dsdl:go"
+							select="//*[@xml:id= $fragment-id ] | id( $fragment-id) 
+              	| //*[@id= $fragment-id ]" />
+					</xslt:when>
+					<!-- Document URI plus fragment id: look the fragment up inside the external document; only the first match is applied. -->
+					<xsl:when
+						test="string-length( $fragment-id ) &gt; 0">
+						<xsl:variable name="theDocument_1"
+							select="document( $document-uri,/ )" />
+						<xsl:if test="not($theDocument_1)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@xlink:href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- use for-each to rebase id() to $theDocument -->
+						<xsl:for-each select="$theDocument_1">
+							<xsl:variable name="theFragment_1"
+								select="$theDocument_1//*[@xml:id= $fragment-id ]
+               | id( $fragment-id ) 
+               | $theDocument_1//*[@id= $fragment-id ]" />
+							<xsl:if test="not($theFragment_1)">
+								<xsl:message terminate="no">
+									<xsl:text>Unable to locate id attribute: </xsl:text>
+									<xsl:value-of select="@xlink:href" />
+								</xsl:message>
+							</xsl:if>
+							<xsl:apply-templates
+								select=" $theFragment_1[1]" mode="dsdl:go" />
+						</xsl:for-each>
+					</xsl:when>
+					<!-- Document URI without a fragment id: the element children of the document node (its root element) are included. -->
+					<xsl:otherwise>
+						<xsl:variable name="theDocument_2"
+							select="document( $document-uri,/ )" />
+						<xsl:variable name="theFragment_2"
+							select="$theDocument_2/*" />
+
+						<xsl:if test="not($theDocument_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to open referenced included file: </xsl:text>
+								<xsl:value-of select="@xlink:href" />
+							</xsl:message>
+						</xsl:if>
+						<!-- NOTE(review): no id is involved in this branch; the check below fires whenever $theFragment_2 is empty, including when the document did not open. -->
+						<xsl:if test="not($theFragment_2)">
+							<xsl:message terminate="no">
+								<xsl:text>Unable to locate id attribute: </xsl:text>
+								<xsl:value-of select="@xlink:href" />
+							</xsl:message>
+						</xsl:if>
+						<xsl:apply-templates select="$theFragment_2 "
+							mode="dsdl:go" />
+					</xsl:otherwise>
+				</xsl:choose>
+
+			</xsl:otherwise>
+		</xsl:choose>
+
+		<xsl:processing-instruction name="DSDL_INCLUDE_END">
+			<xsl:value-of select="@xlink:href" />
+		</xsl:processing-instruction>
+	</xslt:template>
+
+
+</xslt:stylesheet>
\ No newline at end of file
diff --git a/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_schematron_message.xsl b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_schematron_message.xsl
new file mode 100644
index 00000000..d59b8f38
--- /dev/null
+++ b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_schematron_message.xsl
@@ -0,0 +1,55 @@
+<?xml version="1.0" ?><?xar XSLT?>
+<!-- Implmentation for the Schematron XML Schema Language.
+	http://www.ascc.net/xml/resource/schematron/schematron.html
+ 
+ Copyright (c) 2000,2001 Rick Jelliffe and Academia Sinica Computing Center, Taiwan
+
+ This software is provided 'as-is', without any express or implied warranty. 
+ In no event will the authors be held liable for any damages arising from 
+ the use of this software.
+
+ Permission is granted to anyone to use this software for any purpose, 
+ including commercial applications, and to alter it and redistribute it freely,
+ subject to the following restrictions:
+
+ 1. The origin of this software must not be misrepresented; you must not claim
+ that you wrote the original software. If you use this software in a product, 
+ an acknowledgment in the product documentation would be appreciated but is 
+ not required.
+
+ 2. Altered source versions must be plainly marked as such, and must not be 
+ misrepresented as being the original software.
+
+ 3. This notice may not be removed or altered from any source distribution.
+-->
+
+<!-- Schematron message -->
+
+<xsl:stylesheet
+   version="1.0"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+   xmlns:axsl="http://www.w3.org/1999/XSL/TransformAlias">
+<!-- Message-only front end: imports the XSLT1 skeleton and defines process-prolog and process-message on top of it (presumably overriding the skeleton's defaults; confirm there). -->
+<xsl:import href="iso_schematron_skeleton_for_xslt1.xsl"/>
+<!-- process-prolog: writes an axsl:output element requesting the "text" output method (axsl is presumably aliased to xsl by the skeleton; verify). -->
+<xsl:template name="process-prolog">
+   <axsl:output method="text" />
+</xsl:template>
+
+<!-- use default rule for process-root:  copy contents / ignore title -->
+<!-- use default rule for process-pattern: ignore name and see -->
+<!-- use default rule for process-name:  output name -->
+<!-- use default rule for process-assert and process-report:
+     call process-message -->
+<!-- process-message: wraps the mode="text" output in axsl:message, followed by " (pattern)" or, when $role tests true, " (pattern / role)". -->
+<xsl:template name="process-message">
+   <xsl:param name="pattern" />
+   <xsl:param name="role" />
+   <axsl:message>
+      <xsl:apply-templates mode="text"  
+      /> (<xsl:value-of select="$pattern" />
+      <xsl:if test="$role"> / <xsl:value-of select="$role" />
+      </xsl:if>)</axsl:message>
+</xsl:template>
+
+</xsl:stylesheet>
\ No newline at end of file
diff --git a/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_schematron_skeleton_for_xslt1.xsl b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_schematron_skeleton_for_xslt1.xsl
new file mode 100644
index 00000000..b0e7175c
--- /dev/null
+++ b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_schematron_skeleton_for_xslt1.xsl
@@ -0,0 +1,1796 @@
+<?xml version="1.0"?><?xar XSLT?>
+
+<!-- 
+   OVERVIEW
+   
+   ASCC/Schematron.com Skeleton Module for ISO Schematron (for XSLT1 systems)
+   
+   ISO Schematron is a language for making assertions about the presence or absence
+   of patterns in XML documents. It is typically used as a schema language, or
+   to augment existing schema languages, and to check business rules. It is very
+   powerful, yet quite simple: a developer only need know XPath and about five other
+   elements.
+   
+   This is an open source implementation of ISO Schematron in XSLT. Although ISO does
+   not allow reference implementations which might compete with the text of the
+   standard, this code has been compiled by Rick Jelliffe, inventor of Schematron
+   and editor of the ISO standard; so developers can certainly use it as an 
+   unofficial reference implementation for clarification. 
+   
+   This implementation is based on one by Oliver Becker. API documentation is 
+   available separately; try www.schematron.com for this. Funding for this
+   stylesheet over the years has come from Topologi Pty. Ltd., Geotempo Ltd.,
+   and ASCC, Taipei.
+   
+   There are two versions of this skeleton: one is tailored for XSLT1 processors
+   and the other is tailored for XSLT2 processors. Future versions of the
+   XSLT2 skeleton may support more features than the XSLT 1 skeleton.
+-->
+<!--
+   TIPS
+      
+   A tip for new users of Schematron: make your assertions contain positive messages
+   about what is expected, rather than error messages. For example, use the form
+   "An X should have a Y, because Z". 
+   
+   Another tip is that Schematron provides an
+   element <sch:ns> for declaring the namespaces and prefixes used in Xpaths in 
+   attribute values; it does not extend the XML Namespaces mechanism: if a name
+   in an XPath has a prefix, there must be an <sch:ns> element for that prefix; if
+   a name in an XPath does not have a prefix, it is always in no namespace.
+   
+   A tip for implementers of Schematron, either using this API or re-implementing it:
+   make the value of the diagnostics, flags and richer features available if possible;
+   Schematron has many of the optional richer features which, if implemented, provide
+   a compelling alternative approach to validation and business-rules checking compared
+   to other schema languages and programs. 
+   
+   If you create your own meta-stylesheet to override this one, it is a
+   good idea to have both in the same directory and to run the stylesheet
+   from that directory, as many XSLT implementations have idiosyncratic
+   handling of URLs: keep it simple.
+-->
+ 
+
+<!--
+  INVOCATION INFORMATION
+  
+  The following parameters are available
+  
+    phase           NMTOKEN | "#ALL" (default) Select the phase for validation
+    allow-foreign   "true" | "false" (default)   Pass non-Schematron elements to the generated stylesheet
+    sch.exslt.imports semi-colon delimited string of filenames for some EXSLT implementations  
+    message-newline "true" (default) | "false"   Generate an extra newline at the end of messages
+    optimize        "visit-no-attributes"     
+    debug	    "true" | "false" (default)  Debug mode lets compilation continue despite problems
+    attributes "true" | "false"  (Autodetecting) Use only when the schema has no attributes as the context nodes
+    only-child-elements "true" | "false" (Autodetecting) Use only when the schema has no comments
+    or PI  as the context nodes
+    
+  The following parameters can be specified as Schematron variables in diagnostics, assertions and so on.
+    fileNameParameter string	  
+    fileDirParameter string				
+    archiveNameParameter string	  In case of ZIP files
+    archiveDirParameter string	  In case of ZIP files	
+    output-encoding				  Use when outputting to XML
+ 
+ Experimental: USE AT YOUR OWN RISK   
+    visit-text "true" "false"   Also visit text nodes for context. WARNING: NON_STANDARD.
+    select-contents '' | 'key' | '//'   Select different implementation strategies
+ 
+ Conventions: Meta-stylesheets that override this may use the following parameters
+    generate-paths=true|false   generate the @location attribute with XPaths
+    diagnose= yes | no    Add the diagnostics to the assertion test in reports
+    terminate= yes | no   Terminate on the first failed assertion or successful report
+-->
+
+<!-- 
+  XSLT VERSION SUPPORT
+
+  XSLT 1:
+     A schema using the standard XSLT 1 query binding will have a /schema/@queryBinding='xslt' or 
+     nothing.
+
+       * Note: XT does not implement key() and will die if given it. 
+       * Add all formal parameters to default templates
+       * Fix missing apply-templates from process-ns and add params back
+
+  EXSLT:  Experimental support
+     A schema using the EXSLT query binding will have a /schema/@queryBinding='exslt'.
+     It is built on XSLT 1. After experience is gained, this binding is expected to be 
+     formalized as part of ISO Schematron, which currently reserves the "exslt" name for this purpose.
+
+     Some EXSLT engines have the extra functions built-in. For these, there is no need to
+     provide library locations. For engines that require the functions, either hard code
+     them in this script or provide them on the command-line argument.
+ 
+-->
+<!--
+   PROCESS INFORMATION
+   
+   This stylesheet compiles a Schematron schema (*.sch) into XSLT code (*.xsl). 
+   The generated XSLT code can then be run against an XML file (*.xml, etc) and
+   will produce validation results.
+   
+   The output of validation results is performed using named templates (process-*). 
+   These can be overridden easily by making a new XSLT stylesheet that imports this 
+   stylesheet but has its own version of the relevant process-* templates. Several
+   of these invoking stylesheets are available: "iso_svrl.xsl", for example generates
+   ISO Schematron Validation Report Language format results.
+   
+   In this version of the stylesheet, the ISO feature called "abstract patterns" is
+   implemented using macro processing: a prior XSLT stage which converts uses
+   of abstract patterns into normal patterns. If you do not use abstract patterns,
+   it is not necessary to preprocess the schema.
+   
+   To summarize, a basic process flow for some commandline processor is like this:
+     XSLT -input=xxx.sch  -output=xxx.xsl  -stylesheet=iso_schematron_skeleton.xsl
+     XSLT -input=document.xml  -output=xxx-document.results  -stylesheet=xxx.xsl
+   
+   iso_svrl.xslt is an implementation of Schematron that can use this skeleton and
+   generate ISO SVRL reports. A process flow for some commandline processor would
+   be like this:
+     XSLT -input=xxx.sch  -output=xxx.xsl  -stylesheet=iso_svrl.xsl
+     XSLT -input=document.xml  -output=xxx-document.results  -stylesheet=xxx.xsl
+     
+   It is not impossible that ultimately a third stage, to handle macro-preprocessing
+   and inclusion, might be necessary. (The trade-off is in making this XSLT more
+   complex compared to making the outer process more complex.)
+             
+  This version has so far been tested with
+     Saxon 8
+     MSXML 4 (or 6?)   
+
+ Please note that if you are using SAXON and JAXP, then you should use 
+  System.setProperty("javax.xml.transform.TransformerFactory",
+                          "net.sf.saxon.TransformerFactoryImpl");
+ rather than 
+  System.setProperty("javax.xml.xpath.TransformerFactory",
+                           "net.sf.saxon.TransformerFactoryImpl");
+ which does not work, at least for the versions of SAXON we tried.
+-->
+<!--
+ LEGAL INFORMATION
+ 
+ Copyright (c) 2000-2008 Rick Jelliffe and Academia Sinica Computing Center, Taiwan
+
+ This software is provided 'as-is', without any express or implied warranty. 
+ In no event will the authors be held liable for any damages arising from 
+ the use of this software.
+
+ Permission is granted to anyone to use this software for any purpose, 
+ including commercial applications, and to alter it and redistribute it freely,
+ subject to the following restrictions:
+
+ 1. The origin of this software must not be misrepresented; you must not claim
+ that you wrote the original software. If you use this software in a product, 
+ an acknowledgment in the product documentation would be appreciated but is 
+ not required.
+
+ 2. Altered source versions must be plainly marked as such, and must not be 
+ misrepresented as being the original software.
+
+ 3. This notice may not be removed or altered from any source distribution.
+-->
+<!--
+  NOTE: Compared to the iso_schematron_skeleton_for_saxon.xsl code, this version is currently missing
+     1) localization
+     2) properties
+     3) pattern/@documents
+
+  VERSION INFORMATION 
+   2009-02-25 RJ
+        * Fix up variable names so none are used twice in same template
+        * Tested on SAXON 9, Xalan 2.7.1. Partly tested MSXML.  
+   2008-09-19 RJ
+        * Add mode schematron-select-full-path and param full-path-notation 
+   
+   2008-08-11
+   		* TT report/@flag was missing
+   2008-08-06
+   		* TT Top-level lets need to be implemented using xsl:param not xsl:variable
+   		* TT xsl:param/@select must have XPath or not be specified
+   		
+    Version: 2008-07-28
+   		* KH schematron-get-full-path-3 has [index] even on top step
+   		* RJ fix schematron-get-full-path to have namespace predicate, I don't know why this was removed
+   		
+   Version: 2008-07-24
+   		* RJ clean out commented out namespace handling code
+   		* RJ add support for experimental non-standard attribute report/@action
+   		and assert/@action, and add parameter not in the published API (should
+   		not break anything, it is XSLT1)
+   		* RJ Remove remaining XSLT2 code for ease of reading
+   		
+   Version: 2008-07-14 minor update for inclusion experiments
+   	* RJ Clean up zero-length fragment test on include
+   	* RJ Add experimental support for include containers 
+   	* RJ For path generation, test for //iso:schema not just /iso:schema, for potential embedded Schematron support   
+   	* RJ Don't generate double error messages for old namespace elements
+   	* RJ Experimental iso:rule/iso:title just kept as comment (bigger request Uche Ogbuji)
+   	* RJ Remove spurious debug messages
+   	* RJ Fix bug that prevented including patterns in this (report Roger
+   	Costello)
+  
+   Version: 2007-10-17
+     From this version on I am forking XSLT2 support to a different version of the script.
+     This is due to the increasingly horrible state of the namespace handling code as well
+     as other inconsistencies between the major implementations of different versions.
+     The intent is that future versions of this will have XSLT2 isms removed and be simplified
+     to cope with only XSLT1 and EXSLT. Note that though this version is called
+     iso_schematron_skeleton_for_xslt1, the various meta-stylesheets will continue to just call
+     iso_schematron_skeleton: it is up to you to rename the stylesheet to the one you want to
+     use.
+
+       * RJ fix FULL-PATH problem with attribute names
+
+
+   Version: 2007-07-19
+     Accept most changes in David Carlisle's fork, but continue as XSLT1 script: 
+    	http://dpcarlisle.blogspot.com/search/label/schematron
+    	* DPC Remove "optimize" parameter
+    	* DPC Add autodetecting optimize parameter attribute to skip checking attribute
+    	context
+    	* DPC Add autodetecting optimize parameter only-child-elements turn off checking for 
+    	comments and PIs
+    	* DPC (Experimental: NON_STANDARD DANGER!) Add param visit-text to visit text
+    	nodes too for context 
+    	* DPC Fix inclusion syntax to allow #
+    	* DPC Priorities count up from 1000 not down from 4000 to allow more rules
+        * RJ Add new template for titles of schemas, with existing behaviour.  
+        Override process-schema-title for custom processing of title
+    		
+    
+   Version: 2007-04-04
+   	* RJ debug mode param
+	* RJ alter mixed test to only test mixed branches, so the same document
+	could have old and new namespaces schemas in it, but each schema must
+	be distinct, just so as not to overconstrain things.
+   	* KH zero-length include/@href is fatal error, but allow debug mode
+	* SB add hint on SAXON and JAXP
+	* DC generate-full-path-1 generates XSLT1 code by default
+   Version: 2007-03-05
+      	* AS Typo for EXSLT randome, improve comment
+      	* KH get-schematron-full-path-2 needs to apply to attributes too
+      	* DP document policy on extensions better
+      	* DC use copy-of not copy for foreign elements
+      	* DC add generate-path-2
+      	* DC don't try to apply templates to attribute axis on attribute nodes, to
+      	stop SAXON warning.
+      	* RJ improve reporting of typos 
+   
+   Version: 2007-02-08
+   		* KH Schematron fullpath implementation: @* handled twice and / missing
+   		* KH Change stylesheetbody from named template to mode to allow implementers more flexibility.
+   		  Move process-ns to outside the stylesheet body.
+   		* DP, FG, fix handling of xslt:key
+   		* FG no iso:title/@class
+   		* Experimental optimization 'visit-no-attributes'
+   		* KH Experimental added schematron-get-full-path-2 which gives prefixed version for humans
+ 		* DC Move stylesheet/@version generation to after namespace handling
+ 		* DC, FG EXSLT namespace handling code
+ 		* FG add ref and commented code from FG's page on namespaces
+ 		* Start adding normalize-space() to parameter code
+ 		* Add a space between diagnostics
+   		   		 
+   Version: 2007-01-22
+   	* DP change = ($start) to = $start and =($phase) to =$phase 
+   	to run under Saxon 8.8j
+	* FG better title section using ( @id | sch:title)[last()]
+	* Default query language binding is "xslt" not "xslt1"
+  
+   Version: 2007-01-19
+   		* Simplify message newline code
+   		* Remove termination and xpath appending to message options: 
+   		   factor out as  iso_schematron_terminator.xsl
+   		* Comment out XSLT2 namespace fix temporarily
+  
+   Version: 2007-01-18 (First beta candidate for comment)
+          * DC remove xml:space="preserve"
+          * FG improve comment on import statement
+          * DC improve comments on invocation section
+          * Add exploratory support for sch:schema[@queryBinding='xpath']
+             by allowing it and warning as lets are found
+          * Be strict about queryBinding spelling errors
+          * Extra comments on the different queryBindings
+          * KH Add option "message-paths" to generate XPath from output 
+          * KH Add option "terminate" to halt with an error after the first assertion
+          * KH refactor paths in schematron-full-path
+          * Improve (?) namespace handling: no dummy attributes for prefix "xsl" generated
+   
+   Version: 2007-01-15
+          * FG fix for calling templates
+          * Add formal parameters to default templates: may help XSLT 2
+          * Fix get-schematron-full-path
+          * Include skeleton1-6 is commented out by default
+
+   Version:2007-01-12 (Pre-beta release to Schematron-love-in maillist)
+           * Add many extra parameters to the process-* calls, so that almost
+           all the information in the schema can be provided to client programs.
+           Also, rearrange the parameters to fit in with the ISO schema, which
+           has "rich" and "linkable" attribute groups.
+           * Warn on diagnostics with no ID once only
+           * Improved path reporting, to handle namespaces
+           * Add process-title dummy template for API
+           * Add command-line parameter allow-foreign (true|false) to suppress
+            warnings on foreign elements and pass them through to the generated
+            stylesheet
+           * remove legacy templates for the old ASCC namespace and no namespace, 
+              and use an import statement instead. Much cleaner now!
+           * patterns use @id not @name
+           * titles can contain sub-elements
+           * start change sch:rule to allow attributes, PIs and comments 
+           * the default process-* for inline elements add a leading and trailing 
+             space, to reduce the chance of concatenation.
+           * add comments to make the generated code clearer
+           
+   Version:2006-11-07 (ISO: first release private to schematron-love-in maillist for review)
+           * Duplicate pattern templates, for handling ISO namespace
+           * Add priority onto default and paragraph templates
+           * Add namespace checks
+           * Handle key in xsl namespace not iso
+           * Add include
+           * Improve namespace handling
+           * Preliminary XSLT2 and EXSLT support
+	       * Refactor iso:schema for clarity
+
+    Version: 2003-05-26 
+    	    * Fix bug with key 
+    Version: 2003-04-16
+    	   * handle 1.6 let expressions
+    	   * make key use XSLT names, and allow anywhere
+    Version: 2001-06-13
+           * same skeleton now supports namespace or no namespace
+           * parameters to handlers updated for all 1.5 attributes 
+           * diagnostic hints supported: command-line option diagnose=yes|no
+           * phases supported: command-line option phase=#ALL|...
+           * abstract rules
+           * compile-time error messages  
+	   * add utility routine generate-id-from-path
+          
+    Contributors: Rick Jelliffe (original), Oliver Becker (architecture, XSLT2), 
+             Miloslav Nic (diagnostic, phase, options), Ludwig Svenonius (abstract)
+             Uche Ogbuji (misc. bug fixes), Jim Ancona (SAXON workaround),
+	 	     Francis Norton (generate-id-from-path), Robert Leftwich, Bryan Rasmussen,
+             Dave Pawson (include, fallback), Florent Georges (namespaces, exslt, attribute
+             context), Benoit Maisonny (attribute context), John Dumps (process-message newline),
+             Cliff Stanford (diagnostics and other newlines)
+
+    
+    KNOWN TYPICAL LIMITATIONS:
+      * Don't use <sch:ns prefix="xsl" .../> with a namespace other than the standard
+      XSLT one. This would be a bizarre thing to do anyway. 
+      * Don't use other prefixes for the XSLT namespace either; some implementations will
+      not handle it correctly.
+     
+     EXTENSIONS:
+      ISO Schematron is designed as a framework with some standard query language
+      bindings. If you need to support other features, please do so safely by making
+      up your own @queryLanguage name: this makes it clear that your schema requires
+      special features. For example, default ISO Schematron does not support user
+      defined functions; so if you want to use the user defined function feature
+      in XSLT, you need to have a schema with some queryBinding attribute name like
+      "XSLT-with-my-functions" or whatever.
+-->
+
+
+
+
+<xsl:stylesheet version="1.0" 
+	xmlns:xsl="http://www.w3.org/1999/XSL/Transform" 
+	xmlns:axsl="http://www.w3.org/1999/XSL/TransformAlias" 
+	xmlns:sch="http://www.ascc.net/xml/schematron"
+    xmlns:iso="http://purl.oclc.org/dsdl/schematron" 
+    xmlns:exsl="http://exslt.org/common"
+    xmlns:msxsl="urn:schemas-microsoft-com:xslt"
+    extension-element-prefixes="exsl  msxsl"
+	 >
+<!-- This program implements ISO Schematron, except for abstract patterns which require a preprocess. -->
+  
+
+<xsl:namespace-alias stylesheet-prefix="axsl" result-prefix="xsl"/>
+
+
+<!-- Category: top-level-element -->
+<xsl:output method="xml" omit-xml-declaration="no" standalone="yes"  indent="yes"/>
+
+
+<xsl:param name="phase">
+  <xsl:choose>
+    <xsl:when test="//sch:schema/@defaultPhase">
+      <xsl:value-of select="//sch:schema/@defaultPhase"/>
+    </xsl:when>   
+    <xsl:when test="//iso:schema/@defaultPhase">
+      <xsl:value-of select="//iso:schema/@defaultPhase"/>
+    </xsl:when>
+    <xsl:otherwise>#ALL</xsl:otherwise>
+  </xsl:choose>
+</xsl:param>
+
+<xsl:param name="allow-foreign">false</xsl:param>
+
+<xsl:param name="message-newline">true</xsl:param>
+
+<!-- DPC set to true if contexts should be checked on attribute nodes
+         defaults to true if there is any possibility that a context could match an attribute,
+         err on the side of caution, a context of *[.='@'] would cause this param to default to true
+         even though @ is in a string
+-->
+<xsl:param name="attributes">
+  <xsl:choose>
+    <xsl:when test="//iso:rule[contains(@context,'@') or contains(@context,'attribute')]">true</xsl:when>
+    <xsl:otherwise>false</xsl:otherwise>
+  </xsl:choose>
+</xsl:param>
+
+<!-- DPC set to true if contexts should be checked on just elements in the child axis
+         defaults to false if there is any possibility that a context could match a comment or PI
+         err on the side of caution, a context of *[.='('] would cause this param to default to false
+         even though ( is in a string, but node() comment() and processing-instruction()  all have a (
+-->
+<xsl:param name="only-child-elements">
+  <xsl:choose>
+    <xsl:when test="//iso:rule[contains(@context,'(')]">false</xsl:when>
+    <xsl:otherwise>true</xsl:otherwise>
+  </xsl:choose>
+</xsl:param>
+
+<!-- DPC set to true if contexts should be checked on text nodes (if only-child-elements is false)
+         THIS IS NON CONFORMANT BEHAVIOUR JUST FOR DISCUSSION OF A POSSIBLE CHANGE TO THE
+         SPECIFICATION. THIS PARAM SHOULD GO IF THE FINAL DECISION IS THAT THE SPEC DOES NOT CHANGE.
+	 Always defaults to false
+-->
+<xsl:param name="visit-text" select="'false'"/>
+
+<!-- DPC
+  When selecting contexts the specified behaviour is
+    @*|node()[not(self::text())]
+    The automatic settings may use
+      node()[not(self::text())]
+      @*|*
+      *
+  instead for schema for which they are equivalent.
+  If the params are set explicitly the above may be used, and also either of
+      @*
+      @*|node()
+   in all cases the result may not be equivalent, for example if you specify no attributes and the schema 
+   does have attribute contexts they will be silently ignored.
+
+  after testing it turns out that
+  node()[not(self::text())] is slower in saxon than *|comment()|processing-instruction() 
+  which I find a bit surprising but anyway I'll use the longer faster version.
+-->
+<xsl:variable name="context-xpath">
+  <xsl:if test="$attributes='true'">@*|</xsl:if>
+  <xsl:choose>
+    <xsl:when test="$only-child-elements='true'">*</xsl:when>
+    <xsl:when test="$visit-text='true'">node()</xsl:when>
+    <xsl:otherwise>*|comment()|processing-instruction()</xsl:otherwise>
+  </xsl:choose>
+</xsl:variable>
+
+<!-- DPC if this is set to 
+    '' use recursive templates to iterate over document tree,
+    'key' select  all contexts with a key rather than walking the tree explicitly in each mode
+    '//' select all contexts with // rather than walking the tree explicitly in each mode (XSLT2 only)
+-->
+<xsl:param name="select-contexts" select="''"/>
+
+
+<xsl:param name="output-encoding"/>
+<!-- e.g. saxon file.xml file.xsl "sch.exslt.imports=.../string.xsl;.../math.xsl" -->
+<xsl:param name="sch.exslt.imports"/>
+
+<!-- Set the language code for messages -->
+<xsl:param name="langCode">default</xsl:param>
+
+<xsl:param name="debug">false</xsl:param>
+
+
+<!-- Set the default for schematron-select-full-path, i.e. the notation for svrl's @location-->
+<xsl:param name="full-path-notation">1</xsl:param>
+
+<!-- Simple namespace check: report when old-namespace (sch:) elements have ISO-namespace (iso:) ancestors or descendants, then process the document -->
+<xsl:template match="/">
+    <xsl:if  test="//sch:*[ancestor::iso:* or descendant::iso:*]">
+	<xsl:message>Schema error: Schematron elements in old and new namespaces found</xsl:message>
+	<xsl:if test=" $debug = 'false' " /> <!-- NOTE(review): empty xsl:if, produces nothing as written -->
+    </xsl:if>
+
+    <xsl:apply-templates />
+</xsl:template>
+
+
+<!-- ============================================================== -->
+<!-- ISO SCHEMATRON SCHEMA ELEMENT  -->
+<!-- Not handled: Abstract patterns. A pre-processor is assumed. -->
+<!-- ============================================================== -->
+
+<!-- SCHEMA -->
+<!-- Default: no queryBinding, 'xslt', 'xpath', or the misspellings 'xslt1'/'XSLT'/'XSLT1' (reported, but still accepted) generate an XSLT 1.0 stylesheet -->
+<xsl:template match="iso:schema[not(@queryBinding) or @queryBinding='xslt' 
+     or @queryBinding='xslt1' or @queryBinding='XSLT' or @queryBinding='XSLT1'
+     or @queryBinding='xpath']">
+     <xsl:if test="
+	     @queryBinding='xslt1' or @queryBinding='XSLT' or @queryBinding='XSLT1'">
+	     <xsl:message>Schema error: in the queryBinding attribute, use 'xslt'</xsl:message>
+	</xsl:if>
+	<axsl:stylesheet>
+	    <xsl:apply-templates select="iso:ns"/>
+	    <!-- Handle the namespaces before the version attribute: reported to help SAXON -->
+	    <xsl:attribute name="version">1.0</xsl:attribute>
+	    
+		<xsl:apply-templates select="." mode="stylesheetbody"/>
+		<!-- was xsl:call-template name="stylesheetbody"/ -->
+	</axsl:stylesheet>
+</xsl:template>
+
+<!-- Using EXSLT with all modules (except function module: not applicable) -->
+<xsl:template match="iso:schema[@queryBinding='exslt']" priority="10">
+    <xsl:comment>This XSLT was automatically generated from a Schematron schema.</xsl:comment>
+	<axsl:stylesheet
+ 	  	xmlns:date="http://exslt.org/dates-and-times"
+ 	  	xmlns:dyn="http://exslt.org/dynamic"
+		xmlns:exsl="http://exslt.org/common"
+		xmlns:math="http://exslt.org/math"
+   		xmlns:random="http://exslt.org/random"
+  		xmlns:regexp="http://exslt.org/regular-expressions"
+   		xmlns:set="http://exslt.org/sets"
+   		xmlns:str="http://exslt.org/strings"
+   		extension-element-prefixes="date dyn exsl math random regexp set str" >
+	
+        <xsl:apply-templates select="iso:ns"/>
+	    <!-- Handle the namespaces before the version attribute: reported to help SAXON -->
+	    <xsl:attribute name="version">1.0</xsl:attribute>
+	    
+	    <xsl:apply-templates select="." mode="stylesheetbody"/>
+		<!-- was xsl:call-template name="stylesheetbody"/ -->
+	</axsl:stylesheet>
+</xsl:template>
+
+
+<!-- Fallback (priority -1): any other queryBinding is not supported, so terminate with an error message -->
+<xsl:template match="iso:schema" priority="-1">
+	<xsl:message terminate="yes" >Fail: This implementation of ISO Schematron does not work with 
+	schemas using the "<xsl:value-of select="@queryBinding"/>" query language.</xsl:message>        
+</xsl:template>
+
+<xsl:template match="*" mode="stylesheetbody">
+	<!--xsl:template name="stylesheetbody"-->
+    <xsl:comment>Implementers: please note that overriding process-prolog or process-root is 
+    the preferred method for meta-stylesheets to use where possible. </xsl:comment><xsl:text>&#10;</xsl:text>
+
+   <!-- These parameters may contain strings with the name and directory of the file being
+   validated. For convenience, if the caller only has the information in a single string,
+   that string could be put in fileDirParameter. The archives parameters are available
+   for ZIP archives.
+	-->
+
+	<axsl:param name="archiveDirParameter" />
+	<axsl:param name="archiveNameParameter" />
+	<axsl:param name="fileNameParameter" />
+	<axsl:param name="fileDirParameter" />
+
+    <xsl:call-template name="iso:exslt.add.imports" />
+    <xsl:text>&#10;&#10;</xsl:text><xsl:comment>PHASES</xsl:comment><xsl:text>&#10;</xsl:text>
+	<xsl:call-template name="handle-phase"/>
+    <xsl:text>&#10;&#10;</xsl:text><xsl:comment>PROLOG</xsl:comment><xsl:text>&#10;</xsl:text>
+	<xsl:call-template name="process-prolog"/>
+    <xsl:text>&#10;&#10;</xsl:text><xsl:comment>KEYS</xsl:comment><xsl:text>&#10;</xsl:text>
+	<xsl:apply-templates mode="do-keys"   select="xsl:key  "/>
+    <xsl:text>&#10;&#10;</xsl:text><xsl:comment>DEFAULT RULES</xsl:comment><xsl:text>&#10;</xsl:text>
+    <xsl:call-template name="generate-default-rules" />
+    <xsl:text>&#10;&#10;</xsl:text><xsl:comment>SCHEMA METADATA</xsl:comment><xsl:text>&#10;</xsl:text>
+    <xsl:call-template name="handle-root"/>
+    <xsl:text>&#10;&#10;</xsl:text><xsl:comment>SCHEMATRON PATTERNS</xsl:comment><xsl:text>&#10;</xsl:text>
+ 
+	<xsl:apply-templates select="*[not(self::iso:ns)] " />
+</xsl:template>
+ 
+    <xsl:template name="iso:exslt.add.imports"> <!-- Emit one xsl:import per ';'-separated URI in $imports (default: $sch.exslt.imports) -->
+      <xsl:param name="imports" select="$sch.exslt.imports"/>
+      <xsl:choose>
+        <xsl:when test="contains($imports, ';')"> <!-- import the part before the first ';', then recurse on the remainder -->
+          <axsl:import href="{ substring-before($imports, ';') }"/>
+          <xsl:call-template name="iso:exslt.add.imports">
+            <xsl:with-param name="imports"  select="substring-after($imports, ';')"/>
+          </xsl:call-template>
+        </xsl:when>
+        <xsl:when test="$imports"> <!-- no ';' left: import the remaining non-empty value; an empty value emits nothing -->
+          <axsl:import href="{ $imports }"/>
+        </xsl:when>
+      </xsl:choose>
+    </xsl:template>
+
+<xsl:template name="handle-phase" > <!-- Emit a message when $phase is not '#ALL' and no iso:phase child of the current node has that id -->
+	<xsl:if test="not(normalize-space( $phase ) = '#ALL')">
+	  <xsl:if test="not(iso:phase[@id = normalize-space( $phase )])">
+		  <xsl:message>Phase Error: no phase with name <xsl:value-of select="normalize-space( $phase )"
+		  /> has been defined.</xsl:message>
+	  </xsl:if>
+     </xsl:if>
+</xsl:template>
+
+<xsl:template name="generate-default-rules">
+		<xsl:text>&#10;&#10;</xsl:text>
+		<xsl:comment>MODE: SCHEMATRON-SELECT-FULL-PATH</xsl:comment><xsl:text>&#10;</xsl:text>
+		<xsl:comment>This mode can be used to generate an ugly though full XPath for locators</xsl:comment><xsl:text>&#10;</xsl:text>
+   		<axsl:template match="*" mode="schematron-select-full-path">
+   			<xsl:choose>
+   				<xsl:when test=" $full-path-notation = '1' ">
+   					<!-- Use for computers, but rather unreadable for humans -->
+					<axsl:apply-templates select="." mode="schematron-get-full-path"/>
+				</xsl:when>
+   				<xsl:when test=" $full-path-notation = '2' ">
+   					<!-- Use for humans, but no good for paths unless namespaces are known out-of-band -->
+					<axsl:apply-templates select="." mode="schematron-get-full-path-2"/>
+				</xsl:when>
+   				<xsl:when test=" $full-path-notation = '3' "> 
+   					<!-- Obsolescent. Use for humans, but no good for paths unless namespaces are known out-of-band -->
+					<axsl:apply-templates select="." mode="schematron-get-full-path-3"/>
+				</xsl:when>
+
+                   <xsl:otherwise >
+                       <!-- Use for computers, but rather unreadable for humans -->
+                    <axsl:apply-templates select="." mode="schematron-get-full-path"/>
+                </xsl:otherwise>
+			</xsl:choose>
+		</axsl:template>
+	
+
+		<xsl:text>&#10;&#10;</xsl:text>
+		<xsl:comment>MODE: SCHEMATRON-FULL-PATH</xsl:comment><xsl:text>&#10;</xsl:text>
+		<xsl:comment>This mode can be used to generate an ugly though full XPath for locators</xsl:comment><xsl:text>&#10;</xsl:text>
+   		<axsl:template match="*" mode="schematron-get-full-path">
+			<axsl:apply-templates select="parent::*" mode="schematron-get-full-path"/>
+			
+			<!-- XSLT1 syntax -->
+
+			<axsl:text>/</axsl:text>
+			<axsl:choose>
+			<axsl:when test="namespace-uri()=''">
+			<axsl:value-of select="name()"/>
+			<axsl:variable name="p_1" select="1+
+			count(preceding-sibling::*[name()=name(current())])" />
+		<axsl:if test="$p_1&gt;1 or following-sibling::*[name()=name(current())]">
+		  <xsl:text/>[<axsl:value-of select="$p_1"/>]<xsl:text/>
+		</axsl:if>
+		</axsl:when>
+		<axsl:otherwise>
+		<axsl:text>*[local-name()='</axsl:text>
+		<axsl:value-of select="local-name()"/><axsl:text>' and namespace-uri()='</axsl:text>
+		<axsl:value-of select="namespace-uri()"/>
+		<axsl:text>']</axsl:text>
+		<axsl:variable name="p_2" select="1+
+		count(preceding-sibling::*[local-name()=local-name(current())])" />
+		<axsl:if test="$p_2&gt;1 or following-sibling::*[local-name()=local-name(current())]">
+		  <xsl:text/>[<axsl:value-of select="$p_2"/>]<xsl:text/>
+		</axsl:if>
+		</axsl:otherwise>
+		</axsl:choose> 
+       	 	</axsl:template>
+       	 	
+       	 	
+		<axsl:template match="@*" mode="schematron-get-full-path">
+		
+			<!-- XSLT1 syntax -->
+		<axsl:text>/</axsl:text>
+		<axsl:choose>
+		<axsl:when test="namespace-uri()=''">@<axsl:value-of
+		select="name()"/></axsl:when>
+		<axsl:otherwise>
+		<axsl:text>@*[local-name()='</axsl:text>
+		<axsl:value-of select="local-name()"/>
+		<axsl:text>' and namespace-uri()='</axsl:text>
+		<axsl:value-of select="namespace-uri()"/>
+		<axsl:text>']</axsl:text>
+		</axsl:otherwise>
+		</axsl:choose>   
+
+		</axsl:template>
+	
+	
+	<xsl:text>&#10;&#10;</xsl:text>
+	
+	<xsl:comment>MODE: SCHEMATRON-FULL-PATH-2</xsl:comment>
+	<xsl:text>&#10;</xsl:text>
+	<xsl:comment>This mode can be used to generate prefixed XPath for humans</xsl:comment>
+	<xsl:text>&#10;</xsl:text>
+	<!--simplify the error messages by using the namespace prefixes of the
+     instance rather than the generic namespace-uri-styled qualification-->
+	<axsl:template match="node() | @*" mode="schematron-get-full-path-2">
+	<!--report the element hierarchy-->
+		<axsl:for-each select="ancestor-or-self::*">
+			<axsl:text>/</axsl:text>
+			<axsl:value-of select="name(.)"/>
+			<axsl:if test="preceding-sibling::*[name(.)=name(current())]">
+				<axsl:text>[</axsl:text>
+				<axsl:value-of
+					select="count(preceding-sibling::*[name(.)=name(current())])+1"/>
+				<axsl:text>]</axsl:text>
+			</axsl:if>
+		</axsl:for-each>
+		<!--report the attribute-->
+		<axsl:if test="not(self::*)">
+			<axsl:text/>/@<axsl:value-of select="name(.)"/>
+		</axsl:if>
+	</axsl:template>
+
+		<xsl:text>&#10;&#10;</xsl:text>
+		<xsl:comment>MODE: GENERATE-ID-FROM-PATH </xsl:comment><xsl:text>&#10;</xsl:text>
+		<!-- repeatable-id maker derived from Francis Norton's. -->
+		<!-- use this if you need generate ids in separate passes,
+		     because generate-id() is not guaranteed to produce the same
+		     results each time. These ids are not XML names but closer to paths. -->
+		<axsl:template match="/" mode="generate-id-from-path"/>
+		<axsl:template match="text()" mode="generate-id-from-path">
+			<axsl:apply-templates select="parent::*" mode="generate-id-from-path"/>
+			<axsl:value-of select="concat('.text-', 1+count(preceding-sibling::text()), '-')"/>
+		</axsl:template>
+		<axsl:template match="comment()" mode="generate-id-from-path">
+			<axsl:apply-templates select="parent::*" mode="generate-id-from-path"/>
+			<axsl:value-of select="concat('.comment-', 1+count(preceding-sibling::comment()), '-')"/>
+		</axsl:template>
+		<axsl:template match="processing-instruction()" mode="generate-id-from-path">
+			<axsl:apply-templates select="parent::*" mode="generate-id-from-path"/>
+			<axsl:value-of 
+			select="concat('.processing-instruction-', 1+count(preceding-sibling::processing-instruction()), '-')"/>
+		</axsl:template>
+		<axsl:template match="@*" mode="generate-id-from-path">
+			<axsl:apply-templates select="parent::*" mode="generate-id-from-path"/>
+			<axsl:value-of select="concat('.@', name())"/>
+		</axsl:template>
+		<axsl:template match="*" mode="generate-id-from-path" priority="-0.5">
+			<axsl:apply-templates select="parent::*" mode="generate-id-from-path"/>
+			<axsl:text>.</axsl:text>
+<!--
+			<axsl:choose>
+				<axsl:when test="count(. | ../namespace::*) = count(../namespace::*)">
+					<axsl:value-of select="concat('.namespace::-',1+count(namespace::*),'-')"/>
+				</axsl:when>
+				<axsl:otherwise>
+-->
+				<axsl:value-of 
+				select="concat('.',name(),'-',1+count(preceding-sibling::*[name()=name(current())]),'-')"/>
+<!--
+				</axsl:otherwise>
+			</axsl:choose>
+-->
+		</axsl:template>
+		
+		
+	<xsl:comment>MODE: SCHEMATRON-FULL-PATH-3</xsl:comment>
+	
+	<xsl:text>&#10;</xsl:text>
+	<xsl:comment>This mode can be used to generate prefixed XPath for humans 
+	(Top-level element has index)</xsl:comment>
+	<xsl:text>&#10;</xsl:text>
+	<!--simplify the error messages by using the namespace prefixes of the
+     instance rather than the generic namespace-uri-styled qualification-->
+	<axsl:template match="node() | @*" mode="schematron-get-full-path-3">
+	<!--report the element hierarchy-->
+		<axsl:for-each select="ancestor-or-self::*">
+			<axsl:text>/</axsl:text>
+			<axsl:value-of select="name(.)"/>
+			<axsl:if test="parent::*">
+				<axsl:text>[</axsl:text>
+				<axsl:value-of
+					select="count(preceding-sibling::*[name(.)=name(current())])+1"/>
+				<axsl:text>]</axsl:text>
+			</axsl:if>
+		</axsl:for-each>
+		<!--report the attribute-->
+		<axsl:if test="not(self::*)">
+			<axsl:text/>/@<axsl:value-of select="name(.)"/>
+		</axsl:if>
+	</axsl:template>
+
+		<xsl:text>&#10;&#10;</xsl:text>
+		<xsl:comment>MODE: GENERATE-ID-2 </xsl:comment><xsl:text>&#10;</xsl:text>
+		<!-- repeatable-id maker from David Carlisle. -->
+		<!-- use this if you need generate IDs in separate passes,
+		     because generate-id() is not guaranteed to produce the same
+		     results each time. These IDs are well-formed XML NMTOKENS -->
+	<axsl:template match="/" mode="generate-id-2">U</axsl:template>
+
+	<axsl:template match="*" mode="generate-id-2" priority="2">
+		<axsl:text>U</axsl:text>
+		<axsl:number level="multiple" count="*"/>
+	</axsl:template>
+
+	<axsl:template match="node()" mode="generate-id-2">
+		<axsl:text>U.</axsl:text>
+		<axsl:number level="multiple" count="*"/>
+		<axsl:text>n</axsl:text>
+		<axsl:number count="node()"/>
+	</axsl:template>
+
+	<axsl:template match="@*" mode="generate-id-2">
+		<axsl:text>U.</axsl:text>
+		<axsl:number level="multiple" count="*"/>
+		<axsl:text>_</axsl:text>
+		<axsl:value-of select="string-length(local-name(.))"/>
+		<axsl:text>_</axsl:text>
+		<axsl:value-of select="translate(name(),':','.')"/>
+	</axsl:template> 
+
+
+		<xsl:comment>Strip characters</xsl:comment>
+		<axsl:template match="text()" priority="-1" />
+			
+  </xsl:template>
+
+ <xsl:template name="handle-root">
+		<!-- Process the top-level element -->
+		<axsl:template match="/">
+			<xsl:call-template name="process-root">
+				<xsl:with-param 	
+				name="title" select="(@id | iso:title)[last()]"/>
+				<xsl:with-param name="version" select="'iso'" />
+				<xsl:with-param name="schemaVersion" select="@schemaVersion" />
+				<xsl:with-param name="queryBinding" select="@queryBinding" />
+				<xsl:with-param name="contents">
+					<xsl:apply-templates mode="do-all-patterns"/>
+				</xsl:with-param>
+				
+				<!-- "Rich" properties -->
+				<xsl:with-param name="fpi" select="@fpi"/>
+				<xsl:with-param name="icon" select="@icon"/>
+				<xsl:with-param name="id" select="@id"/>
+				<xsl:with-param name="lang" select="@xml:lang"/>
+				<xsl:with-param name="see" select="@see" />
+				<xsl:with-param name="space" select="@xml:space" />
+				
+				
+				<!-- Non-standard extensions not part of the API yet -->
+				<xsl:with-param name="action" select="@action" />
+			</xsl:call-template>
+		</axsl:template>
+ 
+      
+</xsl:template>
+
+<!-- ============================================================== -->
+<!-- ISO SCHEMATRON ELEMENTS -->
+<!-- ============================================================== -->
+
+	<!-- ISO ACTIVE: checks only, no output. Reports a missing @pattern, and a @pattern that names no iso:pattern two levels up (skipped when an iso:include is present there) -->
+	<xsl:template match="iso:active">
+                <xsl:if test="not(@pattern)">
+                    <xsl:message>Markup Error: no pattern attribute in &lt;active></xsl:message>
+                </xsl:if>
+
+                <xsl:if test="not(../../iso:pattern[@id = current()/@pattern])
+                and not(../../iso:include)">
+                           <xsl:message>Reference Error: the pattern  "<xsl:value-of select="@pattern"
+						   />" has been activated but is not declared</xsl:message>
+                </xsl:if>
+        </xsl:template>
+
+	<!-- ISO ASSERT and REPORT -->
+	<xsl:template match="iso:assert">
+  <!-- Generates an axsl:choose: empty when the assert's @test holds, otherwise the output of process-assert -->
+                <xsl:if test="not(@test)">
+                    <xsl:message>Markup Error: no test attribute in &lt;assert></xsl:message>
+                </xsl:if>
+        <xsl:text>&#10;&#10;		</xsl:text>
+		<xsl:comment>ASSERT <xsl:value-of select="@role" /> </xsl:comment><xsl:text>&#10;</xsl:text>      
+	
+		<axsl:choose>
+			<axsl:when test="{@test}"/>
+			<axsl:otherwise>
+				<xsl:call-template name="process-assert">
+					<xsl:with-param name="test" select="normalize-space(@test)" />
+					<xsl:with-param name="diagnostics" select="@diagnostics"/>
+					<xsl:with-param name="flag" select="@flag"/>
+					
+					<!-- "Rich" properties -->
+					<xsl:with-param name="fpi" select="@fpi"/>
+					<xsl:with-param name="icon" select="@icon"/>
+					<xsl:with-param name="id" select="@id"/>
+					<xsl:with-param name="lang" select="@xml:lang"/>
+					<xsl:with-param name="see" select="@see" />
+					<xsl:with-param name="space" select="@xml:space" />
+					
+					<!-- "Linking" properties -->
+					<xsl:with-param name="role" select="@role" />
+					<xsl:with-param name="subject" select="@subject" />
+				</xsl:call-template>
+ 			
+			</axsl:otherwise>
+		</axsl:choose>
+	</xsl:template>
+	<xsl:template match="iso:report">
+		 
+                <xsl:if test="not(@test)">
+                    <xsl:message>Markup Error: no test attribute in &lt;report></xsl:message>
+                </xsl:if>
+                
+        <xsl:text>&#10;&#10;		</xsl:text>
+		<xsl:comment>REPORT <xsl:value-of select="@role" /> </xsl:comment><xsl:text>&#10;</xsl:text>      
+	
+		<axsl:if test="{@test}">
+		
+			<xsl:call-template name="process-report">
+				<xsl:with-param name="test" select="normalize-space(@test)" />
+				<xsl:with-param name="diagnostics" select="@diagnostics"/>
+					<xsl:with-param name="flag" select="@flag"/>
+					
+					<!-- "Rich" properties -->
+					<xsl:with-param name="fpi" select="@fpi"/>
+					<xsl:with-param name="icon" select="@icon"/>
+					<xsl:with-param name="id" select="@id"/>
+					<xsl:with-param name="lang" select="@xml:lang"/>
+					<xsl:with-param name="see" select="@see" />
+					<xsl:with-param name="space" select="@xml:space" />
+					
+					<!-- "Linking" properties -->
+					<xsl:with-param name="role" select="@role" />
+					<xsl:with-param name="subject" select="@subject" />
+			</xsl:call-template>
+				
+		</axsl:if>
+	</xsl:template>
+
+
+	<!-- ISO DIAGNOSTIC -->
+	<!-- We use a mode here to maintain backwards compatibility, instead of adding it
+	     to the other mode.
+	-->
+	<xsl:template match="iso:diagnostic" mode="check-diagnostics">
+              <xsl:if test="not(@id)">
+                    <xsl:message>Markup Error: no id attribute in &lt;diagnostic></xsl:message>
+               </xsl:if>
+    </xsl:template>
+    
+    <xsl:template match="iso:diagnostic"  >
+                <xsl:call-template name="process-diagnostic">
+                
+					<!-- "Rich" properties -->
+					<xsl:with-param name="fpi" select="@fpi"/>
+					<xsl:with-param name="icon" select="@icon"/>
+					<xsl:with-param name="id" select="@id"/>
+					<xsl:with-param name="lang" select="@xml:lang"/>
+					<xsl:with-param name="see" select="@see" />
+					<xsl:with-param name="space" select="@xml:space" />
+               </xsl:call-template>
+        </xsl:template>
+
+	<!-- ISO DIAGNOSTICS -->
+	<xsl:template match="iso:diagnostics" >
+		<xsl:apply-templates mode="check-diagnostics" select="*" />
+	</xsl:template>
+
+	<!-- ISO DIR -->
+	<xsl:template match="iso:dir"  mode="text" >
+		<xsl:call-template name="process-dir">
+			<xsl:with-param name="value" select="@value"/>
+		</xsl:call-template>
+	</xsl:template>
+
+	<!-- ISO EMPH -->
+	<xsl:template match="iso:emph"  mode="text">
+	 
+		<xsl:call-template name="process-emph"/> 
+
+	</xsl:template>
+
+	<!-- ISO EXTENDS: validate the @rule reference, then apply the referenced rule(s) in mode "extends" -->
+	<xsl:template match="iso:extends">
+		<xsl:if test="not(@rule)">
+                   <xsl:message>Markup Error: no rule attribute in &lt;extends></xsl:message>
+                </xsl:if>
+     		<xsl:if test="not(//iso:rule[@abstract='true'][@id= current()/@rule] )">
+                    <xsl:message>Reference Error: the abstract rule  "<xsl:value-of select="@rule"
+					/>" has been referenced but is not declared</xsl:message>
+                </xsl:if>
+	        <xsl:call-template name="IamEmpty" />
+<!-- Note: the lookup below matches any iso:rule with this id, abstract or not -->
+  		<xsl:if test="//iso:rule[@id=current()/@rule]">
+    			<xsl:apply-templates select="//iso:rule[@id=current()/@rule]"
+				mode="extends"/>
+  		</xsl:if>
+
+	</xsl:template>
+
+	<!-- KEY: ISO has no KEY -->
+	<!-- NOTE: 
+	     Key has had a checkered history. Schematron 1.0 allowed it in certain places, but
+	     users came up with a different location, which has now been adopted. 
+	     
+	     XT, the early XSLT processor, did not implement key and died when it was present. 
+	     So there are some versions of the Schematron skeleton for XT that strip out all
+	     key elements.
+	     
+	     Xalan (e.g. Xalan4C 1.0 and a Xalan4J) also had a funny. A fix involved making 
+	     a top-level parameter called $hiddenKey and then using that instead of matching
+	     "key". This has been removed.
+	-->
+	<xsl:template  match="xsl:key" mode="do-keys" > <!-- Validate a key declaration and emit the corresponding xsl:key in the generated stylesheet -->
+	     <xsl:if test="not(@name)">
+              <xsl:message>Markup Error: no name attribute in &lt;key></xsl:message>
+         </xsl:if>
+                <xsl:if test="not(@path) and not(@use)">
+                    <xsl:message>Markup Error: no path or use attribute in &lt;key></xsl:message>
+                </xsl:if>         
+	     <xsl:choose>
+	     	<xsl:when test="parent::iso:rule "> <!-- key inside a rule: the rule's @context becomes the key's match pattern -->
+	        <xsl:call-template name="IamEmpty" />
+	       <xsl:choose>
+	       	<xsl:when test="@path">
+				<axsl:key match="{../@context}" name="{@name}" use="{@path}"/>
+			</xsl:when>
+			<xsl:otherwise>
+							<axsl:key match="{../@context}" name="{@name}" use="{@use}"/>
+			</xsl:otherwise>
+			</xsl:choose>	
+		</xsl:when>
+		<xsl:otherwise> <!-- key elsewhere: must carry its own @match; all attributes are copied through -->
+                <xsl:if test="not(@match) ">
+                    <xsl:message>Markup Error: no match attribute in &lt;key></xsl:message>
+                </xsl:if>   		
+			<axsl:key>
+      			<xsl:copy-of select="@*"/>
+    		</axsl:key>	
+		</xsl:otherwise>
+		</xsl:choose>
+	</xsl:template>
+
+	<xsl:template match="xsl:key "  /><!-- swallow -->
+
+	<xsl:template match="iso:key "  >
+		<xsl:message>Schema error: The key element is not in the ISO Schematron namespace. Use the XSLT namespace.</xsl:message>
+    </xsl:template>
+
+   <!-- ISO INCLUDE -->
+   <!-- This is only a fallback. Include really needs to have been done before this as a separate pass.-->
+
+   <xsl:template match="iso:include[not(normalize-space(@href))]"
+	   priority="1">
+	<xsl:if test=" $debug = 'false' ">
+		<xsl:message terminate="yes">Schema error: Empty href= attribute for include directive.</xsl:message>
+	</xsl:if>
+
+   </xsl:template>
+
+   <!-- Extend the URI syntax to allow # references -->
+   <!-- Add experimental support for simple containers like  /xxx:xxx/iso:pattern to allow better includes -->
+   <!-- General include handler. @href is split at the first '#' into a document
+        URI and an optional fragment id; templates are then applied (default mode)
+        to the selected ISO elements of the referenced document. -->
+   <xsl:template match="iso:include">
+       <!-- appending '#' before substring-before() keeps an href without '#' whole -->
+       <xsl:variable name="document-uri" select="substring-before(concat(@href,'#'), '#')"/>
+       <xsl:variable name="fragment-id" select="substring-after(@href, '#')"/>
+       
+       <xsl:choose> 
+          
+          <!-- nothing before and nothing after the '#', e.g. href="#" -->
+          <xsl:when test="string-length( $document-uri ) = 0 and string-length( $fragment-id ) = 0" >
+          	<xsl:message>Error: Impossible URL in Schematron include</xsl:message>
+          </xsl:when> 
+          
+          <!-- fragment given: select every ISO element of that document whose @id matches -->
+          <xsl:when test="string-length( $fragment-id ) &gt; 0">
+              <!-- the second argument (/) supplies the node whose base URI is used to resolve a relative URI -->
+              <xsl:variable name="theDocument_1" select="document( $document-uri,/ )" />
+              <xsl:variable name="theFragment_1" select="$theDocument_1//iso:*[@id= $fragment-id ]" />
+              <!-- only a message is issued for a whole schema; processing continues -->
+              <xsl:if test=" $theFragment_1/self::iso:schema ">
+                 <xsl:message>Schema error: Use include to include fragments, not a whole schema</xsl:message>
+              </xsl:if>
+              <xsl:apply-templates select=" $theFragment_1"/>
+		   </xsl:when>
+		  
+		   <!-- no fragment: select the document element when it is an ISO element, plus
+		        the ISO children of the document element (simple container support) -->
+		   <xsl:otherwise>
+              <xsl:variable name="theDocument_2" select="document( $document-uri,/ )" />
+              <xsl:variable name="theFragment_2" select="$theDocument_2/iso:*" />
+              <xsl:variable name="theContainedFragments" select="$theDocument_2/*/iso:*" />
+              <xsl:if test=" $theFragment_2/self::iso:schema or $theContainedFragments/self::iso:schema">
+                 <xsl:message>Schema error: Use include to include fragments, not a whole schema</xsl:message>
+              </xsl:if>
+       		<xsl:apply-templates select="$theFragment_2 | $theContainedFragments "/>
+       	   </xsl:otherwise>
+       </xsl:choose>
+   </xsl:template>
+
+   <!-- This is to handle the particular case of including patterns -->  
+   <!-- Same URI handling as the unmoded iso:include template, but the selected
+        elements are processed in mode do-all-patterns. -->
+   <xsl:template match="iso:include" mode="do-all-patterns">
+       <!-- appending '#' before substring-before() keeps an href without '#' whole -->
+       <xsl:variable name="document-uri" select="substring-before(concat(@href,'#'), '#')"/>
+       <xsl:variable name="fragment-id" select="substring-after(@href, '#')"/>
+ 
+       <xsl:choose> 
+          
+          <!-- nothing before and nothing after the '#', e.g. href="#" -->
+          <xsl:when test="string-length( $document-uri ) = 0 and string-length( $fragment-id ) = 0" >
+          	<xsl:message>Error: Impossible URL in Schematron include</xsl:message>
+          </xsl:when> 
+          
+          <!-- fragment given: select every ISO element of that document whose @id matches -->
+          <xsl:when test="string-length( $fragment-id ) &gt; 0">
+              <xsl:variable name="theDocument_1" select="document( $document-uri,/ )" />
+              <xsl:variable name="theFragment_1" select="$theDocument_1//iso:*[@id= $fragment-id ]" />
+              <!-- only a message is issued for a whole schema; processing continues -->
+              <xsl:if test=" $theFragment_1/self::iso:schema ">
+                 <xsl:message>Schema error: Use include to include fragments, not a whole schema</xsl:message>
+              </xsl:if>
+              <xsl:apply-templates select=" $theFragment_1" mode="do-all-patterns"/>
+		   </xsl:when>
+		  
+		   <xsl:otherwise>
+		   	  <!-- Import the top-level element if it is in schematron namespace,
+		   	  or its children otherwise, to allow a simple containment mechanism. -->
+              <xsl:variable name="theDocument_2" select="document( $document-uri,/ )" />
+              <xsl:variable name="theFragment_2" select="$theDocument_2/iso:*" />
+              <xsl:variable name="theContainedFragments" select="$theDocument_2/*/iso:*" />
+              <xsl:if test=" $theFragment_2/self::iso:schema or $theContainedFragments/self::iso:schema">
+                 <xsl:message>Schema error: Use include to include fragments, not a whole schema</xsl:message>
+              </xsl:if>
+       		<xsl:apply-templates select="$theFragment_2 | $theContainedFragments "
+       		mode="do-all-patterns" />
+       	   </xsl:otherwise>
+       </xsl:choose>
+   </xsl:template>
+   
+	<!-- ISO LET -->
+	<!-- Translates iso:let into the generated stylesheet: a let whose parent is
+	     iso:schema becomes a parameter named @name, any other let becomes a
+	     variable named @name. A warning is issued when the schema uses the
+	     "xpath" query binding. -->
+	<xsl:template match="iso:let" >
+	  <xsl:if test="ancestor::iso:schema[@queryBinding='xpath']">
+                    <xsl:message>Warning: Variables should not be used with the "xpath" query language binding.</xsl:message>
+       </xsl:if>
+		
+       <!-- lets at the top-level are implemented as parameters -->
+ 
+       	<xsl:choose>
+       		<xsl:when test="parent::iso:schema">
+       			<!-- it is an error to have an empty param/@select because an XPath is expected,
+       			     so select is generated only for a non-empty @value. It must not also be
+       			     written on the literal element, otherwise an empty select would still be output. -->
+	      		 <axsl:param name="{@name}">
+	      		 		<xsl:if test="string-length(@value) &gt; 0">
+	      		 			<xsl:attribute name="select"><xsl:value-of select="@value"/></xsl:attribute>
+	      		 		</xsl:if>
+	      		 </axsl:param> 
+       		</xsl:when>
+       		<xsl:otherwise>
+				<axsl:variable name="{@name}" select="{@value}"/>
+			</xsl:otherwise>
+		</xsl:choose>
+		  
+	</xsl:template>	
+
+	<!-- ISO NAME -->
+	<!-- Hands an XPath name() expression to the process-name hook: name(@path)
+	     when a path attribute is present, name(.) otherwise. Afterwards warns
+	     (via IamEmpty) if the element has child elements. -->
+	<xsl:template match="iso:name" mode="text">
+		<xsl:choose>
+			<xsl:when test="@path">
+				<xsl:call-template name="process-name">
+					<xsl:with-param name="name" select="concat('name(',@path,')')"/>
+				</xsl:call-template>
+			</xsl:when>
+			<xsl:otherwise>
+				<xsl:call-template name="process-name">
+					<xsl:with-param name="name" select="'name(.)'"/>
+				</xsl:call-template>
+			</xsl:otherwise>
+		</xsl:choose>
+		<xsl:call-template name="IamEmpty" />
+	</xsl:template>
+
+	<!-- ISO NS -->
+	<!-- Namespace handling in XSLT is quite tricky and implementation dependent -->
+	<!-- Default mode: delegates to the handle-namespace named template -->
+	<xsl:template match="iso:ns">
+ 		<xsl:call-template name="handle-namespace" />
+	</xsl:template>
+
+    <!-- This template is just to provide the API hook -->
+	<!-- It reports a missing uri or prefix attribute, warns (via IamEmpty) about
+	     child elements, and passes @prefix and @uri to the process-ns hook. -->
+	<xsl:template match="iso:ns"  mode="do-all-patterns" >
+               <xsl:if test="not(@uri)">
+                    <xsl:message>Markup Error: no uri attribute in &lt;ns></xsl:message>
+                </xsl:if>
+               <xsl:if test="not(@prefix)">
+                    <xsl:message>Markup Error: no prefix attribute in &lt;ns></xsl:message>
+                </xsl:if>
+	        <xsl:call-template name="IamEmpty" />
+		<xsl:call-template name="process-ns" >
+			<xsl:with-param name="prefix" select="@prefix"/>
+			<xsl:with-param name="uri" select="@uri"/>
+		</xsl:call-template>
+	</xsl:template>
+
+	<!-- ISO P -->
+	<!-- Paragraphs directly under iso:schema (mode do-schema-p) and directly under
+	     iso:pattern (mode do-pattern-p) are passed to the process-p hook with their
+	     class, icon, id and xml:lang attributes. -->
+	<xsl:template match="iso:schema/iso:p " mode="do-schema-p" >
+		<xsl:call-template name="process-p">
+			<xsl:with-param name="class" select="@class"/>
+			<xsl:with-param name="icon" select="@icon"/>
+			<xsl:with-param name="id" select="@id"/>
+			<xsl:with-param name="lang" select="@xml:lang"/>
+		</xsl:call-template>
+	</xsl:template>
+	<xsl:template match="iso:pattern/iso:p " mode="do-pattern-p" >
+		<xsl:call-template name="process-p">
+			<xsl:with-param name="class" select="@class"/>
+			<xsl:with-param name="icon" select="@icon"/>
+			<xsl:with-param name="id" select="@id"/>
+			<xsl:with-param name="lang" select="@xml:lang"/>
+		</xsl:call-template>
+	</xsl:template>
+	
+    <!-- Currently, iso:p in other position are not passed through to the API -->
+	<!-- Both templates below are empty, so in the default mode iso:p produces no output -->
+	<xsl:template match="iso:phase/iso:p" />
+	<xsl:template match="iso:p " priority="-1" />
+
+	<!-- ISO PATTERN -->
+	<!-- Generates the code that runs one pattern: calls the process-pattern hook,
+	     then emits an apply-templates in the pattern's own mode. The mode name is
+	     "M" followed by the number of preceding siblings of the pattern. Nothing is
+	     generated unless $phase is '#ALL' or the phase named by $phase has an
+	     iso:active child referring to this pattern's id. -->
+	<xsl:template match="iso:pattern" mode="do-all-patterns">
+	<xsl:if test="($phase = '#ALL') 
+	or (../iso:phase[@id= $phase]/iso:active[@pattern= current()/@id])">
+		<xsl:call-template name="process-pattern">
+			<!-- the following select statement assumes that
+			@id | sch:title returns node-set in document order:
+			we want the title if it is there, otherwise the @id attribute -->
+			<xsl:with-param name="name" select="(@id | iso:title )[last()]"/>
+			<xsl:with-param name="is-a" select="''"/>
+			
+					<!-- "Rich" properties -->
+					<xsl:with-param name="fpi" select="@fpi"/>
+					<xsl:with-param name="icon" select="@icon"/>
+					<xsl:with-param name="id" select="@id"/>
+					<xsl:with-param name="lang" select="@xml:lang"/>
+					<xsl:with-param name="see" select="@see" />
+					<xsl:with-param name="space" select="@xml:space" />
+		</xsl:call-template>
+		<!-- $select-contexts decides which nodes the generated code visits:
+		     'key'  uses key M with this pattern's mode name as the key value;
+		     '//'   builds one union expression from every rule context of the pattern;
+		     otherwise templates are applied starting from the document root. -->
+		<xsl:choose>
+		  <xsl:when test="$select-contexts='key'">
+		    <axsl:apply-templates select="key('M','M{count(preceding-sibling::*)}')" mode="M{count(preceding-sibling::*)}"/>
+		  </xsl:when>
+		  <xsl:when test="$select-contexts='//'">
+		    <axsl:apply-templates mode="M{count(preceding-sibling::*)}">
+		      <!-- the select value has the form //((ctx1)|(ctx2)|...) -->
+		      <xsl:attribute name="select">
+			<xsl:text>//(</xsl:text>
+			<xsl:for-each select="iso:rule/@context">
+			  <xsl:text>(</xsl:text>
+			  <xsl:value-of select="."/>
+			  <xsl:text>)</xsl:text>
+			  <xsl:if test="position()!=last()">|</xsl:if>
+			</xsl:for-each>
+			<xsl:text>)</xsl:text>
+			<!-- text nodes are filtered out when $visit-text is 'false' -->
+			<xsl:if test="$visit-text='false'">[not(self::text())]</xsl:if>
+		      </xsl:attribute>
+		    </axsl:apply-templates>
+		  </xsl:when>
+		  <xsl:otherwise>
+		    <axsl:apply-templates select="/" mode="M{count(preceding-sibling::*)}"/>
+		  </xsl:otherwise>
+		</xsl:choose>
+        </xsl:if>
+	</xsl:template>
+	
+	<!-- Abstract patterns are not implemented here: only a message is issued,
+	     stating that they should have been removed by preprocessing. -->
+	<xsl:template match="iso:pattern[@abstract='true']">
+    
+             <xsl:message>Schema implementation error: This schema has abstract patterns, yet they are supposed to be preprocessed out already
+             </xsl:message>
+    </xsl:template>
+
+    <!-- Here is the template for the normal case of patterns -->
+	<!-- Generates the templates of a concrete pattern: an XML comment containing
+	     the pattern id and title, the output of the pattern's children, and, when
+	     $select-contexts is empty, two low-priority fallback templates in the
+	     pattern's mode (named "M" plus the count of preceding siblings). Skipped
+	     unless $phase is '#ALL' or the selected phase activates this pattern. -->
+	<xsl:template match="iso:pattern[not(@abstract='true')]">
+     
+      <xsl:if test="($phase = '#ALL') 
+	          or (../iso:phase[@id= $phase]/iso:active[@pattern= current()/@id])">
+ 
+		<xsl:text>&#10;&#10;</xsl:text>
+		<xsl:comment>PATTERN <xsl:value-of select="@id" /> <xsl:value-of select="iso:title" /> </xsl:comment><xsl:text>&#10;</xsl:text>      
+		<xsl:apply-templates />
+		
+		<!-- DPC select-contexts test -->
+		<xsl:if test="not($select-contexts)">
+		  <!-- fallback 1: text nodes not matched by a rule produce nothing -->
+		  <axsl:template match="text()" priority="-1" mode="M{count(preceding-sibling::*)}">
+		    <!-- strip characters -->
+		  </axsl:template>
+		  
+		  <!-- DPC introduce context-xpath variable -->
+		  <!-- fallback 2: any other node continues the traversal along $context-xpath -->
+		  <axsl:template match="@*|node()"
+				 priority="-2"
+				 mode="M{ count(preceding-sibling::*) }">
+		    <axsl:apply-templates select="{$context-xpath}" mode="M{count(preceding-sibling::*)}"/>
+		  </axsl:template>
+		</xsl:if>
+      </xsl:if>
+	</xsl:template>
+
+	<!-- ISO PHASE -->
+	<!-- Reports a phase without an id attribute, then processes the children -->
+	<xsl:template match="iso:phase" >
+                <xsl:if test="not(@id)">
+                    <xsl:message>Markup Error: no id attribute in &lt;phase></xsl:message>
+                </xsl:if>
+		  <xsl:apply-templates/>
+	</xsl:template>
+
+	<!-- ISO RULE -->
+	<!-- Generates one template per concrete rule. The generated template matches
+	     the rule's @context in the mode of the parent pattern ("M" plus the count
+	     of the parent's preceding siblings). Its priority is 1000 plus the number
+	     of following siblings of the rule, so a rule that comes earlier in its
+	     pattern gets a higher priority than a later one. -->
+	<xsl:template match="iso:rule[not(@abstract='true')] ">
+                <xsl:if test="not(@context)">
+                    <xsl:message>Markup Error: no context attribute in &lt;rule></xsl:message>
+                </xsl:if>
+        <xsl:text>&#10;&#10;	</xsl:text>
+		<xsl:comment>RULE <xsl:value-of select="@id" /> </xsl:comment><xsl:text>&#10;</xsl:text>   
+        <xsl:if test="iso:title">
+		    <xsl:comment><xsl:value-of select="iso:title" /></xsl:comment>
+		  </xsl:if>
+		<!-- DPC select-contexts -->
+		<!-- with the 'key' strategy every context node is indexed in key M under the pattern's mode name -->
+		<xsl:if test="$select-contexts='key'">
+		    <axsl:key name="M"
+			      match="{@context}" 
+			      use="'M{count(../preceding-sibling::*)}'"/>
+		</xsl:if>
+   
+	
+<!-- DPC priorities count up from 1000 not down from 4000 (templates in same priority order as before) -->
+		<axsl:template match="{@context}"
+		priority="{1000 + count(following-sibling::*)}" mode="M{count(../preceding-sibling::*)}">
+			<xsl:call-template name="process-rule">
+				<xsl:with-param name="context" select="@context"/>
+				
+					<!-- "Rich" properties -->
+					<xsl:with-param name="fpi" select="@fpi"/>
+					<xsl:with-param name="icon" select="@icon"/>
+					<xsl:with-param name="id" select="@id"/>
+					<xsl:with-param name="lang" select="@xml:lang"/>
+					<xsl:with-param name="see" select="@see" />
+					<xsl:with-param name="space" select="@xml:space" />
+					
+					<!-- "Linking" properties -->
+					<xsl:with-param name="role" select="@role" />
+					<xsl:with-param name="subject" select="@subject" />
+			</xsl:call-template>
+			<!-- the rule's children supply the body of the generated template -->
+			<xsl:apply-templates/>
+			<!-- DPC introduce context-xpath and select-contexts variables -->
+			<!-- when $select-contexts is empty the generated template continues the traversal itself -->
+			<xsl:if test="not($select-contexts)">
+			  <axsl:apply-templates select="{$context-xpath}" mode="M{count(../preceding-sibling::*)}"/>
+			</xsl:if>
+		</axsl:template>
+	</xsl:template>
+
+
+	<!-- ISO ABSTRACT RULE -->
+	<!-- Default mode: an abstract rule generates no output. Only markup checks are
+	     made: it must have an id and must not have a context attribute. -->
+	<xsl:template match="iso:rule[@abstract='true'] " >
+		<xsl:if test=" not(@id)">
+                    <xsl:message>Markup Error: no id attribute on abstract &lt;rule></xsl:message>
+                </xsl:if>
+ 		<xsl:if test="@context">
+                    <xsl:message>Markup Error: (2) context attribute on abstract &lt;rule></xsl:message>
+                </xsl:if>
+	</xsl:template>
+
+	<!-- Mode extends: the children of the abstract rule are processed at the
+	     point from which this mode was invoked; a context attribute is reported. -->
+	<xsl:template match="iso:rule[@abstract='true']"
+		mode="extends" >
+                <xsl:if test="@context">
+                    <xsl:message>Markup Error: context attribute on abstract &lt;rule></xsl:message>
+                </xsl:if>
+			<xsl:apply-templates/>
+	</xsl:template>
+
+	<!-- ISO SPAN -->
+	<!-- Passes the class attribute of a span to the process-span hook -->
+	<xsl:template match="iso:span" mode="text">
+		<xsl:call-template name="process-span">
+			<xsl:with-param name="class" select="@class"/>
+		</xsl:call-template>
+	</xsl:template>
+
+	<!-- ISO TITLE -->
+	
+	<!-- The schema's own title goes to the process-schema-title hook; the explicit
+	     priority of 1 makes this template win over the general iso:title one. -->
+	<xsl:template match="iso:schema/iso:title"  priority="1">
+	     <xsl:call-template name="process-schema-title" />
+	</xsl:template>
+ 
+	
+	<!-- Every other title goes to the process-title hook -->
+	<xsl:template match="iso:title" >
+	     <xsl:call-template name="process-title" />
+	</xsl:template>
+ 
+
+	<!-- ISO VALUE-OF -->
+	<!-- Passes the select expression of a value-of to the process-value-of hook.
+	     A missing select attribute is reported and '.' is used in its place.
+	     Child elements trigger the IamEmpty warning. -->
+	<xsl:template match="iso:value-of" mode="text" >
+        <xsl:if test="not(@select)">
+            <xsl:message>Markup Error: no select attribute in &lt;value-of></xsl:message>
+        </xsl:if>
+	    <xsl:call-template name="IamEmpty" />
+	         
+		<xsl:choose>
+			<xsl:when test="@select">
+				<xsl:call-template name="process-value-of">
+					<xsl:with-param name="select" select="@select"/>  
+				</xsl:call-template>
+			</xsl:when>
+			<!-- fallback after the markup error above: use the context node -->
+			<xsl:otherwise >
+				<xsl:call-template name="process-value-of">
+					<xsl:with-param name="select" select="'.'"/>
+				</xsl:call-template>
+			</xsl:otherwise>
+        </xsl:choose> 
+        
+	</xsl:template>
+
+
+<!-- ============================================================== -->
+<!-- DEFAULT TEXT HANDLING  -->
+<!-- ============================================================== -->
+	<!-- Text nodes of the schema produce no output in the default mode and in the
+	     modes do-keys, do-all-patterns, do-schema-p and do-pattern-p. In the modes
+	     text and inline-text their string value is output. -->
+	<xsl:template match="text()" priority="-1" mode="do-keys">
+		<!-- strip characters -->
+	</xsl:template>
+	<xsl:template match="text()" priority="-1" mode="do-all-patterns">
+		<!-- strip characters -->
+	</xsl:template>
+        <xsl:template match="text()" priority="-1" mode="do-schema-p">
+		<!-- strip characters -->
+	</xsl:template>
+        <xsl:template match="text()" priority="-1" mode="do-pattern-p">
+		<!-- strip characters -->
+	</xsl:template>
+	
+	<xsl:template match="text()" priority="-1">
+		<!-- Strip characters -->
+	</xsl:template>
+	
+	<xsl:template match="text()" mode="text">
+		<xsl:value-of select="."/>
+	</xsl:template>
+
+	<xsl:template match="text()" mode="inline-text">
+		<xsl:value-of select="."/>
+	</xsl:template>
+
+<!-- ============================================================== -->
+<!-- UTILITY TEMPLATES -->
+<!-- ============================================================== -->
+<!-- Issues a warning naming the current node when it has at least one child
+     element; called from templates for elements that should be empty. -->
+<xsl:template name="IamEmpty">
+	<xsl:if test="child::*">
+		<xsl:message>
+			<xsl:text>Warning: </xsl:text>
+			<xsl:value-of select="name()"/>
+			<xsl:text> must not contain any child elements</xsl:text>
+		</xsl:message>
+	</xsl:if>
+</xsl:template>
+
+<!-- Recursive helper. Parameter str is a space-separated list of diagnostic ids.
+     The first id is looked up and processed, then the template calls itself
+     with the rest of the list until nothing is left. -->
+<xsl:template name="diagnosticsSplit">
+  <!-- Process at the current point the first of the <diagnostic> elements
+       referred to parameter str, and then recurse -->
+  <xsl:param name="str"/>
+  <!-- start: the text before the first space, or all of str when it has no space -->
+  <xsl:variable name="start">
+    <xsl:choose>
+      <xsl:when test="contains($str,' ')">
+	<xsl:value-of  select="substring-before($str,' ')"/>
+      </xsl:when>
+      <xsl:otherwise><xsl:value-of select="$str"/></xsl:otherwise>
+    </xsl:choose>
+  </xsl:variable>
+
+  <!-- end: the text after the first space; empty when str has no space -->
+  <xsl:variable name="end">
+    <xsl:if test="contains($str,' ')">
+      <xsl:value-of select="substring-after($str,' ')"/>
+    </xsl:if>
+  </xsl:variable>
+
+  <!-- This works with all namespaces -->
+  <!-- a non-blank id with no matching diagnostic in the iso, sch or no-prefix form is reported -->
+  <xsl:if test="not(string-length(normalize-space($start)) = 0)
+  		and not(//iso:diagnostic[@id = $start])
+		and not(//sch:diagnostic[@id = $start]) 
+		and not(//diagnostic[@id = $start])">
+	<xsl:message>Reference error: A diagnostic "<xsl:value-of select="string($start)"
+	/>" has been referenced but is not declared</xsl:message>
+  </xsl:if>
+
+  <!-- a blank token (e.g. from consecutive spaces) is skipped -->
+  <xsl:if test="string-length(normalize-space($start)) > 0">
+     <xsl:text> </xsl:text>
+     <xsl:apply-templates 
+        select="//iso:diagnostic[@id = $start ]
+        	| //sch:diagnostic[@id = $start ] 
+            | //diagnostic[@id= $start ]"/>
+  </xsl:if>
+
+  <!-- recurse on the remaining ids -->
+  <xsl:if test="not($end='')">
+    <xsl:call-template name="diagnosticsSplit">
+      <xsl:with-param name="str" select="$end"/>
+    </xsl:call-template>
+  </xsl:if>
+</xsl:template>
+
+<!-- It would be nice to use this but xsl:namespace does not
+  allow a fallback -->
+<!--xsl:template name="handle-namespace" version="2.0">
+   <xsl:namespace name="{@prefix}" select="@uri">
+</xsl:template-->
+
+<!-- Called with an iso:ns element as the current node; uses its @prefix and @uri.
+     The branches are tried in this order:
+       1. exsl:node-set available: build a dummy element in the namespace and copy
+          the namespace node whose name equals the prefix;
+       2. prefix is 'xsl': output nothing;
+       3. the XSLT namespace URI with another prefix: terminate with a message;
+       4. otherwise: output a dummy attribute named prefix:dummy-for-xmlns in the
+          namespace (presumably so that the namespace gets declared in the output). -->
+<xsl:template name="handle-namespace">
+       <!-- experimental code from http://eccnet.eccnet.com/pipermail/schematron-love-in/2006-June/000104.html -->
+       <!-- Handle namespaces differently for exslt systems, msxml, and default, only using XSLT1 syntax -->
+       <!-- For more info see  http://fgeorges.blogspot.com/2007/01/creating-namespace-nodes-in-xslt-10.html -->
+       <xsl:choose>
+          <!-- The following code works for XSLT1 -->
+        <xsl:when test="function-available('exsl:node-set')">
+           <xsl:variable name="ns-dummy-elements">
+             <xsl:element name="{@prefix}:dummy" namespace="{@uri}"/>
+           </xsl:variable>
+       	   <xsl:variable name="p" select="@prefix"/>
+           <xsl:copy-of select="exsl:node-set($ns-dummy-elements)
+                                  /*/namespace::*[local-name()=$p]"/>
+         </xsl:when>        
+
+   			<!-- End XSLT1  code -->
+  
+        <!-- Not tested yet       
+    	<xsl:when test="function-available('msxsl:node-set')">
+      		<xsl:variable name="ns-dummy-elements">
+        		<xsl:element name="{ $prefix }:e" namespace="{ $uri }"/>
+      		</xsl:variable>
+      		<xsl:copy-of select="msxsl:node-set($ns-dummy-elements)/*/namespace::*"/>
+    	</xsl:when>
+        -->
+        
+        <xsl:when test="@prefix = 'xsl' ">
+           <!-- Do not generate dummy attributes with the xsl: prefix, as these
+                are errors against XSLT, because we presume that the output
+                stylesheet uses the xsl prefix. In any case, there would already
+                be a namespace declaration for the XSLT namespace generated
+                automatically, presumably using "xsl:".
+           -->
+        </xsl:when>
+        
+        <xsl:when test="@uri = 'http://www.w3.org/1999/XSL/Transform'">
+          <xsl:message terminate="yes">
+            <xsl:text>Using the XSLT namespace with a prefix other than "xsl" in </xsl:text>
+            <xsl:text>Schematron rules is not supported </xsl:text>
+            <xsl:text>in this processor: </xsl:text>
+            <xsl:value-of select="system-property('xsl:vendor')"/>
+          </xsl:message>
+        </xsl:when>
+
+        <xsl:otherwise>
+          <xsl:attribute name="{concat(@prefix,':dummy-for-xmlns')}" namespace="{@uri}" />
+           
+        </xsl:otherwise>
+      </xsl:choose>
+
+
+</xsl:template>
+
+<!-- ============================================================== -->
+<!-- UNEXPECTED ELEMENTS -->
+<!-- ============================================================== -->
+
+	<!-- Catch-all (priority -2) for elements in the ISO Schematron namespace that no
+	     other default-mode template handles: reports the element name. A ": "
+	     separator keeps the name from running into the preceding message text. -->
+	<xsl:template match="iso:*"  priority="-2">
+	   <xsl:message>
+			<xsl:text>Error: unrecognized element in ISO Schematron namespace: check spelling
+			and capitalization: </xsl:text>
+			<xsl:value-of select="name(.)"/>
+		</xsl:message>
+	</xsl:template>
+	
+	
+	<!-- Swallow old namespace elements: there is an upfront test for them elsewhere -->
+	<xsl:template match="sch:*"  priority="-2" />
+	
+	<!-- Lowest-priority catch-all for elements outside the handled namespaces:
+	     the element is copied to the output unless $allow-foreign is 'false',
+	     in which case only a warning naming it is issued. -->
+	<xsl:template match="*"  priority="-3">
+		<xsl:choose>
+			<xsl:when test="not( $allow-foreign = 'false' )">
+				<xsl:copy-of select="." />
+			</xsl:when>
+			<xsl:otherwise>
+				<xsl:message>
+					<xsl:text>Warning: unrecognized element </xsl:text>
+					<xsl:value-of select="name(.)"/>
+				</xsl:message>
+			</xsl:otherwise>
+		</xsl:choose>
+	</xsl:template>
+	
+	<!-- Mode text: ISO elements without a template of their own produce nothing -->
+	<xsl:template match="iso:*" mode="text" priority="-2" />
+	<!-- Mode text: any other element is copied to the output unless
+	     $allow-foreign is 'false', in which case only a warning is issued. -->
+	<xsl:template match="*" mode="text" priority="-3">
+		<xsl:choose>
+			<xsl:when test="not( $allow-foreign = 'false' )">
+				<xsl:copy-of select="." />
+			</xsl:when>
+			<xsl:otherwise>
+				<xsl:message>
+					<xsl:text>Warning: unrecognized element </xsl:text>
+					<xsl:value-of select="name(.)"/>
+				</xsl:message>
+			</xsl:otherwise>
+		</xsl:choose>
+	</xsl:template>
+
+<!-- ============================================================== -->
+<!-- DEFAULT NAMED TEMPLATES -->
+<!-- These are the actions that are performed unless overridden -->
+<!-- ============================================================== -->
+ 
+	<!-- Default process-prolog hook: produces no output -->
+	<xsl:template name="process-prolog"/>
+	<!-- no params -->
+
+	<!-- Default process-root hook: copies $contents to the output. All other
+	     parameters are declared but not used by this default implementation. -->
+	<xsl:template name="process-root">
+		<xsl:param name="contents"/>
+		<xsl:param name="id" />
+		<xsl:param name="version" />
+		<xsl:param name="schemaVersion" />
+		<xsl:param name="queryBinding" />
+		<xsl:param name="title" />
+
+
+		<!-- "Rich" parameters -->
+		<xsl:param name="fpi" />
+		<xsl:param name="icon" />
+		<xsl:param name="lang" />
+		<xsl:param name="see" />
+		<xsl:param name="space" />
+
+		<xsl:copy-of select="$contents"/>
+	</xsl:template>
+
+	<!-- Default process-assert hook: forwards $test (as parameter "pattern") and
+	     $role to process-message. The remaining parameters are declared but
+	     not used by this default implementation. -->
+	<xsl:template name="process-assert">
+
+		<xsl:param name="test"/>
+		<xsl:param name="diagnostics" />
+		<xsl:param name="id" />
+		<xsl:param name="flag" />
+
+           	<!-- "Linkable" parameters -->
+		<xsl:param name="role"/>
+		<xsl:param name="subject"/>
+
+		<!-- "Rich" parameters -->
+		<xsl:param name="fpi" />
+		<xsl:param name="icon" />
+		<xsl:param name="lang" />
+		<xsl:param name="see" />
+		<xsl:param name="space" />
+
+
+		<xsl:call-template name="process-message">
+			<xsl:with-param name="pattern" select="$test"/>
+			<xsl:with-param name="role" select="$role"/>
+		</xsl:call-template>
+		
+		
+	</xsl:template>
+
+	<!-- Default process-report hook: forwards $test (as parameter "pattern") and
+	     $role to process-message. The remaining parameters are declared but
+	     not used by this default implementation. -->
+	<xsl:template name="process-report">
+		<xsl:param name="test"/>
+		<xsl:param name="diagnostics" />
+		<xsl:param name="id" />
+		<xsl:param name="flag" />
+
+           	<!-- "Linkable" parameters -->
+		<xsl:param name="role"/>
+		<xsl:param name="subject"/>
+
+		<!-- "Rich" parameters -->
+		<xsl:param name="fpi" />
+		<xsl:param name="icon" /> 
+		<xsl:param name="lang" />
+		<xsl:param name="see" />
+		<xsl:param name="space" />
+
+		<xsl:call-template name="process-message">
+			<xsl:with-param name="pattern" select="$test"/>
+			<xsl:with-param name="role" select="$role"/>
+		</xsl:call-template>
+	</xsl:template>
+
+	<!-- Default process-diagnostic hook: processes the children of the current
+	     node in mode text, surrounded by a generated single-space text
+	     instruction on each side. The parameters are declared but not used here. -->
+	<xsl:template name="process-diagnostic">
+		<xsl:param name="id" />
+
+		<!-- "Rich" parameters -->
+		<xsl:param name="fpi" />
+		<xsl:param name="icon" />
+		<xsl:param name="lang" />
+		<xsl:param name="see" />
+		<xsl:param name="space" />
+		
+	    <!-- We generate too much whitespace rather than risking concatenation -->
+		<axsl:text> </axsl:text>
+		<xsl:apply-templates mode="text"/>
+		<axsl:text> </axsl:text>
+	</xsl:template>
+
+	<!-- Default process-dir hook: processes the children of the current node in
+	     mode inline-text between two generated single-space text instructions.
+	     The value parameter is declared but not used here. -->
+	<xsl:template name="process-dir">
+      	<xsl:param name="value" />
+
+	    <!-- We generate too much whitespace rather than risking concatenation -->
+		<axsl:text> </axsl:text>
+		<xsl:apply-templates mode="inline-text"/>
+		<axsl:text> </axsl:text>
+	</xsl:template>
+
+	<!-- Default process-emph hook: same output scheme as process-dir, no parameters -->
+	<xsl:template name="process-emph"> 
+	    <!-- We generate too much whitespace rather than risking concatenation -->
+		<axsl:text> </axsl:text>
+		<xsl:apply-templates mode="inline-text"/>
+		<axsl:text> </axsl:text>
+	</xsl:template>
+	
+	<!-- Default process-name hook: generates a value-of instruction whose select
+	     attribute is the string value of $name (an XPath expression supplied by
+	     the caller), between two generated single-space text instructions. -->
+	<xsl:template name="process-name">
+		<xsl:param name="name"/>
+		
+		<!-- We generate too much whitespace rather than risking concatenation -->
+		<axsl:text> </axsl:text>
+		<axsl:value-of select="{$name}"/>
+		<axsl:text> </axsl:text>
+		
+    </xsl:template>
+
+	<!-- The four hooks below (process-ns, process-p, process-pattern and
+	     process-rule) only declare their parameters and produce no output
+	     in this default implementation. -->
+	<xsl:template name="process-ns" >
+	<!-- Note that process-ns is for reporting. The sch:ns elements are 
+	     independently used in the sch:schema template to provide namespace bindings -->
+		<xsl:param name="prefix"/>
+		<xsl:param name="uri" />
+      </xsl:template>
+
+	<xsl:template name="process-p">
+		<xsl:param name="id" />
+		<xsl:param name="class" />
+		<xsl:param name="icon" />
+		<xsl:param name="lang" />
+      </xsl:template>
+
+	<xsl:template name="process-pattern">
+		<xsl:param name="id" />
+		<xsl:param name="name" />
+		<xsl:param name="is-a" />
+
+		<!-- "Rich" parameters -->
+		<xsl:param name="fpi" />
+		<xsl:param name="icon" />
+		<xsl:param name="lang" />
+		<xsl:param name="see" />
+		<xsl:param name="space" />
+      </xsl:template>
+      
+
+	<xsl:template name="process-rule">
+		<xsl:param name="context" />
+
+		<xsl:param name="id" />
+		<xsl:param name="flag" />
+
+           	<!-- "Linkable" parameters -->
+		<xsl:param name="role"/>
+		<xsl:param name="subject"/>
+  
+		<!-- "Rich" parameters -->
+		<xsl:param name="fpi" />
+		<xsl:param name="icon" />
+		<xsl:param name="lang" />
+		<xsl:param name="see" />
+		<xsl:param name="space" />
+      </xsl:template>
+
+	<!-- Default process-span hook: processes the children of the current node in
+	     mode inline-text between two generated single-space text instructions.
+	     The class parameter is declared but not used here. -->
+	<xsl:template name="process-span" >
+		<xsl:param name="class" />
+
+	    <!-- We generate too much whitespace rather than risking concatenation -->
+		<axsl:text> </axsl:text>
+		<xsl:apply-templates mode="inline-text"/>
+		<axsl:text> </axsl:text>		
+	</xsl:template>
+
+	<!-- Default process-title hook: calls process-p with class "title".
+	     NOTE(review): the class parameter declared here is never read, so a value
+	     passed in by a caller is not forwarded to process-p. Confirm whether
+	     that is intended before relying on it. -->
+	<xsl:template name="process-title" >
+		<xsl:param name="class" />
+	   <xsl:call-template name="process-p">
+	      <xsl:with-param  name="class">title</xsl:with-param>
+	   </xsl:call-template>
+	</xsl:template>
+		
+	<!-- Default process-schema-title hook: calls process-title with class
+	     "schema-title"; its own class parameter is declared but not read. -->
+	<xsl:template name="process-schema-title" >
+		<xsl:param name="class" />
+	   <xsl:call-template name="process-title">
+	      <xsl:with-param  name="class">schema-title</xsl:with-param>
+	   </xsl:call-template>
+	</xsl:template>
+
+	<!-- Default process-value-of hook: generates a value-of instruction whose
+	     select attribute is the string value of $select, between two generated
+	     single-space text instructions. -->
+	<xsl:template name="process-value-of">
+		<xsl:param name="select"/>
+		
+	    <!-- We generate too much whitespace rather than risking concatenation -->
+		<axsl:text> </axsl:text>
+		<axsl:value-of select="{$select}"/>
+		<axsl:text> </axsl:text>
+	</xsl:template>
+
+	<!-- default output action: the simplest customization is to just override this -->
+	<!-- Processes the children of the current node in mode text. When
+	     $message-newline is 'true', a value-of instruction producing a newline
+	     is generated after them. The pattern and role parameters are declared
+	     but not used by this default implementation. -->
+	<xsl:template name="process-message">
+		<xsl:param name="pattern" />
+            <xsl:param name="role" />
+
+		<xsl:apply-templates mode="text"/>	
+		 <xsl:if test=" $message-newline = 'true'" >
+			<axsl:value-of  select="string('&#10;')"/>
+		</xsl:if>
+		
+	</xsl:template>
+</xsl:stylesheet>
+
+
+
diff --git a/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_svrl_for_xslt1.xsl b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_svrl_for_xslt1.xsl
new file mode 100644
index 00000000..dae74ff6
--- /dev/null
+++ b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_svrl_for_xslt1.xsl
@@ -0,0 +1,588 @@
+<?xml version="1.0" ?>
+<!-- 
+   ISO_SVRL.xsl   
+
+   Implementation of Schematron Validation Report Language from ISO Schematron
+   ISO/IEC 19757 Document Schema Definition Languages (DSDL) 
+     Part 3: Rule-based validation  Schematron 
+     Annex D: Schematron Validation Report Language 
+
+  This ISO Standard is available free as a Publicly Available Specification in PDF from ISO.
+  Also see www.schematron.com for drafts and other information.
+
+  This implementation of SVRL is designed to run with the "Skeleton" implementation 
+  of Schematron which Oliver Becker devised. The skeleton code provides a 
+  Schematron implementation but with named templates for handling all output; 
+  the skeleton provides basic templates for output using this API, but client
+  validators can be written to import the skeleton and override the default output
+  templates as required. (In order to understand this, you must understand that
+  a named template such as "process-assert" in this XSLT stylesheet overrides and
+  replaces any template with the same name in the imported skeleton XSLT file.)
+
+  The other important thing to understand in this code is that there are different
+  versions of the Schematron skeleton. These track the development of Schematron through
+  Schematron 1.5, Schematron 1.6 and now ISO Schematron. Only one skeleton must be
+  imported. The code has templates for the different skeletons commented out for 
+  convenience. ISO Schematron has a different namespace than Schematron 1.5 and 1.6;
+  so the ISO Schematron skeleton has been written itself with an optional import
+  statement to in turn import the Schematron 1.6 skeleton. This will allow you to 
+  validate with schemas from either namespace.
+  
+
+  History:  
+    2009-03-18
+    	* Fix attribute with space "see " which generates wrong name in some processors
+    2008-08-11
+   		* RJ Fix attribute/@select which saxon allows  in XSLT 1
+   2008-08-07
+    	* RJ Add output-encoding attribute to specify final encoding to use
+    	* Alter allow-foreign functionality so that Schematron span, emph and dir elements make 
+    	  it to the output, for better formatting and because span can be used to mark up
+    	  semantically interesting information embedded in diagnostics, which reduces the
+    	  need to extend SVRL itself
+    	* Diagnostic-reference had an invalid attribute @id that duplicated @diagnostic: removed
+  	2008-08-06
+    	* RJ Fix invalid output:  svrl:diagnostic-reference is not contained in an svrl:text
+    	* Output comment to SVRL file giving filename if available (from command-line parameter)
+  	2008-08-04
+  		* RJ move sch: prefix to schold: prefix to prevent confusion (we want people to
+  		be able to switch from old namespace to new namespace without changing the
+  		sch: prefix, so it is better to keep that prefix completely out of the XSLT)
+  		* Extra signature fixes (PH)
+    2008-08-03
+    	* Repair missing class parameter on process-p
+    2008-07-31
+    	* Update skeleton names
+    2007-04-03 
+    	* Add option generate-fired-rule (RG)
+    2007-02-07
+    	* Prefer true|false for parameters. But allow yes|no on some old ones for compatibility
+    	* DP Diagnostics output to svrl:text. Diagnosis put out after assertion text.
+      	* Removed non-SVRL elements and attributes: better handled as an extra layer that invokes this one
+      	* Add more formal parameters
+      	* Correct confusion between $schemaVersion and $queryBinding
+     	* Indent
+     	* Validate against RNC schemas for XSLT 1 and 2 (with regex tests removed)
+     	* Validate output with UniversalTest.sch against RNC schema for ISO SVRL
+    	
+    2007-02-01
+       	* DP. Update formal parameters of overriding named templates to handle more attributes.
+       	* DP. Refactor handling of rich and linkable parameters to a named template.
+
+    2007-01-22
+    	* DP change svrl:ns to svrl:ns-in-attribute-value
+		* Change default when no queryBinding from "unknown" to "xslt"
+	
+    2007-01-18:
+     	* Improve documentation
+     	* KH Add command-line options to generate paths or not 
+       	* Use axsl:attribute rather than xsl:attribute to shut XSLT2 up
+       	* Add extra command-line options to pass to the iso_schematron_skeleton
+  
+    2006-12-01: iso_svrl.xsl Rick Jelliffe, 
+          * update namespace, 
+          * update phase handling,
+          * add flag param to process-assert and process-report & @ flag on output
+  
+    2001: Conformance1-5.xsl Rick Jelliffe, 
+          * Created, using the skeleton code contributed by Oliver Becker
+-->
+<!--
+ Derived from Conformance1-5.xsl.
+
+ Copyright (c) 2001, 2006 Rick Jelliffe and Academia Sinica Computing Center, Taiwan
+
+ This software is provided 'as-is', without any express or implied warranty. 
+ In no event will the authors be held liable for any damages arising from 
+ the use of this software.
+
+ Permission is granted to anyone to use this software for any purpose, 
+ including commercial applications, and to alter it and redistribute it freely,
+ subject to the following restrictions:
+
+ 1. The origin of this software must not be misrepresented; you must not claim
+ that you wrote the original software. If you use this software in a product, 
+ an acknowledgment in the product documentation would be appreciated but is 
+ not required.
+
+ 2. Altered source versions must be plainly marked as such, and must not be 
+ misrepresented as being the original software.
+
+ 3. This notice may not be removed or altered from any source distribution.
+-->
+
+<!-- Ideas nabbed from schematrons by Francis N., Miloslav N. and David C. -->
+
+<!-- The command-line parameters are:
+  			phase           NMTOKEN | "#ALL" (default) Select the phase for validation
+    		allow-foreign   "true" | "false" (default)   Pass non-Schematron elements  and rich markup  to the generated stylesheet
+            diagnose= true | false|yes|no    Add the diagnostics to the assertion test in reports (yes|no are obsolete)
+            generate-paths=true|false|yes|no   generate the @location attribute with XPaths (yes|no are obsolete)
+            sch.exslt.imports semi-colon delimited string of filenames for some EXSLT implementations          
+   		 optimize        "visit-no-attributes"     Use only when the schema has no attributes as the context nodes
+		 generate-fired-rule "true"(default) | "false"  Generate fired-rule elements
+            
+-->
+
+<xsl:stylesheet
+   version="1.0"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+	xmlns:xs="http://www.w3.org/2001/XMLSchema"
+   xmlns:axsl="http://www.w3.org/1999/XSL/TransformAlias"
+   xmlns:schold="http://www.ascc.net/xml/schematron" 
+   xmlns:iso="http://purl.oclc.org/dsdl/schematron"
+   xmlns:svrl="http://purl.oclc.org/dsdl/svrl" 
+>
+
+<!-- Select the import statement and adjust the path as 
+   necessary for your system.
+   If not XSLT2 then also remove svrl:active-pattern/@document="{document-uri()}" from process-pattern()
+-->
+<!--
+<xsl:import href="iso_schematron_skeleton_for_saxon.xsl"/>
+--> 
+  
+<xsl:import href="iso_schematron_skeleton_for_xslt1.xsl"/>
+ <!--
+<xsl:import href="iso_schematron_skeleton.xsl"/>
+<xsl:import href="skeleton1-5.xsl"/>
+<xsl:import href="skeleton1-6.xsl"/>
+-->
+
+<xsl:param name="diagnose" >true</xsl:param>
+<xsl:param name="phase" >
+	<xsl:choose>
+		<!-- Handle Schematron 1.5 and 1.6 phases -->
+		<xsl:when test="//schold:schema/@defaultPhase">
+			<xsl:value-of select="//schold:schema/@defaultPhase"/>
+		</xsl:when>
+		<!-- Handle ISO Schematron phases -->
+		<xsl:when test="//iso:schema/@defaultPhase">
+			<xsl:value-of select="//iso:schema/@defaultPhase"/>
+		</xsl:when>
+		<xsl:otherwise>#ALL</xsl:otherwise>
+	</xsl:choose>
+</xsl:param>
+<xsl:param name="allow-foreign" >false</xsl:param>
+<xsl:param name="generate-paths" >true</xsl:param>
+<xsl:param name="generate-fired-rule" >true</xsl:param>
+<xsl:param name="optimize"/>
+
+<xsl:param name="output-encoding" ></xsl:param>
+
+<!-- e.g. saxon file.xml file.xsl "sch.exslt.imports=.../string.xsl;.../math.xsl" -->
+<xsl:param name="sch.exslt.imports" />
+
+
+
+<!-- Experimental: if this file is called, then we must be generating SVRL -->
+<xsl:variable name="svrlTest" select="true()" />
+
+  
+ 
+<!-- ================================================================ -->
+
+<xsl:template name="process-prolog">
+	<axsl:output method="xml" omit-xml-declaration="no" standalone="yes"
+		indent="yes">
+		<xsl:if test=" string-length($output-encoding) &gt; 0">
+			<xsl:attribute name="encoding"><xsl:value-of select=" $output-encoding" /></xsl:attribute>
+		</xsl:if>
+    </axsl:output>
+     
+</xsl:template>
+
+<!-- Overrides skeleton.xsl: emits the svrl:schematron-output root element that wraps $contents -->
+<xsl:template name="process-root">
+	<xsl:param name="title"/>
+	<xsl:param name="contents" />
+	<xsl:param name="queryBinding" >xslt1</xsl:param>
+	<xsl:param name="schemaVersion" />
+	<xsl:param name="id" />
+	<xsl:param name="version"/>
+	<!-- "Rich" parameters -->
+	<xsl:param name="fpi" />
+	<xsl:param name="icon" />
+	<xsl:param name="lang" />
+	<xsl:param name="see" />
+	<xsl:param name="space" />
+	
+	<svrl:schematron-output title="{$title}" schemaVersion="{$schemaVersion}" >
+		<xsl:if test=" string-length( normalize-space( $phase )) &gt; 0 and 
+		not( normalize-space( $phase ) = '#ALL') ">
+			<axsl:attribute name="phase">
+				<xsl:value-of select=" $phase " />
+			</axsl:attribute>
+		</xsl:if>
+		<!-- Rich attributes are forwarded to the root only when foreign markup is allowed;
+		     this outer test also gates the xml:lang/xml:space that richParms emits unconditionally. -->
+		  <xsl:if  test=" $allow-foreign = 'true'">
+	
+		<xsl:call-template name='richParms'>
+			<xsl:with-param name="fpi" select="$fpi" />
+			<xsl:with-param name="icon" select="$icon"/>
+			<xsl:with-param name="lang" select="$lang"/>
+			<xsl:with-param name="see"  select="$see" />
+			<xsl:with-param name="space"  select="$space" />
+		</xsl:call-template>
+	</xsl:if>
+		 
+		 <axsl:comment><axsl:value-of select="$archiveDirParameter"/>  &#xA0;
+		 <axsl:value-of select="$archiveNameParameter"/> &#xA0;
+		 <axsl:value-of select="$fileNameParameter"/> &#xA0;
+		 <axsl:value-of select="$fileDirParameter"/></axsl:comment> 
+		 
+		
+		<xsl:apply-templates mode="do-schema-p" />
+		<xsl:copy-of select="$contents" />
+	</svrl:schematron-output>
+</xsl:template>
+
+
+<xsl:template name="process-assert">
+	<xsl:param name="test"/>
+	<xsl:param name="diagnostics" />
+	<xsl:param name="id" />
+	<xsl:param name="flag" />
+	<!-- "Linkable" parameters -->
+	<xsl:param name="role"/>
+	<xsl:param name="subject"/>
+	<!-- "Rich" parameters -->
+	<xsl:param name="fpi" />
+	<xsl:param name="icon" />
+	<xsl:param name="lang" />
+	<xsl:param name="see" />
+	<xsl:param name="space" />
+	<svrl:failed-assert test="{$test}" >
+		<xsl:if test="string-length( $id ) &gt; 0">
+			<axsl:attribute name="id">
+				<xsl:value-of select=" $id " />
+			</axsl:attribute>
+		</xsl:if>
+		<xsl:if test=" string-length( $flag ) &gt; 0">
+			<axsl:attribute name="flag">
+				<xsl:value-of select=" $flag " />
+			</axsl:attribute>
+		</xsl:if>
+		<!-- Process rich attributes.  -->
+		<xsl:call-template name="richParms">
+			<xsl:with-param name="fpi" select="$fpi"/>
+			<xsl:with-param name="icon" select="$icon"/>
+			<xsl:with-param name="lang" select="$lang"/>
+			<xsl:with-param name="see" select="$see" />
+			<xsl:with-param name="space" select="$space" />
+		</xsl:call-template>
+		<xsl:call-template name='linkableParms'>
+			<xsl:with-param name="role" select="$role" />
+			<xsl:with-param name="subject" select="$subject"/>
+		</xsl:call-template>
+		<xsl:if test=" $generate-paths = 'true' or $generate-paths= 'yes' ">
+			<!-- true/false is the new way -->
+			<axsl:attribute name="location">
+				<axsl:apply-templates select="." mode="schematron-get-full-path"/>
+			</axsl:attribute>
+		</xsl:if>
+		  
+		<svrl:text>
+			<xsl:apply-templates mode="text" />
+	
+		</svrl:text>
+		    <xsl:if test="$diagnose = 'yes' or $diagnose= 'true' ">
+			<!-- true/false is the new way -->
+				<xsl:call-template name="diagnosticsSplit">
+					<xsl:with-param name="str" select="$diagnostics"/>
+				</xsl:call-template>
+			</xsl:if>
+	</svrl:failed-assert>
+</xsl:template>
+
+<xsl:template name="process-report">
+	<xsl:param name="id"/>
+	<xsl:param name="test"/>
+	<xsl:param name="diagnostics"/>
+	<xsl:param name="flag" />
+	<!-- "Linkable" parameters -->
+	<xsl:param name="role"/>
+	<xsl:param name="subject"/>
+	<!-- "Rich" parameters -->
+	<xsl:param name="fpi" />
+	<xsl:param name="icon" />
+	<xsl:param name="lang" />
+	<xsl:param name="see" />
+	<xsl:param name="space" />
+	<svrl:successful-report test="{$test}" >
+		<xsl:if test=" string-length( $id ) &gt; 0">
+			<axsl:attribute name="id">
+				<xsl:value-of select=" $id " />
+			</axsl:attribute>
+		</xsl:if>
+		<xsl:if test=" string-length( $flag ) &gt; 0">
+			<axsl:attribute name="flag">
+				<xsl:value-of select=" $flag " />
+			</axsl:attribute>
+		</xsl:if>
+		
+		<!-- Process rich attributes.  -->
+		<xsl:call-template name="richParms">
+			<xsl:with-param name="fpi" select="$fpi"/>
+			<xsl:with-param name="icon" select="$icon"/>
+			<xsl:with-param name="lang" select="$lang"/>
+			<xsl:with-param name="see" select="$see" />
+			<xsl:with-param name="space" select="$space" />
+		</xsl:call-template>
+		<xsl:call-template name='linkableParms'>
+			<xsl:with-param name="role" select="$role" />
+			<xsl:with-param name="subject" select="$subject"/>
+		</xsl:call-template>
+		<xsl:if test=" $generate-paths = 'yes' or $generate-paths = 'true' ">
+			<!-- true/false is the new way -->
+			<axsl:attribute name="location">
+				<axsl:apply-templates select="." mode="schematron-get-full-path"/>
+			</axsl:attribute>
+		</xsl:if>
+	 
+		<svrl:text>
+			<xsl:apply-templates mode="text" />
+
+		</svrl:text>
+			<xsl:if test="$diagnose = 'yes' or $diagnose='true' ">
+			<!-- true/false is the new way -->
+				<xsl:call-template name="diagnosticsSplit">
+					<xsl:with-param name="str" select="$diagnostics"/>
+				</xsl:call-template>
+			</xsl:if>
+	</svrl:successful-report>
+</xsl:template>
+
+
+    <!-- Overrides skeleton -->
+	<xsl:template name="process-dir" >
+		<xsl:param name="value" />
+        <xsl:choose>
+        	<xsl:when test=" $allow-foreign = 'true'">
+        		<xsl:copy-of select="."/>
+        	</xsl:when>
+       
+        <xsl:otherwise>
+	    <!-- We generate too much whitespace rather than risking concatenation -->
+		<axsl:text> </axsl:text>
+		<xsl:apply-templates mode="inline-text"/>
+		<axsl:text> </axsl:text>
+		</xsl:otherwise>
+		 </xsl:choose>		
+	</xsl:template>
+
+<xsl:template name="process-diagnostic">
+	<xsl:param name="id"/>
+	<!-- Rich parameters -->
+	<xsl:param name="fpi" />
+	<xsl:param name="icon" />
+	<xsl:param name="lang" />
+	<xsl:param name="see" />
+	<xsl:param name="space" />
+	<svrl:diagnostic-reference diagnostic="{$id}" >
+	  
+		<xsl:call-template name="richParms">
+			<xsl:with-param name="fpi" select="$fpi"/>
+			<xsl:with-param name="icon" select="$icon"/>
+			<xsl:with-param name="lang" select="$lang"/>
+			<xsl:with-param name="see" select="$see" />
+			<xsl:with-param name="space" select="$space" />
+		</xsl:call-template> 
+<xsl:text>
+</xsl:text>
+ 
+		<xsl:apply-templates mode="text"/>
+		 
+	</svrl:diagnostic-reference>
+</xsl:template>
+
+
+    <!-- Overrides skeleton -->
+	<xsl:template name="process-emph" >
+		<xsl:param name="class" />
+        <xsl:choose>
+        	<xsl:when test=" $allow-foreign = 'true'">
+        		<xsl:copy-of select="."/>
+        	</xsl:when> 
+        <xsl:otherwise>
+	    <!-- We generate too much whitespace rather than risking concatenation -->
+		<axsl:text> </axsl:text>
+		<xsl:apply-templates mode="inline-text"/>
+		<axsl:text> </axsl:text>
+		</xsl:otherwise>
+	 	</xsl:choose>	
+	</xsl:template>
+
+<xsl:template name="process-rule">
+	<xsl:param name="id"/>
+	<xsl:param name="context"/>
+	<xsl:param name="flag"/>
+	<!-- "Linkable" parameters -->
+	<xsl:param name="role"/>
+	<xsl:param name="subject"/>
+	<!-- "Rich" parameters -->
+	<xsl:param name="fpi" />
+	<xsl:param name="icon" />
+	<xsl:param name="lang" />
+	<xsl:param name="see" />
+	<xsl:param name="space" />
+	<xsl:if test=" $generate-fired-rule = 'true'">
+	<svrl:fired-rule context="{$context}" >
+		<!-- Rich attributes first. richParms emits axsl:attribute children, so id/role below must also be axsl:attribute: an xsl:attribute added after children is an XSLT 1.0 error and may be dropped. -->
+		<xsl:call-template name="richParms">
+			<xsl:with-param name="fpi" select="$fpi"/>
+			<xsl:with-param name="icon" select="$icon"/>
+			<xsl:with-param name="lang" select="$lang"/>
+			<xsl:with-param name="see" select="$see" />
+			<xsl:with-param name="space" select="$space" />
+		</xsl:call-template>
+		<xsl:if test=" string( $id )">
+			<axsl:attribute name="id">
+				<xsl:value-of select=" $id " />
+			</axsl:attribute>
+		</xsl:if>
+		<xsl:if test=" string-length( $role ) &gt; 0">
+			<axsl:attribute name="role">
+				<xsl:value-of select=" $role " />
+			</axsl:attribute>
+		</xsl:if> 
+	</svrl:fired-rule>
+</xsl:if>
+</xsl:template>
+
+<xsl:template name="process-ns">
+	<xsl:param name="prefix"/>
+	<xsl:param name="uri"/>
+	<svrl:ns-prefix-in-attribute-values uri="{$uri}" prefix="{$prefix}" />
+</xsl:template>
+
+<xsl:template name="process-p"> 
+	<xsl:param name="icon"/>
+	<xsl:param name="class"/>
+	<xsl:param name="id"/>
+	<xsl:param name="lang"/>
+	 
+	<svrl:text> 
+		<xsl:apply-templates mode="text"/>
+	</svrl:text>
+</xsl:template>
+
+<xsl:template name="process-pattern">
+	<xsl:param name="name"/>
+	<xsl:param name="id"/>
+	<xsl:param name="is-a"/>
+	
+	<!-- "Rich" parameters -->
+	<xsl:param name="fpi" />
+	<xsl:param name="icon" />
+	<xsl:param name="lang" />
+	<xsl:param name="see" />
+	<xsl:param name="space" />
+	<svrl:active-pattern > 
+		<xsl:if test=" string( $id )">
+			<axsl:attribute name="id">
+				<xsl:value-of select=" $id " />
+			</axsl:attribute>
+		</xsl:if>
+		<xsl:if test=" string( $name )">
+			<axsl:attribute name="name">
+				<xsl:value-of select=" $name " />
+			</axsl:attribute>
+		</xsl:if> 
+		 
+		<xsl:call-template name='richParms'>
+			<xsl:with-param name="fpi" select="$fpi"/>
+			<xsl:with-param name="icon" select="$icon"/>
+			<xsl:with-param name="lang" select="$lang"/>
+			<xsl:with-param name="see" select="$see" />
+			<xsl:with-param name="space" select="$space" />
+		</xsl:call-template>
+		
+		<!-- ?? report that this screws up iso:title processing  -->
+		<xsl:apply-templates mode="do-pattern-p"/>
+		<!-- ?? Seems that this apply-templates is never triggered DP -->
+		<axsl:apply-templates />
+	</svrl:active-pattern>
+</xsl:template>
+
+<!-- Overrides skeleton -->
+<xsl:template name="process-message" > 
+	<xsl:param name="pattern"/>
+	<xsl:param name="role"/>
+</xsl:template>
+
+
+    <!-- Overrides skeleton -->
+	<xsl:template name="process-span" >
+		<xsl:param name="class" />
+        <xsl:choose>
+        	<xsl:when test=" $allow-foreign = 'true'">
+        		<xsl:copy-of select="."/>
+        	</xsl:when> 
+        <xsl:otherwise>
+	    <!-- We generate too much whitespace rather than risking concatenation -->
+		<axsl:text> </axsl:text>
+		<xsl:apply-templates mode="inline-text"/>
+		<axsl:text> </axsl:text>
+		</xsl:otherwise>
+	 	</xsl:choose>	
+	</xsl:template>
+
+<!-- =========================================================================== -->
+<!-- processing rich parameters. -->
+<xsl:template name='richParms'>
+	<!-- "Rich" parameters -->
+	<xsl:param name="fpi" />
+	<xsl:param name="icon" />
+	<xsl:param name="lang" />
+	<xsl:param name="see" />
+	<xsl:param name="space" />
+	<!-- Process rich attributes.  -->
+	<xsl:if  test=" $allow-foreign = 'true'">
+	<xsl:if test="string($fpi)"> 
+		<axsl:attribute name="fpi">
+			<xsl:value-of select="$fpi"/>
+		</axsl:attribute>
+	</xsl:if>
+	<xsl:if test="string($icon)"> 
+		<axsl:attribute name="icon">
+			<xsl:value-of select="$icon"/>
+		</axsl:attribute>
+	</xsl:if>
+	<xsl:if test="string($see)"> 
+		<axsl:attribute name="see">
+			<xsl:value-of select="$see"/>
+		</axsl:attribute>
+	</xsl:if>
+	</xsl:if>
+	<xsl:if test="string($space)">
+		<axsl:attribute name="xml:space">
+			<xsl:value-of select="$space"/>
+		</axsl:attribute>
+	</xsl:if>
+	<xsl:if test="string($lang)">
+		<axsl:attribute name="xml:lang">
+			<xsl:value-of select="$lang"/>
+		</axsl:attribute>
+	</xsl:if>
+</xsl:template>
+
+<!-- processing linkable parameters. -->
+<xsl:template name='linkableParms'>
+	<xsl:param name="role"/>
+	<xsl:param name="subject"/>
+	
+	<!-- ISO SVRL has a role attribute to match the Schematron role attribute -->
+	<xsl:if test=" string($role )">
+		<axsl:attribute name="role">
+			<xsl:value-of select=" $role " />
+		</axsl:attribute>
+	</xsl:if>
+	<!-- ISO SVRL does not have a subject attribute to match the Schematron subject attribute.
+       Instead, the Schematron subject attribute is folded into the location attribute -->
+</xsl:template>
+   
+
+</xsl:stylesheet>
+
diff --git a/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/readme.txt b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/readme.txt
new file mode 100644
index 00000000..d9f68c5a
--- /dev/null
+++ b/lib/lxml/isoschematron/resources/xsl/iso-schematron-xslt1/readme.txt
@@ -0,0 +1,83 @@
+ISO SCHEMATRON 2009
+
+XSLT implementation by Rick Jelliffe with assistance from members of the Schematron-love-in mailing list.
+
+2009-03-18
+
+Two distributions are available. One is for XSLT1 engines. 
+The other is for XSLT2 engines, such as SAXON 9.
+
+
+This version of Schematron splits the process into a pipeline of several different XSLT stages.
+
+1) First, preprocess your Schematron schema with iso_dsdl_include.xsl.  
+This is a macro processor to assemble the schema from various parts. 
+If your schema is not in separate parts, you can skip this stage.
+
+2) Second, preprocess the output from stage 1 with iso_abstract_expand.xsl.  
+This is a macro processor to convert abstract patterns to real patterns. 
+If your schema does not use abstract patterns, you can skip this
+stage.
+
+3) Third, compile the Schematron schema into an XSLT script. 
+This will typically use iso_svrl_for_xslt1.xsl or iso_svrl_for_xslt2.xsl 
+(which in turn invoke iso_schematron_skeleton_for_xslt1.xsl or iso_schematron_skeleton_for_saxon.xsl)
+However, other "meta-stylesheets" are also in common use; the principle of operation is the same.
+If your schema uses Schematron phases, supply these as command line/invocation parameters
+to this process.
+
+4) Fourth, run the script generated by stage 3 against the document being validated.
+If you are using the SVRL script, then the output of validation will be an XML document.
+If your schema uses Schematron parameters, supply these as command line/invocation parameters
+to this process. 
+
+
+The XSLT2 distribution also features several next generation features, 
+such as validating multiple documents. See the source code for details.
+
+Schematron assertions can be written in any language, of course; the file
+sch-messages-en.xhtml contains the diagnostics messages from the XSLT2 skeleton
+in English, and this can be used as template to localize the skeleton's
+error messages. Note that programming errors in Schematron are typically XPath
+errors, which require localized messages from the XSLT engine.
+
+ANT
+---
+To give an example of how to process a document, here is a sample ANT task.
+
+<target  name="schematron-compile-test" >
+
+	   <!-- expand inclusions -->
+	   <xslt basedir="test/schematron"
+	   		style="iso_dsdl_include.xsl" in="test.sch"  out="test1.sch"> 
+	   				<classpath>
+	   					<pathelement location="${lib.dir}/saxon9.jar"/>
+	   				</classpath>
+	   </xslt>
+
+	   <!-- expand abstract patterns -->
+	   <xslt basedir="test/schematron"
+	   		style="iso_abstract_expand.xsl" in="test1.sch"  out="test2.sch"> 
+	   				<classpath>
+	   					<pathelement location="${lib.dir}/saxon9.jar"/>
+	   				</classpath>
+	   </xslt>
+
+
+
+	   <!-- compile it -->
+	   <xslt basedir="test/schematron"
+	   		style="iso_svrl_for_xslt2.xsl" in="test2.sch"  out="test.xsl"> 
+	   				<classpath>
+	   					<pathelement location="${lib.dir}/saxon9.jar"/>
+	   				</classpath>
+	   </xslt>
+	   
+	   <!-- validate -->
+	   <xslt basedir="test/schematron"
+		   		style="test.xsl" in="instance.xml"  out="instance.svrlt"> 
+		   				<classpath>
+		   					<pathelement location="${lib.dir}/saxon9.jar"/>
+		   				</classpath>
+	</xslt>
+		</target>
\ No newline at end of file
diff --git a/lib/lxml/iterparse.pxi b/lib/lxml/iterparse.pxi
new file mode 100644
index 00000000..13b94495
--- /dev/null
+++ b/lib/lxml/iterparse.pxi
@@ -0,0 +1,357 @@
+# iterparse -- event-driven parsing
+
+DEF __ITERPARSE_CHUNK_SIZE = 32768
+
+cdef class iterparse:
+    u"""iterparse(self, source, events=("end",), tag=None, \
+                  attribute_defaults=False, dtd_validation=False, \
+                  load_dtd=False, no_network=True, remove_blank_text=False, \
+                  remove_comments=False, remove_pis=False, encoding=None, \
+                  html=False, recover=None, huge_tree=False, schema=None)
+
+    Incremental parser.
+
+    Parses XML into a tree and generates tuples (event, element) in a
+    SAX-like fashion. ``event`` is any of 'start', 'end', 'start-ns',
+    'end-ns'.
+
+    For 'start' and 'end', ``element`` is the Element that the parser just
+    found opening or closing.  For 'start-ns', it is a tuple (prefix, URI) of
+    a new namespace declaration.  For 'end-ns', it is simply None.  Note that
+    all start and end events are guaranteed to be properly nested.
+
+    The keyword argument ``events`` specifies a sequence of event type names
+    that should be generated.  By default, only 'end' events will be
+    generated.
+
+    The additional ``tag`` argument restricts the 'start' and 'end' events to
+    those elements that match the given tag.  By default, events are generated
+    for all elements.  Note that the 'start-ns' and 'end-ns' events are not
+    impacted by this restriction.
+
+    The other keyword arguments in the constructor are mainly based on the
+    libxml2 parser configuration.  A DTD will also be loaded if validation or
+    attribute default values are requested.
+
+    Available boolean keyword arguments:
+     - attribute_defaults: read default attributes from DTD
+     - dtd_validation: validate (if DTD is available)
+     - load_dtd: use DTD for parsing
+     - no_network: prevent network access for related files
+     - remove_blank_text: discard blank text nodes
+     - remove_comments: discard comments
+     - remove_pis: discard processing instructions
+     - strip_cdata: replace CDATA sections by normal text content (default: True)
+     - compact: save memory for short text content (default: True)
+     - resolve_entities: replace entities by their text value (default: True)
+     - huge_tree: disable security restrictions and support very deep trees
+                  and very long text content (only affects libxml2 2.7+)
+     - html: parse input as HTML (default: XML)
+     - recover: try hard to parse through broken input (default: True for HTML,
+                False otherwise)
+
+    Other keyword arguments:
+     - encoding: override the document encoding
+     - schema: an XMLSchema to validate against
+    """
+    cdef _FeedParser _parser
+    cdef object _tag
+    cdef object _events
+    cdef readonly object root
+    cdef object _source
+    cdef object _filename
+    cdef object _error
+    cdef bint _close_source_after_read
+
+    def __init__(self, source, events=(u"end",), *, tag=None,
+                 attribute_defaults=False, dtd_validation=False,
+                 load_dtd=False, no_network=True, remove_blank_text=False,
+                 compact=True, resolve_entities=True, remove_comments=False,
+                 remove_pis=False, strip_cdata=True, encoding=None,
+                 html=False, recover=None, huge_tree=False,
+                 XMLSchema schema=None):
+        if not hasattr(source, 'read'):
+            self._filename = source
+            if not python.IS_PYTHON3:
+                source = _encodeFilename(source)
+            source = open(source, 'rb')
+            self._close_source_after_read = True
+        else:
+            self._filename = _getFilenameForFile(source)
+            self._close_source_after_read = False
+
+        if recover is None:
+            recover = html
+
+        if html:
+            # make sure we're not looking for namespaces
+            events = [event for event in events
+                      if event not in ('start-ns', 'end-ns')]
+            parser = HTMLPullParser(
+                events,
+                tag=tag,
+                recover=recover,
+                base_url=self._filename,
+                encoding=encoding,
+                remove_blank_text=remove_blank_text,
+                remove_comments=remove_comments,
+                remove_pis=remove_pis,
+                strip_cdata=strip_cdata,
+                no_network=no_network,
+                target=None,  # TODO
+                schema=schema,
+                compact=compact)
+        else:
+            parser = XMLPullParser(
+                events,
+                tag=tag,
+                recover=recover,
+                base_url=self._filename,
+                encoding=encoding,
+                attribute_defaults=attribute_defaults,
+                dtd_validation=dtd_validation,
+                load_dtd=load_dtd,
+                no_network=no_network,
+                schema=schema,
+                huge_tree=huge_tree,
+                remove_blank_text=remove_blank_text,
+                resolve_entities=resolve_entities,
+                remove_comments=remove_comments,
+                remove_pis=remove_pis,
+                strip_cdata=strip_cdata,
+                target=None,  # TODO
+                compact=compact)
+
+        self._events = parser.read_events()
+        self._parser = parser
+        self._source = source
+
+    property error_log:
+        u"""The error log of the last (or current) parser run.
+        """
+        def __get__(self):
+            return self._parser.feed_error_log
+
+    property resolvers:
+        u"""The custom resolver registry of the last (or current) parser run.
+        """
+        def __get__(self):
+            return self._parser.resolvers
+
+    property version:
+        u"""The version of the underlying XML parser."""
+        def __get__(self):
+            return self._parser.version
+
+    def set_element_class_lookup(self, ElementClassLookup lookup = None):
+        u"""set_element_class_lookup(self, lookup = None)
+
+        Set a lookup scheme for element classes generated from this parser.
+
+        Reset it by passing None or nothing.
+        """
+        self._parser.set_element_class_lookup(lookup)
+
+    def makeelement(self, _tag, attrib=None, nsmap=None, **_extra):
+        u"""makeelement(self, _tag, attrib=None, nsmap=None, **_extra)
+
+        Creates and returns a new element associated with this parser.
+        """
+        return self._parser.makeelement(
+            _tag, attrib=attrib, nsmap=nsmap, **_extra)
+
+    @cython.final
+    cdef _close_source(self):
+        if self._source is None:
+            return
+        if not self._close_source_after_read:
+            self._source = None
+            return
+        try:
+            close = self._source.close
+        except AttributeError:
+            close = None
+        finally:
+            self._source = None
+        if close is not None:
+            close()
+
+    def __iter__(self):
+        return self
+
+    def __next__(self):  # return the next parse event, reading more input if needed
+        try:
+            return next(self._events)  # serve events that are already queued
+        except StopIteration:
+            pass
+        context = <_SaxParserContext>self._parser._getPushParserContext()
+        if self._source is not None:  # _close_source() resets it to None
+            done = False
+            while not done:
+                try:
+                    done = self._read_more_events(context)
+                    return next(self._events)
+                except StopIteration:
+                    pass  # no events yet
+                except Exception, e:
+                    self._error = e  # raised below, once the queued events are drained
+                    self._close_source()
+                    try:
+                        return next(self._events)
+                    except StopIteration:
+                        break
+        # nothing left to read or return
+        if self._error is not None:
+            error = self._error
+            self._error = None  # a stored error is raised only once
+            raise error
+        if (context._validator is not None
+                and not context._validator.isvalid()):
+            _raiseParseError(context._c_ctxt, self._filename,
+                             context._error_log)
+        # no errors => all done
+        raise StopIteration
+
+    @cython.final
+    cdef bint _read_more_events(self, _SaxParserContext context) except -123:
+        chunk = self._source.read(__ITERPARSE_CHUNK_SIZE)
+        if not isinstance(chunk, bytes):
+            self._close_source()
+            raise TypeError("reading file objects must return bytes objects")
+        if chunk:
+            self._parser.feed(chunk)
+            return False  # not at the end of the input yet
+        try:  # empty read => end of input: finish parsing, then release the source
+            self.root = self._parser.close()
+        finally:
+            self._close_source()
+        return True
+
+
+cdef class iterwalk:
+    u"""iterwalk(self, element_or_tree, events=("end",), tag=None)
+
+    A tree walker that generates events from an existing tree as if it
+    was parsing XML data with ``iterparse()``.
+    """
+    cdef _MultiTagMatcher _matcher  # tag filter, None if every tag matches
+    cdef list   _node_stack  # (element, ns_count) pairs from the root to the current node
+    cdef int    _index  # index of the current node in _node_stack, -1 when done
+    cdef list   _events  # generated events that were not returned yet
+    cdef object _pop_event  # bound ``_events.pop``
+    cdef int    _event_filter  # bit mask built from the requested event names
+
+    def __init__(self, element_or_tree, events=(u"end",), tag=None):
+        cdef _Element root
+        cdef int ns_count
+        root = _rootNodeOrRaise(element_or_tree)
+        self._event_filter = _buildParseEventFilter(events)
+        if tag is None or tag == '*':
+            self._matcher = None  # no tag filtering
+        else:
+            self._matcher = _MultiTagMatcher(tag)
+        self._node_stack  = []
+        self._events = []
+        self._pop_event = self._events.pop
+
+        if self._event_filter:
+            self._index = 0
+            ns_count = self._start_node(root)  # queues the start events of the root
+            self._node_stack.append( (root, ns_count) )
+        else:
+            self._index = -1  # no events requested => nothing to iterate over
+
+    def __iter__(self):
+        return self
+
+    def __next__(self):
+        cdef xmlNode* c_child
+        cdef _Element node
+        cdef _Element next_node
+        cdef int ns_count = 0
+        if self._events:
+            return self._pop_event(0)  # oldest pending event first
+        if self._matcher is not None and self._index >= 0:
+            node = self._node_stack[self._index][0]
+            self._matcher.cacheTags(node._doc)
+
+        # find next node
+        while self._index >= 0:
+            node = self._node_stack[self._index][0]
+
+            c_child = _findChildForwards(node._c_node, 0)
+            if c_child is not NULL:
+                # try children
+                next_node = _elementFactory(node._doc, c_child)
+            else:
+                # back off
+                next_node = None
+                while next_node is None:
+                    # back off through parents
+                    self._index -= 1
+                    node = self._end_node()  # pops the node and queues its end events
+                    if self._index < 0:
+                        break  # the root was popped => the walk is complete
+                    next_node = node.getnext()
+            if next_node is not None:
+                if self._event_filter & (PARSE_EVENT_FILTER_START |
+                                         PARSE_EVENT_FILTER_START_NS):
+                    ns_count = self._start_node(next_node)
+                elif self._event_filter & PARSE_EVENT_FILTER_END_NS:
+                    ns_count = _countNsDefs(next_node._c_node)
+                self._node_stack.append( (next_node, ns_count) )
+                self._index += 1
+            if self._events:
+                return self._pop_event(0)
+        raise StopIteration
+
+    cdef int _start_node(self, _Element node) except -1:  # returns the ns declaration count
+        cdef int ns_count
+        if self._event_filter & PARSE_EVENT_FILTER_START_NS:
+            ns_count = _appendStartNsEvents(node._c_node, self._events)
+        elif self._event_filter & PARSE_EVENT_FILTER_END_NS:
+            ns_count = _countNsDefs(node._c_node)  # needed later for the "end-ns" events
+        else:
+            ns_count = 0
+        if self._event_filter & PARSE_EVENT_FILTER_START:
+            if self._matcher is None or self._matcher.matches(node._c_node):
+                self._events.append( (u"start", node) )
+        return ns_count
+
+    cdef _Element _end_node(self):  # pops the top of the stack and returns its element
+        cdef _Element node
+        cdef int i, ns_count
+        node, ns_count = self._node_stack.pop()
+        if self._event_filter & PARSE_EVENT_FILTER_END:
+            if self._matcher is None or self._matcher.matches(node._c_node):
+                self._events.append( (u"end", node) )
+        if self._event_filter & PARSE_EVENT_FILTER_END_NS:
+            event = (u"end-ns", None)
+            for i from 0 <= i < ns_count:  # one "end-ns" per declaration of the node
+                self._events.append(event)
+        return node
+
+
+cdef int _countNsDefs(xmlNode* c_node):
+    # Return the number of namespace declarations attached to ``c_node``
+    # by walking its ``nsDef`` linked list.
+    cdef int n_defs = 0
+    cdef xmlNs* c_nsdef = c_node.nsDef
+    while c_nsdef is not NULL:
+        n_defs += 1
+        c_nsdef = c_nsdef.next
+    return n_defs
+
+
+cdef int _appendStartNsEvents(xmlNode* c_node, list event_list) except -1:
+    # Append one (u"start-ns", (prefix, href)) event per namespace declaration
+    # of ``c_node`` to ``event_list`` and return how many were appended.
+    cdef int n_events = 0
+    cdef xmlNs* c_nsdef = c_node.nsDef
+    while c_nsdef is not NULL:
+        # a declaration without a prefix (NULL) is reported with prefix ''
+        prefix = '' if c_nsdef.prefix is NULL else funicode(c_nsdef.prefix)
+        event_list.append( (u"start-ns", (prefix, funicode(c_nsdef.href))) )
+        n_events += 1
+        c_nsdef = c_nsdef.next
+    return n_events
diff --git a/lib/lxml/lxml.etree.pyx b/lib/lxml/lxml.etree.pyx
new file mode 100644
index 00000000..6e75eeab
--- /dev/null
+++ b/lib/lxml/lxml.etree.pyx
@@ -0,0 +1,3332 @@
+u"""The ``lxml.etree`` module implements the extended ElementTree API
+for XML.
+"""
+
+from __future__ import absolute_import
+
+__docformat__ = u"restructuredtext en"
+
+__all__ = [
+    'AttributeBasedElementClassLookup', 'C14NError', 'CDATA',
+    'Comment', 'CommentBase', 'CustomElementClassLookup', 'DEBUG',
+    'DTD', 'DTDError', 'DTDParseError', 'DTDValidateError',
+    'DocumentInvalid', 'ETCompatXMLParser', 'ETXPath', 'Element',
+    'ElementBase', 'ElementClassLookup', 'ElementDefaultClassLookup',
+    'ElementNamespaceClassLookup', 'ElementTree', 'Entity', 'EntityBase',
+    'Error', 'ErrorDomains', 'ErrorLevels', 'ErrorTypes', 'Extension',
+    'FallbackElementClassLookup', 'FunctionNamespace', 'HTML',
+    'HTMLParser', 'LIBXML_COMPILED_VERSION', 'LIBXML_VERSION',
+    'LIBXSLT_COMPILED_VERSION', 'LIBXSLT_VERSION', 'LXML_VERSION',
+    'LxmlError', 'LxmlRegistryError', 'LxmlSyntaxError',
+    'NamespaceRegistryError', 'PI', 'PIBase', 'ParseError',
+    'ParserBasedElementClassLookup', 'ParserError', 'ProcessingInstruction',
+    'PyErrorLog', 'PythonElementClassLookup', 'QName', 'RelaxNG',
+    'RelaxNGError', 'RelaxNGErrorTypes', 'RelaxNGParseError',
+    'RelaxNGValidateError', 'Resolver', 'Schematron', 'SchematronError',
+    'SchematronParseError', 'SchematronValidateError', 'SerialisationError',
+    'SubElement', 'TreeBuilder', 'XInclude', 'XIncludeError', 'XML',
+    'XMLDTDID', 'XMLID', 'XMLParser', 'XMLSchema', 'XMLSchemaError',
+    'XMLSchemaParseError', 'XMLSchemaValidateError', 'XMLSyntaxError',
+    'XMLTreeBuilder', 'XPath', 'XPathDocumentEvaluator', 'XPathError',
+    'XPathEvalError', 'XPathEvaluator', 'XPathFunctionError', 'XPathResultError',
+    'XPathSyntaxError', 'XSLT', 'XSLTAccessControl', 'XSLTApplyError',
+    'XSLTError', 'XSLTExtension', 'XSLTExtensionError', 'XSLTParseError',
+    'XSLTSaveError', 'cleanup_namespaces', 'clear_error_log', 'dump',
+    'fromstring', 'fromstringlist', 'get_default_parser', 'iselement',
+    'iterparse', 'iterwalk', 'parse', 'parseid', 'register_namespace',
+    'set_default_parser', 'set_element_class_lookup', 'strip_attributes',
+    'strip_elements', 'strip_tags', 'tostring', 'tostringlist', 'tounicode',
+    'use_global_python_log'
+    ]
+
+cimport cython
+
+from lxml cimport python
+from lxml.includes cimport tree, config
+from lxml.includes.tree cimport xmlDoc, xmlNode, xmlAttr, xmlNs, _isElement, _getNs
+from lxml.includes.tree cimport const_xmlChar, xmlChar, _xcstr
+from lxml.python cimport _cstr, _isString
+from lxml.includes cimport xpath
+from lxml.includes cimport c14n
+
+# Cython's standard declarations
+cimport cpython.mem
+cimport cpython.ref
+from libc cimport limits, stdio, stdlib
+from libc cimport string as cstring_h   # not to be confused with stdlib 'string'
+from libc.string cimport const_char
+
+try:
+    import __builtin__
+except ImportError:
+    # Python 3
+    import builtins as __builtin__
+
+cdef object _unicode
+try:
+    _unicode = __builtin__.unicode
+except AttributeError:
+    # Python 3
+    _unicode = __builtin__.str
+
+del __builtin__
+
+cdef object os_path_abspath
+from os.path import abspath as os_path_abspath
+
+cdef object BytesIO, StringIO
+try:
+    from io import BytesIO, StringIO
+except (ImportError, AttributeError):
+    from StringIO import StringIO, StringIO as BytesIO
+
+cdef object _elementpath
+from lxml import _elementpath
+
+cdef object sys
+import sys
+
+cdef object re
+import re
+
+cdef object islice
+from itertools import islice
+
+cdef object ITER_EMPTY = iter(())
+
+try:
+    from collections.abc import MutableMapping  # Py3.3+
+except ImportError:
+    from collections import MutableMapping  # Py2.6+
+
+class _ImmutableMapping(MutableMapping):  # always empty, every access by key fails
+    def __len__(self):
+        return 0
+
+    def __contains__(self, key):
+        return False
+
+    def __iter__(self):
+        return ITER_EMPTY
+    iterkeys = itervalues = iteritems = __iter__
+
+    def __getitem__(self, key):
+        raise KeyError, key
+
+    def __setitem__(self, key, value):
+        raise KeyError, key
+
+    def __delitem__(self, key):
+        raise KeyError, key
+
+cdef object IMMUTABLE_EMPTY_MAPPING = _ImmutableMapping()
+del MutableMapping, _ImmutableMapping
+
+
+# the rules
+# ---------
+# any libxml C argument/variable is prefixed with c_
+# any non-public function/class is prefixed with an underscore
+# instance creation is always through factories
+
+# what to do with libxml2/libxslt error messages?
+# 0 : drop
+# 1 : use log
+DEF __DEBUG = 1
+
+# maximum number of lines in the libxml2/xslt log if __DEBUG == 1
+DEF __MAX_LOG_SIZE = 100
+
+# make the compiled-in debug state publicly available
+DEBUG = __DEBUG
+
+# A struct to store a cached qualified tag name+href pair.
+# While we can borrow the c_name from the document dict,
+# PyPy requires us to store a Python reference for the
+# namespace in order to keep the byte buffer alive.
+cdef struct qname:
+    const_xmlChar* c_name
+    python.PyObject* href
+
+# global per-thread setup
+tree.xmlThrDefIndentTreeOutput(1)
+tree.xmlThrDefLineNumbersDefaultValue(1)
+
+_initThreadLogging()
+
+# initialize parser (and threading)
+xmlparser.xmlInitParser()
+
+# filename encoding
+cdef bytes _FILENAME_ENCODING = (sys.getfilesystemencoding() or sys.getdefaultencoding() or 'ascii').encode(u"UTF-8")
+cdef char* _C_FILENAME_ENCODING = _cstr(_FILENAME_ENCODING)
+
+# set up some default namespace prefixes
+cdef dict _DEFAULT_NAMESPACE_PREFIXES = {
+    b"http://www.w3.org/XML/1998/namespace": b'xml',
+    b"http://www.w3.org/1999/xhtml": b"html",
+    b"http://www.w3.org/1999/XSL/Transform": b"xsl",
+    b"http://www.w3.org/1999/02/22-rdf-syntax-ns#": b"rdf",
+    b"http://schemas.xmlsoap.org/wsdl/": b"wsdl",
+    # xml schema
+    b"http://www.w3.org/2001/XMLSchema": b"xs",
+    b"http://www.w3.org/2001/XMLSchema-instance": b"xsi",
+    # dublin core
+    b"http://purl.org/dc/elements/1.1/": b"dc",
+    # objectify
+    b"http://codespeak.net/lxml/objectify/pytype" : b"py",
+}
+
+cdef object _check_internal_prefix = re.compile(b"ns\d+$").match
+
+def register_namespace(prefix, uri):
+    u"""Register ``prefix`` as the prefix that newly created Elements in
+    the namespace ``uri`` will use.  The registry is global; any existing
+    mapping of either the given prefix or the namespace URI is removed.
+    """
+    utf_prefix, utf_uri = _utf8(prefix), _utf8(uri)
+    if _check_internal_prefix(utf_prefix):
+        raise ValueError("Prefix format reserved for internal use")
+    _tagValidOrRaise(utf_prefix)
+    _uriValidOrRaise(utf_uri)
+    stale = [href for href, known in _DEFAULT_NAMESPACE_PREFIXES.items()
+             if href == utf_uri or known == utf_prefix]
+    for href in stale:
+        del _DEFAULT_NAMESPACE_PREFIXES[href]
+    _DEFAULT_NAMESPACE_PREFIXES[utf_uri] = utf_prefix
+
+
+# Error superclass for ElementTree compatibility
+class Error(Exception):  # base class of LxmlError
+    pass
+
+# module level superclass for all exceptions
+class LxmlError(Error):
+    u"""Main exception base class for lxml.  All other exceptions inherit from
+    this one.
+    """
+    def __init__(self, message, error_log=None):
+        super(_Error, self).__init__(message)  # _Error is the module-level alias of Error
+        if error_log is None:
+            self.error_log = __copyGlobalErrorLog()  # no log given => use this fallback
+        else:
+            self.error_log = error_log.copy()  # keep a copy, not the caller's object
+
+cdef object _Error = Error
+
+
+# superclass for all syntax errors
+class LxmlSyntaxError(LxmlError, SyntaxError):
+    u"""Base class for all syntax errors; also a builtin ``SyntaxError``.
+    """
+    pass
+
+class C14NError(LxmlError):
+    u"""Error during C14N (canonical XML) serialisation.
+    """
+    pass
+
+# version information
+cdef __unpackDottedVersion(version):
+    # Turn a dotted version byte string into a tuple of four parts, e.g.
+    # b"3.3.0" -> (3, 3, 0, 0).  "devN"/"alphaN"/"betaN" parts are mapped
+    # to -300+N/-200+N/-100+N; other non-numeric parts are kept as text.
+    parts = []
+    # '-' separates like '.'; pad with zeros so that four parts always exist
+    padded = version.decode("ascii").replace(u'-', u'.').split(u'.') + [0]*4
+    for part in padded[:4]:
+        try:
+            part = int(part)
+        except ValueError:
+            # pre-release markers become negative numbers
+            for marker, base in ((u'dev', -300), (u'alpha', -200),
+                                 (u'beta', -100)):
+                if part.startswith(marker):
+                    suffix = part[len(marker):]
+                    part = base
+                    if suffix:
+                        part += int(suffix)
+                    break
+        parts.append(part)
+    return tuple(parts)
+
+cdef __unpackIntVersion(int c_version):
+    # Split an integer like 20901 into its three two-digit groups (2, 9, 1).
+    cdef int major = (c_version / (100*100)) % 100
+    cdef int minor = (c_version / 100) % 100
+    cdef int patch = c_version % 100
+    return (major, minor, patch)
+
+cdef int _LIBXML_VERSION_INT
+try:
+    _LIBXML_VERSION_INT = int(
+        re.match(u'[0-9]+', (<unsigned char*>tree.xmlParserVersion).decode("ascii")).group(0))
+except Exception:
+    print u"Unknown libxml2 version: %s" % (<unsigned char*>tree.xmlParserVersion).decode("ascii")
+    _LIBXML_VERSION_INT = 0
+
+LIBXML_VERSION = __unpackIntVersion(_LIBXML_VERSION_INT)
+LIBXML_COMPILED_VERSION = __unpackIntVersion(tree.LIBXML_VERSION)
+LXML_VERSION = __unpackDottedVersion(tree.LXML_VERSION_STRING)
+
+__version__ = tree.LXML_VERSION_STRING.decode("ascii")
+
+
+# class for temporary storage of Python references,
+# used e.g. for XPath results
+@cython.final
+@cython.internal
+cdef class _TempStore:
+    cdef list _storage  # the Python objects that are currently kept referenced
+    def __init__(self):
+        self._storage = []
+
+    cdef int add(self, obj) except -1:  # keep a reference to ``obj``
+        self._storage.append(obj)
+        return 0
+
+    cdef int clear(self) except -1:  # drop all stored references
+        del self._storage[:]  # empties the list in place
+        return 0
+
+# class for temporarily storing exceptions raised in extensions
+@cython.internal
+cdef class _ExceptionContext:
+    cdef object _exc_info  # None or a 3-tuple in ``sys.exc_info()`` layout
+    cdef void clear(self):
+        self._exc_info = None
+
+    cdef void _store_raised(self):
+        self._exc_info = sys.exc_info()  # remember the exception being handled
+
+    cdef void _store_exception(self, exception):
+        self._exc_info = (exception, None, None)  # no value/traceback available
+
+    cdef bint _has_raised(self):
+        return self._exc_info is not None
+
+    cdef int _raise_if_stored(self) except -1:  # returns 0 if nothing was stored
+        if self._exc_info is None:
+            return 0
+        type, value, traceback = self._exc_info
+        self._exc_info = None  # a stored exception is raised only once
+        if value is None and traceback is None:
+            raise type  # stored via _store_exception() or without value/traceback
+        else:
+            raise type, value, traceback
+
+
+# forward declarations
+cdef public class _Document [ type LxmlDocumentType, object LxmlDocument ]
+cdef public class _Element [ type LxmlElementType, object LxmlElement ]
+cdef class _BaseParser
+cdef class QName
+ctypedef public xmlNode* (*_node_to_node_function)(xmlNode*)
+
+################################################################################
+# Include submodules
+
+include "proxy.pxi"        # Proxy handling (element backpointers/memory/etc.)
+include "apihelpers.pxi"   # Private helper functions
+include "xmlerror.pxi"     # Error and log handling
+
+
+################################################################################
+# Public Python API
+
+@cython.final
+@cython.freelist(8)
+cdef public class _Document [ type LxmlDocumentType, object LxmlDocument ]:
+    u"""Internal base class to reference a libxml document.
+
+    When instances of this class are garbage collected, the libxml
+    document is cleaned up.
+    """
+    cdef int _ns_counter  # number used by buildNewPrefix() for the next "nsX" prefix
+    cdef bytes _prefix_tail  # suffix for new prefixes, extended when the counter overflows
+    cdef xmlDoc* _c_doc  # the libxml2 document, freed in __dealloc__()
+    cdef _BaseParser _parser  # parser associated with the document by _documentFactory()
+    
+    def __dealloc__(self):
+        # if there are no more references to the document, it is safe
+        # to clean the whole thing up, as all nodes have a reference to
+        # the document
+        tree.xmlFreeDoc(self._c_doc)
+
+    @cython.final
+    cdef getroot(self):
+        # return an element proxy for the document root
+        cdef xmlNode* c_node
+        c_node = tree.xmlDocGetRootElement(self._c_doc)
+        if c_node is NULL:
+            return None  # the document has no root element
+        return _elementFactory(self, c_node)
+
+    @cython.final
+    cdef bint hasdoctype(self):
+        # DOCTYPE gets parsed into internal subset (xmlDTD*)
+        return self._c_doc is not NULL and self._c_doc.intSubset is not NULL
+
+    @cython.final
+    cdef getdoctype(self):
+        # get doctype info: root tag, public/system ID (or None if not known)
+        cdef tree.xmlDtd* c_dtd
+        cdef xmlNode* c_root_node
+        public_id = None
+        sys_url   = None
+        c_dtd = self._c_doc.intSubset
+        if c_dtd is not NULL:
+            if c_dtd.ExternalID is not NULL:
+                public_id = funicode(c_dtd.ExternalID)
+            if c_dtd.SystemID is not NULL:
+                sys_url = funicode(c_dtd.SystemID)
+        c_dtd = self._c_doc.extSubset  # only fills in what the internal subset lacks
+        if c_dtd is not NULL:
+            if not public_id and c_dtd.ExternalID is not NULL:
+                public_id = funicode(c_dtd.ExternalID)
+            if not sys_url and c_dtd.SystemID is not NULL:
+                sys_url = funicode(c_dtd.SystemID)
+        c_root_node = tree.xmlDocGetRootElement(self._c_doc)
+        if c_root_node is NULL:
+            root_name = None
+        else:
+            root_name = funicode(c_root_node.name)  # name of the actual root element
+        return (root_name, public_id, sys_url)
+
+    @cython.final
+    cdef getxmlinfo(self):
+        # return XML version and encoding (or None if not known)
+        cdef xmlDoc* c_doc = self._c_doc
+        if c_doc.version is NULL:
+            version = None
+        else:
+            version = funicode(c_doc.version)
+        if c_doc.encoding is NULL:
+            encoding = None
+        else:
+            encoding = funicode(c_doc.encoding)
+        return (version, encoding)
+
+    @cython.final
+    cdef isstandalone(self):
+        # returns None if libxml2 reports -1 for the flag, True for
+        # standalone="yes" (1) and False for every other value
+        if self._c_doc.standalone == -1:
+            return None
+        else:
+            return <bint>(self._c_doc.standalone == 1)
+
+    @cython.final
+    cdef bytes buildNewPrefix(self):
+        # get a new unique prefix ("nsX") for this document
+        cdef bytes ns
+        if self._ns_counter < len(_PREFIX_CACHE):
+            ns = _PREFIX_CACHE[self._ns_counter]  # reuse a prebuilt byte string
+        else:
+            ns = python.PyBytes_FromFormat("ns%d", self._ns_counter)
+        if self._prefix_tail is not None:
+            ns += self._prefix_tail
+        self._ns_counter += 1
+        if self._ns_counter < 0:
+            # overflow!
+            self._ns_counter = 0
+            if self._prefix_tail is None:
+                self._prefix_tail = b"A"
+            else:
+                self._prefix_tail += b"A"  # a longer tail keeps later prefixes distinct
+        return ns
+
+    @cython.final
+    cdef xmlNs* _findOrBuildNodeNs(self, xmlNode* c_node,
+                                   const_xmlChar* c_href, const_xmlChar* c_prefix,
+                                   bint is_attribute) except NULL:
+        u"""Get or create namespace structure for a node.  Reuses the prefix if
+        possible.
+        """
+        cdef xmlNs* c_ns
+        cdef xmlNs* c_doc_ns
+        cdef python.PyObject* dict_result
+        if c_node.type != tree.XML_ELEMENT_NODE:  # build the message only on failure
+            assert c_node.type == tree.XML_ELEMENT_NODE, \
+                u"invalid node type %d, expected %d" % (
+                c_node.type, tree.XML_ELEMENT_NODE)
+        # look for existing ns declaration
+        c_ns = _searchNsByHref(c_node, c_href, is_attribute)
+        if c_ns is not NULL:
+            if is_attribute and c_ns.prefix is NULL:
+                # do not put namespaced attributes into the default
+                # namespace as this would break serialisation
+                pass
+            else:
+                return c_ns
+
+        # none found => determine a suitable new prefix
+        if c_prefix is NULL:
+            dict_result = python.PyDict_GetItem(
+                _DEFAULT_NAMESPACE_PREFIXES, <unsigned char*>c_href)
+            if dict_result is not NULL:
+                prefix = <object>dict_result  # registered default prefix for this URI
+            else:
+                prefix = self.buildNewPrefix()
+            c_prefix = _xcstr(prefix)
+
+        # make sure the prefix is not in use already
+        while tree.xmlSearchNs(self._c_doc, c_node, c_prefix) is not NULL:
+            prefix = self.buildNewPrefix()
+            c_prefix = _xcstr(prefix)
+
+        # declare the namespace and return it
+        c_ns = tree.xmlNewNs(c_node, c_href, c_prefix)
+        if c_ns is NULL:
+            raise MemoryError()
+        return c_ns
+
+    @cython.final
+    cdef int _setNodeNs(self, xmlNode* c_node, const_xmlChar* c_href) except -1:
+        u"Lookup namespace structure and set it for the node."
+        c_ns = self._findOrBuildNodeNs(c_node, c_href, NULL, 0)  # no prefix wish, not an attribute
+        tree.xmlSetNs(c_node, c_ns)
+
+cdef tuple __initPrefixCache():  # builds the byte strings b"ns0" ... b"ns29"
+    cdef int i
+    return tuple([ python.PyBytes_FromFormat("ns%d", i)
+                   for i in range(30) ])
+
+cdef tuple _PREFIX_CACHE = __initPrefixCache()
+
+cdef _Document _documentFactory(xmlDoc* c_doc, _BaseParser parser):
+    # Wrap the libxml2 document ``c_doc`` in a new _Document.  If ``parser`` is
+    # None, __GLOBAL_PARSER_CONTEXT.getDefaultParser() is associated instead.
+    cdef _Document doc = _Document.__new__(_Document)
+    doc._c_doc = c_doc
+    doc._ns_counter = 0
+    doc._prefix_tail = None
+    doc._parser = (parser if parser is not None
+                   else __GLOBAL_PARSER_CONTEXT.getDefaultParser())
+    return doc
+
+
+cdef class DocInfo:
+    u"Document information provided by parser and DTD."
+    cdef _Document _doc  # the document that all properties below read from
+    def __cinit__(self, tree):
+        u"Create a DocInfo object for an ElementTree object or root Element."
+        self._doc = _documentOrRaise(tree)
+        root_name, public_id, system_url = self._doc.getdoctype()
+        if not root_name and (public_id or system_url):  # DOCTYPE IDs but no root element
+            raise ValueError, u"Could not find root node"
+
+    property root_name:
+        u"Returns the name of the root node as defined by the DOCTYPE."
+        def __get__(self):
+            root_name, public_id, system_url = self._doc.getdoctype()
+            return root_name
+
+    property public_id:
+        u"Returns the public ID of the DOCTYPE."
+        def __get__(self):
+            root_name, public_id, system_url = self._doc.getdoctype()
+            return public_id
+
+    property system_url:
+        u"Returns the system ID of the DOCTYPE."
+        def __get__(self):
+            root_name, public_id, system_url = self._doc.getdoctype()
+            return system_url
+
+    property xml_version:
+        u"Returns the XML version as declared by the document."
+        def __get__(self):
+            xml_version, encoding = self._doc.getxmlinfo()
+            return xml_version
+
+    property encoding:
+        u"Returns the encoding name as declared by the document."
+        def __get__(self):
+            xml_version, encoding = self._doc.getxmlinfo()
+            return encoding
+
+    property standalone:
+        u"""Returns the standalone flag as declared by the document.  The possible
+        values are True (``standalone='yes'``), False
+        (``standalone='no'`` or flag not provided in the declaration),
+        and None (unknown or no declaration found).  Note that a
+        normal truth test on this value will always tell if the
+        ``standalone`` flag was set to ``'yes'`` or not.
+        """
+        def __get__(self):
+            return self._doc.isstandalone()
+
+    property URL:
+        u"The source URL of the document (or None if unknown)."
+        def __get__(self):
+            if self._doc._c_doc.URL is NULL:
+                return None
+            return _decodeFilename(self._doc._c_doc.URL)
+        def __set__(self, url):
+            url = _encodeFilename(url)
+            c_oldurl = self._doc._c_doc.URL  # freed below, after the new value is set
+            if url is None:
+                self._doc._c_doc.URL = NULL
+            else:
+                self._doc._c_doc.URL = tree.xmlStrdup(_xcstr(url))  # the document gets its own copy
+            if c_oldurl is not NULL:
+                tree.xmlFree(<void*>c_oldurl)
+
+    property doctype:
+        u"Returns a DOCTYPE declaration string for the document."
+        def __get__(self):
+            root_name, public_id, system_url = self._doc.getdoctype()
+            if public_id:
+                if system_url:
+                    return u'<!DOCTYPE %s PUBLIC "%s" "%s">' % (
+                        root_name, public_id, system_url)
+                else:
+                    return u'<!DOCTYPE %s PUBLIC "%s">' % (
+                        root_name, public_id)
+            elif system_url:
+                return u'<!DOCTYPE %s SYSTEM "%s">' % (
+                    root_name, system_url)
+            elif self._doc.hasdoctype():  # internal subset without any external IDs
+                return u'<!DOCTYPE %s>' % root_name
+            else:
+                return u""  # the document has no DOCTYPE
+
+    property internalDTD:
+        u"Returns a DTD validator based on the internal subset of the document."
+        def __get__(self):
+            return _dtdFactory(self._doc._c_doc.intSubset)
+
+    property externalDTD:
+        u"Returns a DTD validator based on the external subset of the document."
+        def __get__(self):
+            return _dtdFactory(self._doc._c_doc.extSubset)
+
+
+@cython.no_gc_clear
+cdef public class _Element [ type LxmlElementType, object LxmlElement ]:
+    u"""Element class.
+
+    References a document object and a libxml node.
+
+    By pointing to a Document instance, a reference is kept to
+    _Document as long as there is some pointer to a node in it.
+    """
+    cdef _Document _doc
+    cdef xmlNode* _c_node
+    cdef object _tag
+
+    def _init(self):
+        u"""_init(self)
+
+        Called after object initialisation; does nothing by default.  Custom
+        subclasses may override it if they call _init() in the superclasses.
+        """
+
+    def __dealloc__(self):
+        #print "trying to free node:", <int>self._c_node
+        #displayNode(self._c_node, 0)
+        if self._c_node is not NULL:  # only if a C node is attached to this proxy
+            _unregisterProxy(self)
+            attemptDeallocation(self._c_node)
+
+    # MANIPULATORS
+
+    def __setitem__(self, x, value):
+        u"""__setitem__(self, x, value)
+
+        Replaces the subelement at index ``x`` or the subelements of slice ``x``.
+        """
+        cdef xmlNode* c_node = NULL
+        cdef xmlNode* c_next
+        cdef xmlDoc* c_source_doc
+        cdef _Element element
+        cdef bint left_to_right
+        cdef Py_ssize_t slicelength = 0, step = 0
+        _assertValidNode(self)
+        if value is None:
+            raise ValueError, u"cannot assign None"
+        if isinstance(x, slice):
+            # slice assignment
+            _findChildSlice(<slice>x, self._c_node, &c_node, &step, &slicelength)
+            if step > 0:
+                left_to_right = 1
+            else:
+                left_to_right = 0
+                step = -step  # pass the absolute step, the direction is in left_to_right
+            _replaceSlice(self, c_node, slicelength, step, left_to_right, value)
+            return
+        else:
+            # otherwise: normal item assignment
+            element = value  # typed assignment, rejects values that are not an _Element
+            _assertValidNode(element)
+            c_node = _findChild(self._c_node, x)
+            if c_node is NULL:
+                raise IndexError, u"list index out of range"
+            c_source_doc = element._c_node.doc  # both are read before the node is moved
+            c_next = element._c_node.next
+            _removeText(c_node.next)
+            tree.xmlReplaceNode(c_node, element._c_node)
+            _moveTail(c_next, element._c_node)
+            moveNodeToDocument(self._doc, c_source_doc, element._c_node)
+            if not attemptDeallocation(c_node):  # the replaced node was not freed
+                moveNodeToDocument(self._doc, c_node.doc, c_node)
+
+    def __delitem__(self, x):
+        u"""__delitem__(self, x)
+
+        Deletes the subelement at index ``x`` or the subelements of slice ``x``.
+        """
+        cdef xmlNode* c_node = NULL
+        cdef xmlNode* c_next
+        cdef Py_ssize_t step = 0, slicelength = 0
+        _assertValidNode(self)
+        if isinstance(x, slice):
+            # slice deletion
+            if _isFullSlice(<slice>x):  # remove every element child
+                c_node = self._c_node.children
+                if c_node is not NULL:
+                    if not _isElement(c_node):
+                        c_node = _nextElement(c_node)  # skip leading non-element nodes
+                    while c_node is not NULL:
+                        c_next = _nextElement(c_node)  # fetch before the node is removed
+                        _removeNode(self._doc, c_node)
+                        c_node = c_next
+            else:
+                _findChildSlice(<slice>x, self._c_node, &c_node, &step, &slicelength)
+                _deleteSlice(self._doc, c_node, slicelength, step)
+        else:
+            # item deletion
+            c_node = _findChild(self._c_node, x)
+            if c_node is NULL:
+                raise IndexError, u"index out of range: %d" % x
+            _removeText(c_node.next)
+            _removeNode(self._doc, c_node)
+
+    def __deepcopy__(self, memo):
+        u"__deepcopy__(self, memo)"
+        return self.__copy__()  # ``memo`` is not used
+        
+    def __copy__(self):
+        u"__copy__(self)"
+        cdef xmlDoc* c_doc
+        cdef xmlNode* c_node
+        cdef _Document new_doc
+        _assertValidNode(self)
+        c_doc = _copyDocRoot(self._doc._c_doc, self._c_node) # recursive
+        new_doc = _documentFactory(c_doc, self._doc._parser)  # the copy keeps the same parser
+        root = new_doc.getroot()
+        if root is not None:
+            return root
+        # Comment/PI
+        c_node = c_doc.children
+        while c_node is not NULL and c_node.type != self._c_node.type:
+            c_node = c_node.next  # find the first top-level node of the same type
+        if c_node is NULL:
+            return None
+        return _elementFactory(new_doc, c_node)
+
+    def set(self, key, value):
+        u"""set(self, key, value)
+
+        Sets the element attribute ``key`` to ``value``.
+        """
+        _assertValidNode(self)
+        _setAttributeValue(self, key, value)
+
+    def append(self, _Element element not None):
+        u"""append(self, element)
+
+        Adds a subelement to the end of this element.
+        """
+        _assertValidNode(self)
+        _assertValidNode(element)  # both proxies are checked before the tree is changed
+        _appendChild(self, element)
+
+    def addnext(self, _Element element not None):
+        u"""addnext(self, element)
+
+        Inserts ``element`` as the sibling that directly follows this
+        element.
+
+        The typical use case is placing a processing instruction or a
+        comment behind the root node of a document.  At the root level,
+        only processing instructions and comments are accepted (anything
+        else raises TypeError) and the tail text of ``element`` is
+        discarded automatically.
+        """
+        cdef xmlNode* c_parent
+        _assertValidNode(self)
+        _assertValidNode(element)
+        c_parent = self._c_node.parent
+        if c_parent != NULL and not _isElement(c_parent):
+            # self hangs below a non-element node, i.e. at the root level
+            if (element._c_node.type != tree.XML_PI_NODE and
+                    element._c_node.type != tree.XML_COMMENT_NODE):
+                raise TypeError(u"Only processing instructions and comments can be siblings of the root element")
+            element.tail = None
+        _appendSibling(self, element)
+
+    def addprevious(self, _Element element not None):
+        u"""addprevious(self, element)
+
+        Inserts ``element`` as the sibling that directly precedes this
+        element.
+
+        The typical use case is placing a processing instruction or a
+        comment in front of the root node of a document.  At the root
+        level, only processing instructions and comments are accepted
+        (anything else raises TypeError) and the tail text of ``element``
+        is discarded automatically.
+        """
+        cdef xmlNode* c_parent
+        _assertValidNode(self)
+        _assertValidNode(element)
+        c_parent = self._c_node.parent
+        if c_parent != NULL and not _isElement(c_parent):
+            # self hangs below a non-element node, i.e. at the root level
+            if (element._c_node.type != tree.XML_PI_NODE and
+                    element._c_node.type != tree.XML_COMMENT_NODE):
+                raise TypeError(u"Only processing instructions and comments can be siblings of the root element")
+            element.tail = None
+        _prependSibling(self, element)
+
+    def extend(self, elements):
+        u"""extend(self, elements)
+
+        Appends every element of the iterable ``elements`` as a child of
+        this element, in iteration order.
+
+        Raises TypeError if the iterable yields None.
+        """
+        cdef _Element element
+        _assertValidNode(self)
+        for element in elements:
+            if element is not None:
+                _assertValidNode(element)
+                _appendChild(self, element)
+            else:
+                raise TypeError(u"Node must not be None")
+
+    def clear(self):
+        u"""clear(self)
+
+        Resets an element.  This function removes all subelements, clears
+        all attributes and sets the text and tail properties to None.
+
+        The steps run in a fixed order: text and tail first, then the
+        attributes, then the child elements.
+        """
+        cdef xmlAttr* c_attr
+        cdef xmlAttr* c_attr_next
+        cdef xmlNode* c_node
+        cdef xmlNode* c_node_next
+        _assertValidNode(self)
+        c_node = self._c_node
+        # remove self.text and self.tail
+        _removeText(c_node.children)
+        _removeText(c_node.next)
+        # remove all attributes
+        c_attr = c_node.properties
+        while c_attr is not NULL:
+            # fetch the successor before the current attribute is removed
+            c_attr_next = c_attr.next
+            tree.xmlRemoveProp(c_attr)
+            c_attr = c_attr_next
+        # remove all subelements
+        c_node = c_node.children
+        if c_node is not NULL:
+            # start at the first child that counts as an element
+            if not _isElement(c_node):
+                c_node = _nextElement(c_node)
+            while c_node is not NULL:
+                # fetch the successor before the current node is removed
+                c_node_next = _nextElement(c_node)
+                _removeNode(self._doc, c_node)
+                c_node = c_node_next
+
+    def insert(self, index, _Element element not None):
+        u"""insert(self, index, element)
+
+        Inserts a subelement at the given position in this element.
+
+        If there is no child at ``index``, the element is appended to the
+        end of the children instead.
+        """
+        cdef xmlNode* c_node
+        cdef xmlNode* c_next
+        cdef xmlDoc* c_source_doc
+        _assertValidNode(self)
+        _assertValidNode(element)
+        c_node = _findChild(self._c_node, index)
+        if c_node is NULL:
+            _appendChild(self, element)
+            return
+        # Remember the document the inserted element comes *from* before it
+        # is relinked (same pattern as in replace()).  Reading the document
+        # of the target sibling here would hand the destination document to
+        # moveNodeToDocument() as the source.
+        c_source_doc = element._c_node.doc
+        # the node following the element must be captured before the move
+        c_next = element._c_node.next
+        tree.xmlAddPrevSibling(c_node, element._c_node)
+        _moveTail(c_next, element._c_node)
+        moveNodeToDocument(self._doc, c_source_doc, element._c_node)
+
+    def remove(self, _Element element not None):
+        u"""remove(self, element)
+
+        Removes a matching subelement. Unlike the find methods, this
+        method compares elements based on identity, not on tag value
+        or contents.
+
+        Raises ValueError if ``element`` is not a direct child of this
+        element.
+        """
+        cdef xmlNode* c_node
+        cdef xmlNode* c_next
+        _assertValidNode(self)
+        _assertValidNode(element)
+        c_node = element._c_node
+        if c_node.parent is not self._c_node:
+            raise ValueError, u"Element is not a child of this node."
+        # capture the following node before unlinking; it is passed to
+        # _moveTail() afterwards
+        c_next = element._c_node.next
+        tree.xmlUnlinkNode(c_node)
+        _moveTail(c_next, c_node)
+        # fix namespace declarations
+        moveNodeToDocument(self._doc, c_node.doc, c_node)
+
+    def replace(self, _Element old_element not None,
+                _Element new_element not None):
+        u"""replace(self, old_element, new_element)
+
+        Replaces a subelement with the element passed as second argument.
+
+        Raises ValueError if ``old_element`` is not a direct child of this
+        element.
+        """
+        cdef xmlNode* c_old_node
+        cdef xmlNode* c_old_next
+        cdef xmlNode* c_new_node
+        cdef xmlNode* c_new_next
+        cdef xmlDoc* c_source_doc
+        _assertValidNode(self)
+        _assertValidNode(old_element)
+        _assertValidNode(new_element)
+        c_old_node = old_element._c_node
+        if c_old_node.parent is not self._c_node:
+            raise ValueError, u"Element is not a child of this node."
+        # capture the successors and the source document of both nodes
+        # before the tree is modified
+        c_old_next = c_old_node.next
+        c_new_node = new_element._c_node
+        c_new_next = c_new_node.next
+        c_source_doc = c_new_node.doc
+        tree.xmlReplaceNode(c_old_node, c_new_node)
+        _moveTail(c_new_next, c_new_node)
+        _moveTail(c_old_next, c_old_node)
+        moveNodeToDocument(self._doc, c_source_doc, c_new_node)
+        # fix namespace declarations
+        moveNodeToDocument(self._doc, c_old_node.doc, c_old_node)
+        
+    # PROPERTIES
+    property tag:
+        u"""Element tag
+
+        The value is cached in ``self._tag`` after the first read and is
+        replaced whenever the tag is set.
+        """
+        def __get__(self):
+            # fast path: return the cached tag without validating the node
+            if self._tag is not None:
+                return self._tag
+            _assertValidNode(self)
+            self._tag = _namespacedName(self._c_node)
+            return self._tag
+    
+        def __set__(self, value):
+            cdef _BaseParser parser
+            _assertValidNode(self)
+            ns, name = _getNsTag(value)
+            parser = self._doc._parser
+            # documents created by an HTML parser use the HTML tag name check
+            if parser is not None and parser._for_html:
+                _htmlTagValidOrRaise(name)
+            else:
+                _tagValidOrRaise(name)
+            self._tag = value
+            tree.xmlNodeSetName(self._c_node, _xcstr(name))
+            if ns is None:
+                # no namespace in the new tag: drop the node's namespace
+                self._c_node.ns = NULL
+            else:
+                self._doc._setNodeNs(self._c_node, _xcstr(ns))
+
+    property attrib:
+        u"""Element attribute dictionary. Where possible, use get(), set(),
+        keys(), values() and items() to access element attributes.
+
+        Every access creates a new ``_Attrib`` object for this element.
+        """
+        def __get__(self):
+            return _Attrib.__new__(_Attrib, self)
+
+    property text:
+        u"""Text before the first subelement. This is either a string or 
+        the value None, if there was no text.
+
+        Assigning a ``QName`` stores its resolved text form (see
+        ``_resolveQNameText()``).
+        """
+        def __get__(self):
+            _assertValidNode(self)
+            return _collectText(self._c_node.children)
+
+        def __set__(self, value):
+            _assertValidNode(self)
+            if isinstance(value, QName):
+                # the resolved name is decoded from UTF-8 before it is stored
+                value = _resolveQNameText(self, value).decode('utf8')
+            _setNodeText(self._c_node, value)
+
+        # using 'del el.text' is the wrong thing to do
+        #def __del__(self):
+        #    _setNodeText(self._c_node, None)
+
+    property tail:
+        u"""Text after this element's end tag, but before the next sibling
+        element's start tag. This is either a string or the value None, if
+        there was no text.
+
+        The text is collected starting at the node that follows this
+        element.
+        """
+        def __get__(self):
+            _assertValidNode(self)
+            return _collectText(self._c_node.next)
+           
+        def __set__(self, value):
+            _assertValidNode(self)
+            _setTailText(self._c_node, value)
+
+        # using 'del el.tail' is the wrong thing to do
+        #def __del__(self):
+        #    _setTailText(self._c_node, None)
+
+    # not in ElementTree, read-only
+    property prefix:
+        u"""Namespace prefix or None.
+
+        None is returned both when the node has no namespace and when its
+        namespace has no prefix.
+        """
+        def __get__(self):
+            # NOTE(review): unlike most accessors, this one does not call
+            # _assertValidNode() before reading self._c_node.
+            if self._c_node.ns is not NULL:
+                if self._c_node.ns.prefix is not NULL:
+                    return funicode(self._c_node.ns.prefix)
+            return None
+
+    # not in ElementTree; readable and writable
+    property sourceline:
+        u"""Original line number as found by the parser or None if unknown.
+
+        Setting a value that is not positive stores 0, which reads back
+        as None.
+        """
+        def __get__(self):
+            cdef long line
+            _assertValidNode(self)
+            line = tree.xmlGetLineNo(self._c_node)
+            return line if line > 0 else None
+
+        def __set__(self, line):
+            _assertValidNode(self)
+            if line <= 0:
+                self._c_node.line = 0
+            else:
+                self._c_node.line = line
+
+    # not in ElementTree, read-only
+    property nsmap:
+        u"""Namespace prefix->URI mapping known in the context of this
+        Element.  This includes all namespace declarations of the
+        parents.
+
+        A prefix declared on this Element or on a closer ancestor takes
+        precedence over the same prefix declared further up.
+
+        Note that changing the returned dict has no effect on the Element.
+        """
+        def __get__(self):
+            cdef xmlNode* c_node
+            cdef xmlNs* c_ns
+            _assertValidNode(self)
+            nsmap = {}
+            c_node = self._c_node
+            # walk from this node up through its element ancestors
+            while c_node is not NULL and c_node.type == tree.XML_ELEMENT_NODE:
+                c_ns = c_node.nsDef
+                while c_ns is not NULL:
+                    prefix = funicodeOrNone(c_ns.prefix)
+                    # keep the innermost declaration of each prefix
+                    if prefix not in nsmap:
+                        nsmap[prefix] = funicodeOrNone(c_ns.href)
+                    c_ns = c_ns.next
+                c_node = c_node.parent
+            return nsmap
+
+    # not in ElementTree, read-only
+    property base:
+        u"""The base URI of the Element (xml:base or HTML base URL).
+        None if the base URI is unknown.
+
+        Note that the value depends on the URL of the document that
+        holds the Element if there is no xml:base attribute on the
+        Element or its ancestors.
+
+        Setting this property will set an xml:base attribute on the
+        Element, regardless of the document type (XML or HTML).
+        """
+        def __get__(self):
+            _assertValidNode(self)
+            c_base = tree.xmlNodeGetBase(self._doc._c_doc, self._c_node)
+            if c_base is NULL:
+                # no base found for the node: fall back to the document URL
+                if self._doc._c_doc.URL is NULL:
+                    return None
+                return _decodeFilename(self._doc._c_doc.URL)
+            try:
+                base = _decodeFilename(c_base)
+            finally:
+                # the returned string is released here, even if decoding fails
+                tree.xmlFree(c_base)
+            return base
+
+        def __set__(self, url):
+            _assertValidNode(self)
+            if url is None:
+                c_base = <const_xmlChar*>NULL
+            else:
+                url = _encodeFilename(url)
+                c_base = _xcstr(url)
+            tree.xmlNodeSetBase(self._c_node, c_base)
+
+    # ACCESSORS
+    def __repr__(self):
+        u"""__repr__(self)
+
+        Returns a string of the form ``<Element TAG at 0xID>``, built from
+        ``self.tag`` and ``id(self)``.
+        """
+        return u"<Element %s at 0x%x>" % (self.tag, id(self))
+
+    def __getitem__(self, x):
+        u"""Returns the subelement at the given position or the requested
+        slice.
+
+        Slices are returned as a list; an index that matches no child
+        raises IndexError.
+        """
+        cdef xmlNode* c_node = NULL
+        cdef Py_ssize_t step = 0, slicelength = 0
+        cdef Py_ssize_t c, i
+        cdef _node_to_node_function next_element
+        cdef list result
+        _assertValidNode(self)
+        if isinstance(x, slice):
+            # slicing
+            if _isFullSlice(<slice>x):
+                return _collectChildren(self)
+            _findChildSlice(<slice>x, self._c_node, &c_node, &step, &slicelength)
+            if c_node is NULL:
+                return []
+            # a negative step walks backwards using its absolute value
+            if step > 0:
+                next_element = _nextElement
+            else:
+                step = -step
+                next_element = _previousElement
+            result = []
+            c = 0
+            while c_node is not NULL and c < slicelength:
+                result.append(_elementFactory(self._doc, c_node))
+                c += 1
+                # advance 'step' elements to reach the next slice item
+                for i in range(step):
+                    c_node = next_element(c_node)
+            return result
+        else:
+            # indexing
+            c_node = _findChild(self._c_node, x)
+            if c_node is NULL:
+                raise IndexError, u"list index out of range"
+            return _elementFactory(self._doc, c_node)
+            
+    def __len__(self):
+        u"""__len__(self)
+
+        Returns the number of subelements, as counted by
+        ``_countElements()`` starting at the first child node.
+        """
+        _assertValidNode(self)
+        return _countElements(self._c_node.children)
+
+    def __nonzero__(self):
+        #u"__nonzero__(self)" # currently fails in Py3.1
+        # Truth testing an element always emits a FutureWarning and then
+        # returns the result of _hasChild() for this node.
+        import warnings
+        warnings.warn(
+            u"The behavior of this method will change in future versions. "
+            u"Use specific 'len(elem)' or 'elem is not None' test instead.",
+            FutureWarning
+            )
+        # emulate old behaviour
+        _assertValidNode(self)
+        return _hasChild(self._c_node)
+
+    def __contains__(self, element):
+        u"""__contains__(self, element)
+
+        Tells whether ``element`` is a direct child of this element.
+        Objects that are not ``_Element`` instances are never contained.
+        """
+        cdef xmlNode* c_node
+        _assertValidNode(self)
+        if isinstance(element, _Element):
+            c_node = (<_Element>element)._c_node
+            return c_node is not NULL and c_node.parent is self._c_node
+        return 0
+
+    def __iter__(self):
+        u"""__iter__(self)
+
+        Returns an ``ElementChildIterator`` over this element.
+        """
+        return ElementChildIterator(self)
+
+    def __reversed__(self):
+        u"""__reversed__(self)
+
+        Returns an ``ElementChildIterator`` over this element that is
+        created with ``reversed=True``.
+        """
+        return ElementChildIterator(self, reversed=True)
+
+    def index(self, _Element child not None, start=None, stop=None):
+        u"""index(self, child, start=None, stop=None)
+
+        Find the position of the child within the parent.
+
+        Only nodes for which ``_isElement()`` is true are counted.  The
+        optional ``start`` and ``stop`` arguments restrict the search to
+        a slice of the children; negative values are handled as well.
+
+        Raises ValueError if ``child`` is not a child of this element or
+        does not lie within the requested slice.
+
+        This method is not part of the original ElementTree API.
+        """
+        cdef Py_ssize_t k, l
+        cdef Py_ssize_t c_start, c_stop
+        cdef xmlNode* c_child
+        cdef xmlNode* c_start_node
+        _assertValidNode(self)
+        _assertValidNode(child)
+        c_child = child._c_node
+        if c_child.parent is not self._c_node:
+            raise ValueError, u"Element is not a child of this node."
+
+        # handle the unbounded search straight away (normal case)
+        if stop is None and (start is None or start == 0):
+            # count the element siblings in front of the child
+            k = 0
+            c_child = c_child.prev
+            while c_child is not NULL:
+                if _isElement(c_child):
+                    k += 1
+                c_child = c_child.prev
+            return k
+
+        # check indices
+        if start is None:
+            c_start = 0
+        else:
+            c_start = start
+        if stop is None:
+            # from here on, c_stop == 0 stands for "no upper bound"
+            c_stop = 0
+        else:
+            c_stop = stop
+            # an explicit stop of 0 or an obviously empty slice cannot match
+            if c_stop == 0 or \
+                   c_start >= c_stop and (c_stop > 0 or c_start < 0):
+                raise ValueError, u"list.index(x): x not in slice"
+
+        # for negative slice indices, check slice before searching index
+        if c_start < 0 or c_stop < 0:
+            # start from right, at most up to leftmost(c_start, c_stop)
+            if c_start < c_stop:
+                k = -c_start
+            else:
+                k = -c_stop
+            c_start_node = self._c_node.last
+            # l is the 1-based position of c_start_node counted from the end
+            l = 1
+            while c_start_node != c_child and l < k:
+                if _isElement(c_start_node):
+                    l += 1
+                c_start_node = c_start_node.prev
+            if c_start_node == c_child:
+                # found! before slice end?
+                if c_stop < 0 and l <= -c_stop:
+                    raise ValueError, u"list.index(x): x not in slice"
+            elif c_start < 0:
+                raise ValueError, u"list.index(x): x not in slice"
+
+        # now determine the index backwards from child
+        c_child = c_child.prev
+        k = 0
+        if c_stop > 0:
+            # we can optimize: stop after c_stop elements if not found
+            while c_child != NULL and k < c_stop:
+                if _isElement(c_child):
+                    k += 1
+                c_child = c_child.prev
+            if k < c_stop:
+                return k
+        else:
+            # traverse all
+            while c_child != NULL:
+                if _isElement(c_child):
+                    k = k + 1
+                c_child = c_child.prev
+            if c_start > 0:
+                if k >= c_start:
+                    return k
+            else:
+                return k
+        # not found: the message depends on whether a slice was requested
+        if c_start != 0 or c_stop != 0:
+            raise ValueError, u"list.index(x): x not in slice"
+        else:
+            raise ValueError, u"list.index(x): x not in list"
+
+    def get(self, key, default=None):
+        u"""get(self, key, default=None)
+
+        Gets an element attribute.
+
+        The lookup is delegated to ``_getAttributeValue()``, which also
+        receives ``default``.
+        """
+        _assertValidNode(self)
+        return _getAttributeValue(self, key, default)
+
+    def keys(self):
+        u"""keys(self)
+
+        Gets a list of attribute names.  The names are returned in an
+        arbitrary order (just like for an ordinary Python dictionary).
+        """
+        _assertValidNode(self)
+        # mode 1 presumably selects the attribute names; see _collectAttributes()
+        return _collectAttributes(self._c_node, 1)
+
+    def values(self):
+        u"""values(self)
+
+        Gets element attribute values as a sequence of strings.  The
+        attributes are returned in an arbitrary order.
+        """
+        _assertValidNode(self)
+        # mode 2 presumably selects the attribute values; see _collectAttributes()
+        return _collectAttributes(self._c_node, 2)
+
+    def items(self):
+        u"""items(self)
+
+        Gets element attributes, as a sequence. The attributes are returned in
+        an arbitrary order.
+        """
+        _assertValidNode(self)
+        # mode 3 presumably selects name/value pairs; see _collectAttributes()
+        return _collectAttributes(self._c_node, 3)
+
+    def getchildren(self):
+        u"""getchildren(self)
+
+        Returns all direct children.  The elements are returned in document
+        order.
+
+        This returns the same result as a full slice ``element[:]``; both
+        use ``_collectChildren()``.
+
+        :deprecated: Note that this method has been deprecated as of
+          ElementTree 1.3 and lxml 2.0.  New code should use
+          ``list(element)`` or simply iterate over elements.
+        """
+        _assertValidNode(self)
+        return _collectChildren(self)
+
+    def getparent(self):
+        u"""getparent(self)
+
+        Returns the parent element of this element, or None if this is
+        the root element.
+        """
+        cdef xmlNode* c_parent
+        #_assertValidNode(self) # not needed
+        c_parent = _parentElement(self._c_node)
+        if c_parent is not NULL:
+            return _elementFactory(self._doc, c_parent)
+        return None
+
+    def getnext(self):
+        u"""getnext(self)
+
+        Returns the sibling that follows this element, or None if there
+        is none.
+        """
+        cdef xmlNode* c_sibling
+        #_assertValidNode(self) # not needed
+        c_sibling = _nextElement(self._c_node)
+        if c_sibling is not NULL:
+            return _elementFactory(self._doc, c_sibling)
+        return None
+
+    def getprevious(self):
+        u"""getprevious(self)
+
+        Returns the sibling that precedes this element, or None if there
+        is none.
+        """
+        cdef xmlNode* c_sibling
+        #_assertValidNode(self) # not needed
+        c_sibling = _previousElement(self._c_node)
+        if c_sibling is not NULL:
+            return _elementFactory(self._doc, c_sibling)
+        return None
+
+    def itersiblings(self, tag=None, *tags, preceding=False):
+        u"""itersiblings(self, tag=None, *tags, preceding=False)
+
+        Iterate over the siblings of this element.
+
+        By default (``preceding=False``) the iterator moves forward over
+        the following siblings.  With ``preceding=True`` it yields the
+        preceding siblings in reverse document order, i.e. it starts
+        right before the current element and moves backwards.
+
+        The result can be restricted to elements with a specific tag,
+        see `iter`.
+        """
+        if tag is None:
+            selected = tags
+        else:
+            # a non-None 'tag' is added after the additional tags
+            selected = tags + (tag,)
+        return SiblingsIterator(self, selected, preceding=preceding)
+
+    def iterancestors(self, tag=None, *tags):
+        u"""iterancestors(self, tag=None, *tags)
+
+        Iterate over the ancestors of this element, moving from parent
+        to parent.
+
+        The result can be restricted to elements with a specific tag,
+        see `iter`.
+        """
+        if tag is None:
+            selected = tags
+        else:
+            # a non-None 'tag' is added after the additional tags
+            selected = tags + (tag,)
+        return AncestorsIterator(self, selected)
+
+    def iterdescendants(self, tag=None, *tags):
+        u"""iterdescendants(self, tag=None, *tags)
+
+        Iterate over the descendants of this element in document order.
+
+        In contrast to ``el.iter()``, the element itself is not part of
+        the iteration.  The result can be restricted to elements with a
+        specific tag, see `iter`.
+        """
+        if tag is None:
+            selected = tags
+        else:
+            # a non-None 'tag' is added after the additional tags
+            selected = tags + (tag,)
+        return ElementDepthFirstIterator(self, selected, inclusive=False)
+
+    def iterchildren(self, tag=None, *tags, reversed=False):
+        u"""iterchildren(self, tag=None, *tags, reversed=False)
+
+        Iterate over the children of this element.
+
+        In contrast to plain iteration over the element, the order can be
+        reversed with the 'reversed' keyword and the result can be
+        restricted to elements with a specific tag, see `iter`.
+        """
+        if tag is None:
+            selected = tags
+        else:
+            # a non-None 'tag' is added after the additional tags
+            selected = tags + (tag,)
+        return ElementChildIterator(self, selected, reversed=reversed)
+
+    def getroottree(self):
+        u"""getroottree(self)
+
+        Return an ElementTree for the root node of the document that
+        contains this element.
+
+        This is the same as following element.getparent() up the tree until it
+        returns None (for the root element) and then build an ElementTree for
+        the last parent that was returned.
+
+        Only the document is validated here, not this element's own node.
+        """
+        _assertValidDoc(self._doc)
+        return _elementTreeFactory(self._doc, None)
+
+    def getiterator(self, tag=None, *tags):
+        u"""getiterator(self, tag=None, *tags)
+
+        Returns an iterator over all elements in the subtree in document
+        order (depth first pre-order), starting with this element.
+
+        The result can be restricted to elements with a specific tag,
+        see `iter`.
+
+        :deprecated: Note that this method is deprecated as of
+          ElementTree 1.3 and lxml 2.0.  It returns an iterator in
+          lxml, which diverges from the original ElementTree
+          behaviour.  If you want an efficient iterator, use the
+          ``element.iter()`` method instead.  You should only use this
+          method in new code if you require backwards compatibility
+          with older versions of lxml or ElementTree.
+        """
+        if tag is None:
+            selected = tags
+        else:
+            # a non-None 'tag' is added after the additional tags
+            selected = tags + (tag,)
+        return ElementDepthFirstIterator(self, selected)
+
+    def iter(self, tag=None, *tags):
+        u"""iter(self, tag=None, *tags)
+
+        Iterate over all elements in the subtree in document order (depth
+        first pre-order), starting with this element.
+
+        To restrict the result to a specific tag, pass
+        ``"{ns}localname"`` as tag. Either or both of ``ns`` and
+        ``localname`` can be ``*`` for a wildcard; ``ns`` can be empty
+        for no namespace. ``"localname"`` is equivalent to ``"{}localname"``
+        (i.e. no namespace) but ``"*"`` is ``"{*}*"`` (any or no namespace),
+        not ``"{}*"``.
+
+        The Element, Comment, ProcessingInstruction and Entity factory
+        functions can be passed as well to look only for that specific
+        element type.
+
+        When more than one tag is passed, the iterator returns all
+        elements matching any of these tags, in document order.
+        """
+        if tag is None:
+            selected = tags
+        else:
+            # a non-None 'tag' is added after the additional tags
+            selected = tags + (tag,)
+        return ElementDepthFirstIterator(self, selected)
+
+    def itertext(self, tag=None, *tags, with_tail=True):
+        u"""itertext(self, tag=None, *tags, with_tail=True)
+
+        Iterates over the text content of a subtree.
+
+        A tag name can be passed to restrict the text content to specific
+        elements, see `iter`.
+
+        Pass ``with_tail=False`` to skip over tail text.
+        """
+        if tag is None:
+            selected = tags
+        else:
+            # a non-None 'tag' is added after the additional tags
+            selected = tags + (tag,)
+        return ElementTextIterator(self, selected, with_tail=with_tail)
+
+    def makeelement(self, _tag, attrib=None, nsmap=None, **_extra):
+        u"""makeelement(self, _tag, attrib=None, nsmap=None, **_extra)
+
+        Creates a new element associated with the same document.
+
+        ``attrib``, ``nsmap`` and the extra keyword arguments are passed
+        on to ``_makeElement()`` together with this element's document.
+        """
+        _assertValidDoc(self._doc)
+        return _makeElement(_tag, NULL, self._doc, None, None, None,
+                            attrib, nsmap, _extra)
+
+    def find(self, path, namespaces=None):
+        u"""find(self, path, namespaces=None)
+
+        Finds the first matching subelement, by tag name or path.
+
+        ``path`` may also be a ``QName``, in which case its text is used.
+
+        The optional ``namespaces`` argument accepts a
+        prefix-to-namespace mapping that allows the usage of XPath
+        prefixes in the path expression.
+        """
+        query = path
+        if isinstance(query, QName):
+            query = (<QName>query).text
+        return _elementpath.find(self, query, namespaces)
+
+    def findtext(self, path, default=None, namespaces=None):
+        u"""findtext(self, path, default=None, namespaces=None)
+
+        Finds text for the first matching subelement, by tag name or path.
+
+        ``path`` may also be a ``QName``, in which case its text is used.
+
+        The optional ``namespaces`` argument accepts a
+        prefix-to-namespace mapping that allows the usage of XPath
+        prefixes in the path expression.
+        """
+        query = path
+        if isinstance(query, QName):
+            query = (<QName>query).text
+        return _elementpath.findtext(self, query, default, namespaces)
+
+    def findall(self, path, namespaces=None):
+        u"""findall(self, path, namespaces=None)
+
+        Finds all matching subelements, by tag name or path.
+
+        ``path`` may also be a ``QName``, in which case its text is used.
+
+        The optional ``namespaces`` argument accepts a
+        prefix-to-namespace mapping that allows the usage of XPath
+        prefixes in the path expression.
+        """
+        query = path
+        if isinstance(query, QName):
+            query = (<QName>query).text
+        return _elementpath.findall(self, query, namespaces)
+
+    def iterfind(self, path, namespaces=None):
+        u"""iterfind(self, path, namespaces=None)
+
+        Iterates over all matching subelements, by tag name or path.
+
+        ``path`` may also be a ``QName``, in which case its text is used.
+
+        The optional ``namespaces`` argument accepts a
+        prefix-to-namespace mapping that allows the usage of XPath
+        prefixes in the path expression.
+        """
+        query = path
+        if isinstance(query, QName):
+            query = (<QName>query).text
+        return _elementpath.iterfind(self, query, namespaces)
+
+    def xpath(self, _path, *, namespaces=None, extensions=None,
+              smart_strings=True, **_variables):
+        u"""xpath(self, _path, namespaces=None, extensions=None, smart_strings=True, **_variables)
+
+        Evaluate an xpath expression using the element as context node.
+
+        All arguments after ``_path`` are keyword-only.  A new
+        ``XPathElementEvaluator`` is created on every call; additional
+        keyword arguments are passed to it as ``_variables`` when the
+        expression is evaluated.
+        """
+        evaluator = XPathElementEvaluator(self, namespaces=namespaces,
+                                          extensions=extensions,
+                                          smart_strings=smart_strings)
+        return evaluator(_path, **_variables)
+
+
+cdef extern from "etree_defs.h":
+    # macro call to 't->tp_new()' for fast instantiation
+    # (declared here under the name NEW_ELEMENT, mapped to the C name PY_NEW)
+    cdef object NEW_ELEMENT "PY_NEW" (object t)
+
+cdef _Element _elementFactory(_Document doc, xmlNode* c_node):
+    # Returns the Python proxy for c_node: an already registered proxy if
+    # there is one, None for a NULL node, otherwise a new instance of the
+    # class selected by the element class lookup.
+    cdef _Element result
+    result = getProxy(c_node)
+    if result is not None:
+        return result
+    if c_node is NULL:
+        return None
+
+    element_class = LOOKUP_ELEMENT_CLASS(
+        ELEMENT_CLASS_LOOKUP_STATE, doc, c_node)
+    if hasProxy(c_node):
+        # prevent re-entry race condition - we just called into Python
+        return getProxy(c_node)
+    result = NEW_ELEMENT(element_class)
+    if hasProxy(c_node):
+        # prevent re-entry race condition - we just called into Python
+        # the new, unregistered instance is detached from the node first
+        # (presumably so that discarding it does not affect c_node)
+        result._c_node = NULL
+        return getProxy(c_node)
+
+    _registerProxy(result, doc, c_node)
+    # only subclasses get their _init() hook called
+    if element_class is not _Element:
+        result._init()
+    return result
+
+
+@cython.internal
+cdef class __ContentOnlyElement(_Element):
+    # Common base class of node types that carry only text content and
+    # have neither children nor attributes.  All mutating container and
+    # attribute operations raise TypeError, the read accessors behave
+    # like those of an empty element.
+    cdef int _raiseImmutable(self) except -1:
+        raise TypeError, u"this element does not have children or attributes"
+
+    def set(self, key, value):
+        u"""set(self, key, value)
+
+        Always raises TypeError.
+        """
+        self._raiseImmutable()
+
+    def append(self, value):
+        u"""append(self, value)
+
+        Always raises TypeError.
+        """
+        self._raiseImmutable()
+
+    def insert(self, index, value):
+        u"""insert(self, index, value)
+
+        Always raises TypeError.
+        """
+        self._raiseImmutable()
+
+    def __setitem__(self, index, value):
+        u"""__setitem__(self, index, value)
+
+        Always raises TypeError.
+        """
+        self._raiseImmutable()
+
+    property attrib:
+        def __get__(self):
+            return IMMUTABLE_EMPTY_MAPPING
+
+    property text:
+        def __get__(self):
+            _assertValidNode(self)
+            return funicodeOrEmpty(self._c_node.content)
+
+        def __set__(self, value):
+            _assertValidNode(self)
+            if value is None:
+                c_text = <const_xmlChar*>NULL
+            else:
+                # 'value' keeps the encoded string referenced while its
+                # C pointer is in use
+                value = _utf8(value)
+                c_text = _xcstr(value)
+            tree.xmlNodeSetContent(self._c_node, c_text)
+
+    # ACCESSORS
+    def __getitem__(self, x):
+        u"""__getitem__(self, x)
+
+        Returns an empty list for slices and raises IndexError for any
+        index, since there are no children.
+        """
+        if isinstance(x, slice):
+            return []
+        else:
+            raise IndexError, u"list index out of range"
+
+    def __len__(self):
+        u"""__len__(self)
+
+        Always 0.
+        """
+        return 0
+
+    def get(self, key, default=None):
+        u"""get(self, key, default=None)
+
+        There are no attributes, so the lookup never succeeds and
+        ``default`` is returned.
+        """
+        return default
+
+    def keys(self):
+        u"""keys(self)
+
+        Always returns an empty list.
+        """
+        return []
+    
+    def items(self):
+        u"""items(self)
+
+        Always returns an empty list.
+        """
+        return []
+
+    def values(self):
+        u"""values(self)
+
+        Always returns an empty list.
+        """
+        return []
+
+cdef class _Comment(__ContentOnlyElement):
+    # Proxy class for comment nodes.
+    property tag:
+        # the tag of a comment is the Comment factory function itself
+        def __get__(self):
+            return Comment
+
+    def __repr__(self):
+        # rendered in XML comment syntax around self.text
+        return u"<!--%s-->" % self.text
+    
+cdef class _ProcessingInstruction(__ContentOnlyElement):
+    # Proxy class for processing instruction nodes.
+    property tag:
+        # the tag of a PI is the ProcessingInstruction factory function itself
+        def __get__(self):
+            return ProcessingInstruction
+
+    property target:
+        # not in ElementTree
+        # The target is stored as the name of the underlying node.
+        def __get__(self):
+            _assertValidNode(self)
+            return funicode(self._c_node.name)
+
+        def __set__(self, value):
+            _assertValidNode(self)
+            value = _utf8(value)
+            c_text = _xcstr(value)
+            tree.xmlNodeSetName(self._c_node, c_text)
+
+    def __repr__(self):
+        # rendered in PI syntax; the text part is left out when it is empty
+        text = self.text
+        if text:
+            return u"<?%s %s?>" % (self.target, text)
+        else:
+            return u"<?%s?>" % self.target
+
+    def get(self, key, default=None):
+        u"""get(self, key, default=None)
+
+        Try to parse pseudo-attributes from the text content of the
+        processing instruction, search for one with the given key as
+        name and return its associated value.
+
+        Note that this is only a convenience method for the most
+        common case that all text content is structured in
+        attribute-like name-value pairs with properly quoted values.
+        It is not guaranteed to work for all possible text content.
+        """
+        return self.attrib.get(key, default)
+
+    property attrib:
+        u"""Returns a dict containing all pseudo-attributes that can be
+        parsed from the text content of this processing instruction.
+        Note that modifying the dict currently has no effect on the
+        XML node, although this is not guaranteed to stay this way.
+        """
+        def __get__(self):
+            # A space is prepended because the pattern requires whitespace
+            # in front of every name.  value1/value2 are the single- and
+            # double-quoted alternatives of the pattern.
+            return { attr : (value1 or value2)
+                     for attr, value1, value2 in _FIND_PI_ATTRIBUTES(u' ' + self.text) }
+
+# Bound ``findall`` of a pattern matching whitespace-preceded
+# ``name='value'`` or ``name="value"`` pairs.  Each match is a tuple
+# (name, single-quoted value, double-quoted value); the group of the
+# quote style that was not used is the empty string.
+cdef object _FIND_PI_ATTRIBUTES = re.compile(ur'\s+(\w+)\s*=\s*(?:\'([^\']*)\'|"([^"]*)")', re.U).findall
+
+cdef class _Entity(__ContentOnlyElement):
+    u"""Content-only node whose ``tag`` is the ``Entity`` factory.  The
+    node name is exposed as ``name``; ``text`` renders it as ``&name;``.
+    """
+    property tag:
+        def __get__(self):
+            return Entity
+
+    property name:
+        # not in ElementTree
+        def __get__(self):
+            _assertValidNode(self)
+            return funicode(self._c_node.name)
+
+        def __set__(self, value):
+            _assertValidNode(self)
+            encoded_name = _utf8(value)
+            # '&' and ';' are rejected anywhere in the name
+            for delimiter in (b'&', b';'):
+                if delimiter in encoded_name:
+                    raise ValueError(u"Invalid entity name '%s'" % value)
+            tree.xmlNodeSetName(self._c_node, _xcstr(encoded_name))
+
+    property text:
+        # FIXME: should this be None or '&[VALUE];' or the resolved
+        # entity value ?
+        def __get__(self):
+            _assertValidNode(self)
+            entity_name = funicode(self._c_node.name)
+            return u'&%s;' % entity_name
+
+    def __repr__(self):
+        return u"&%s;" % self.name
+
+
+cdef class QName:
+    u"""QName(text_or_uri_or_element, tag=None)
+
+    QName wrapper for qualified XML names.
+
+    Pass a tag name by itself or a namespace URI and a tag name to
+    create a qualified name.  Alternatively, pass an Element to
+    extract its tag name.
+
+    The ``text`` property holds the qualified name in
+    ``{namespace}tagname`` notation.  The ``namespace`` and
+    ``localname`` properties hold the respective parts of the tag
+    name.
+
+    You can pass QName objects wherever a tag name is expected.  Also,
+    setting Element text from a QName will resolve the namespace
+    prefix and set a qualified text value.  This is helpful in XML
+    languages like SOAP or XML-Schema that use prefixed tag names in
+    their text content.
+    """
+    cdef readonly unicode text
+    cdef readonly unicode localname
+    cdef readonly unicode namespace
+    def __init__(self, text_or_uri_or_element, tag=None):
+        # step 1: reduce the first argument to a string
+        if _isString(text_or_uri_or_element):
+            pass
+        elif isinstance(text_or_uri_or_element, _Element):
+            text_or_uri_or_element = (<_Element>text_or_uri_or_element).tag
+            if not _isString(text_or_uri_or_element):
+                raise ValueError, (u"Invalid input tag of type %r" %
+                                   type(text_or_uri_or_element))
+        elif isinstance(text_or_uri_or_element, QName):
+            text_or_uri_or_element = (<QName>text_or_uri_or_element).text
+        else:
+            text_or_uri_or_element = unicode(text_or_uri_or_element)
+
+        # step 2: split it and merge in the explicit tag, if any
+        href_utf, name_utf = _getNsTag(text_or_uri_or_element)
+        if tag is not None:
+            # either ('ns', 'tag') or ('{ns}oldtag', 'newtag')
+            if href_utf is None:
+                # case 1: the lone first argument was the namespace
+                href_utf = name_utf
+            name_utf = _utf8(tag)
+        _tagValidOrRaise(name_utf)
+
+        # step 3: publish the decoded parts
+        self.localname = (<bytes>name_utf).decode('utf8')
+        if href_utf is not None:
+            self.namespace = (<bytes>href_utf).decode('utf8')
+            self.text = u"{%s}%s" % (self.namespace, self.localname)
+        else:
+            self.namespace = None
+            self.text = self.localname
+    def __str__(self):
+        return self.text
+    def __hash__(self):
+        # hashes like its text
+        return hash(self.text)
+    def __richcmp__(one, other, int op):
+        # compare by text: QNames contribute their ``text``, anything
+        # else that is not already unicode is converted with unicode()
+        try:
+            if type(one) is not QName:
+                if not isinstance(one, unicode):
+                    one = unicode(one)
+            else:
+                one = (<QName>one).text
+            if type(other) is not QName:
+                if not isinstance(other, unicode):
+                    other = unicode(other)
+            else:
+                other = (<QName>other).text
+        except (ValueError, UnicodeDecodeError):
+            return NotImplemented
+        return python.PyObject_RichCompare(one, other, op)
+
+
+cdef public class _ElementTree [ type LxmlElementTreeType,
+                                 object LxmlElementTree ]:
+    cdef _Document _doc
+    cdef _Element _context_node
+
+    # Note that _doc is only used to store the original document if we do not
+    # have a _context_node.  All methods should prefer self._context_node._doc
+    # to honour tree restructuring.  _doc can happily be None!
+
+    @cython.final
+    cdef int _assertHasRoot(self) except -1:
+        u"""Assert that this tree has a root element.
+
+        We have to take care here: the document may not have a root node!
+        This can happen if ElementTree() is called without any argument and
+        the caller 'forgets' to call parse() afterwards, so this is a bug in
+        the caller program.
+
+        Returns 0 when a root is set; the assertion fails otherwise.
+        """
+        assert self._context_node is not None, \
+               u"ElementTree not initialized, missing root"
+        return 0
+
+    def parse(self, source, _BaseParser parser=None, *, base_url=None):
+        u"""parse(self, source, parser=None, base_url=None)
+
+        Updates self with the content of source and returns its root.
+
+        If the parsed document has no root element, the document itself
+        is stored on the tree.  If parsing ends with a
+        ``_TargetParserResult``, its ``result`` becomes the root instead.
+        """
+        cdef _Document doc = None
+        try:
+            doc = _parseDocument(source, parser, base_url)
+            self._context_node = doc.getroot()
+            if self._context_node is None:
+                # no root element to reach the document through
+                self._doc = doc
+        except _TargetParserResult as result_container:
+            # raises a TypeError if we don't get an _Element
+            self._context_node = result_container.result
+        return self._context_node
+
+    def _setroot(self, _Element root not None):
+        u"""_setroot(self, root)
+
+        Relocate the ElementTree to a new root node.
+
+        Raises TypeError if ``root`` is not an element node.
+        """
+        _assertValidNode(root)
+        if root._c_node.type != tree.XML_ELEMENT_NODE:
+            raise TypeError, u"Only elements can be the root of an ElementTree"
+        self._context_node = root
+        # drop the separately stored document now that a root is set
+        self._doc = None
+
+    def getroot(self):
+        u"""getroot(self)
+
+        Gets the root element for this tree, or None if no root has
+        been set.
+        """
+        return self._context_node
+
+    def __copy__(self):
+        # new tree object built from the same document and root references
+        return _elementTreeFactory(self._doc, self._context_node)
+
+    def __deepcopy__(self, memo):
+        u"""__deepcopy__(self, memo)
+
+        Return an independent copy of this tree.
+
+        With a root element, the root is copied together with its
+        non-element siblings, and the internal and external DTD subsets
+        of the source document are copied wherever the new document does
+        not have one yet.  Without a root but with a document, the whole
+        document is copied.  A completely empty tree is returned as is.
+
+        Raises MemoryError if copying a root-less document fails.
+        """
+        cdef _Element root
+        cdef _Document doc
+        cdef xmlDoc* c_doc
+        if self._context_node is not None:
+            root = self._context_node.__copy__()
+            assert root is not None
+            _assertValidNode(root)
+            _copyNonElementSiblings(self._context_node._c_node, root._c_node)
+            doc = root._doc
+            c_doc = self._context_node._doc._c_doc
+            # Only fill in a subset that the copy lacks; assigning over an
+            # existing pointer would drop the DTD already attached there.
+            if c_doc.intSubset is not NULL and doc._c_doc.intSubset is NULL:
+                doc._c_doc.intSubset = _copyDtd(c_doc.intSubset)
+            if c_doc.extSubset is not NULL and doc._c_doc.extSubset is NULL:
+                doc._c_doc.extSubset = _copyDtd(c_doc.extSubset)
+            return _elementTreeFactory(None, root)
+        elif self._doc is not None:
+            _assertValidDoc(self._doc)
+            # second argument 1: recursive copy of the document
+            c_doc = tree.xmlCopyDoc(self._doc._c_doc, 1)
+            if c_doc is NULL:
+                raise MemoryError()
+            doc = _documentFactory(c_doc, self._doc._parser)
+            return _elementTreeFactory(doc, None)
+        else:
+            # so what ...
+            return self
+
+    # not in ElementTree, read-only
+    property docinfo:
+        u"""Information about the document provided by parser and DTD.  This
+        value is only defined for ElementTree objects based on the root node
+        of a parsed document (e.g.  those returned by the parse functions),
+        not for trees that were built manually.
+        """
+        def __get__(self):
+            # a root is required: the info is taken from the root's document
+            self._assertHasRoot()
+            return DocInfo(self._context_node._doc)
+
+    # not in ElementTree, read-only
+    property parser:
+        u"""The parser that was used to parse the document in this ElementTree.
+        """
+        def __get__(self):
+            cdef _Document doc = None
+            # the root's document takes precedence over the stored one
+            if self._context_node is not None:
+                doc = self._context_node._doc
+            if doc is None:
+                doc = self._doc
+            if doc is None:
+                return None
+            return doc._parser
+
+    def write(self, file, *, encoding=None, method=u"xml",
+              pretty_print=False, xml_declaration=None, with_tail=True,
+              standalone=None, docstring=None, compression=0,
+              exclusive=False, with_comments=True, inclusive_ns_prefixes=None):
+        u"""write(self, file, encoding=None, method="xml",
+                  pretty_print=False, xml_declaration=None, with_tail=True,
+                  standalone=None, compression=0,
+                  exclusive=False, with_comments=True, inclusive_ns_prefixes=None)
+
+        Write the tree to a filename, file or file-like object.
+
+        Defaults to ASCII encoding and writing a declaration as needed.
+
+        The keyword argument 'method' selects the output method:
+        'xml', 'html', 'text' or 'c14n'.  Default is 'xml'.
+
+        The ``exclusive`` and ``with_comments`` arguments are only
+        used with C14N output, where they request exclusive and
+        uncommented C14N serialisation respectively.
+
+        Passing a boolean value to the ``standalone`` option will
+        output an XML declaration with the corresponding
+        ``standalone`` flag.
+
+        The ``compression`` option enables GZip compression level 1-9.
+
+        The ``inclusive_ns_prefixes`` should be a list of namespace strings
+        (i.e. ['xs', 'xsi']) that will be promoted to the top-level element
+        during exclusive C14N serialisation.  This parameter is ignored if
+        exclusive mode=False.
+
+        If exclusive=True and no list is provided, a namespace will only be
+        rendered if it is used by the immediate parent or one of its attributes
+        and its prefix and values have not already been rendered by an ancestor
+        of the namespace node's parent element.
+
+        The ``docstring`` keyword is not listed in the signature line
+        above; its value is handed unchanged to the serialiser for all
+        methods except 'c14n'.
+        NOTE(review): the name looks like a typo for ``doctype`` --
+        confirm against ``_tofilelike``.
+
+        Raises ValueError if ``encoding`` or a true ``xml_declaration``
+        is combined with method 'c14n', or if ``with_comments`` is false
+        for any other method.
+        """
+        cdef bint write_declaration
+        cdef int is_standalone
+
+        self._assertHasRoot()
+        _assertValidNode(self._context_node)
+        # None and negative levels are treated as 0
+        if compression is None or compression < 0:
+            compression = 0
+
+        # C14N serialisation
+        if method == 'c14n':
+            if encoding is not None:
+                raise ValueError("Cannot specify encoding with C14N")
+            if xml_declaration:
+                raise ValueError("Cannot enable XML declaration in C14N")
+
+            _tofilelikeC14N(file, self._context_node, exclusive, with_comments,
+                            compression, inclusive_ns_prefixes)
+            return
+        if not with_comments:
+            raise ValueError("Can only discard comments in C14N serialisation")
+        # suppress decl. in default case (purely for ElementTree compatibility)
+        if xml_declaration is not None:
+            # explicit request: honour it, only normalise the encoding name
+            write_declaration = xml_declaration
+            if encoding is None:
+                encoding = u'ASCII'
+            else:
+                encoding = encoding.upper()
+        elif encoding is None:
+            encoding = u'ASCII'
+            write_declaration = 0
+        else:
+            # no explicit request: declare only encodings outside this list
+            encoding = encoding.upper()
+            write_declaration = encoding not in \
+                                  (u'US-ASCII', u'ASCII', u'UTF8', u'UTF-8')
+        # any non-None 'standalone' forces a declaration; -1 means "not given"
+        if standalone is None:
+            is_standalone = -1
+        elif standalone:
+            write_declaration = 1
+            is_standalone = 1
+        else:
+            write_declaration = 1
+            is_standalone = 0
+        _tofilelike(file, self._context_node, encoding, docstring, method,
+                    write_declaration, 1, pretty_print, with_tail,
+                    is_standalone, compression)
+
+    def getpath(self, _Element element not None):
+        u"""getpath(self, element)
+
+        Returns a structural, absolute XPath expression to find that element.
+
+        Raises ValueError if the tree is empty or ``element`` belongs to
+        a different document, and MemoryError if libxml2 returns no path.
+        """
+        cdef _Document doc
+        cdef _Element root
+        cdef xmlDoc* c_doc
+        _assertValidNode(element)
+        if self._context_node is not None:
+            root = self._context_node
+            doc = root._doc
+        elif self._doc is not None:
+            doc = self._doc
+            root = doc.getroot()
+        else:
+            raise ValueError, u"Element is not in this tree."
+        _assertValidDoc(doc)
+        _assertValidNode(root)
+        if element._doc is not doc:
+            raise ValueError, u"Element is not in this tree."
+
+        # compute the path while a fake document rooted at this tree's
+        # root is set up, and tear it down again right afterwards
+        c_doc = _fakeRootDoc(doc._c_doc, root._c_node)
+        c_path = tree.xmlGetNodePath(element._c_node)
+        _destroyFakeDoc(doc._c_doc, c_doc)
+        if c_path is NULL:
+            raise MemoryError()
+        # convert first, then free the C string
+        path = funicode(c_path)
+        tree.xmlFree(c_path)
+        return path
+
+    def getiterator(self, tag=None, *tags):
+        u"""getiterator(self, tag=None, *tags)
+
+        Returns a sequence or iterator of all elements in document order
+        (depth first pre-order), starting with the root element.
+
+        Can be restricted to find only elements with a specific tag,
+        see `_Element.iter`.
+
+        :deprecated: Note that this method is deprecated as of
+          ElementTree 1.3 and lxml 2.0.  It returns an iterator in
+          lxml, which diverges from the original ElementTree
+          behaviour.  If you want an efficient iterator, use the
+          ``tree.iter()`` method instead.  You should only use this
+          method in new code if you require backwards compatibility
+          with older versions of lxml or ElementTree.
+        """
+        root = self.getroot()
+        if root is None:
+            # nothing to iterate over without a root
+            return ITER_EMPTY
+        if tag is not None:
+            # fold the first positional tag into the others
+            tags += (tag,)
+        return root.getiterator(*tags)
+
+    def iter(self, tag=None, *tags):
+        u"""iter(self, tag=None, *tags)
+
+        Creates an iterator for the root element.  The iterator loops over
+        all elements in this tree, in document order.  A tree without a
+        root yields nothing.
+
+        Can be restricted to find only elements with a specific tag,
+        see `_Element.iter`.
+        """
+        start = self.getroot()
+        if start is not None:
+            # a non-None 'tag' is passed on together with 'tags'
+            selected = tags if tag is None else tags + (tag,)
+            return start.iter(*selected)
+        return ITER_EMPTY
+
+    def find(self, path, namespaces=None):
+        u"""find(self, path, namespaces=None)
+
+        Finds the first toplevel element with given tag.  Same as
+        ``tree.getroot().find(path)``.
+
+        The optional ``namespaces`` argument accepts a
+        prefix-to-namespace mapping that allows the usage of XPath
+        prefixes in the path expression.
+        """
+        self._assertHasRoot()
+        start = self.getroot()
+        # a string path starting with "/" gets "." prepended
+        if _isString(path) and path[:1] == "/":
+            path = "." + path
+        return start.find(path, namespaces)
+
+    def findtext(self, path, default=None, namespaces=None):
+        u"""findtext(self, path, default=None, namespaces=None)
+
+        Finds the text for the first element matching the ElementPath
+        expression.  Same as getroot().findtext(path)
+
+        The optional ``namespaces`` argument accepts a
+        prefix-to-namespace mapping that allows the usage of XPath
+        prefixes in the path expression.
+        """
+        self._assertHasRoot()
+        start = self.getroot()
+        # a string path starting with "/" gets "." prepended
+        if _isString(path) and path[:1] == "/":
+            path = "." + path
+        return start.findtext(path, default, namespaces)
+
+    def findall(self, path, namespaces=None):
+        u"""findall(self, path, namespaces=None)
+
+        Finds all elements matching the ElementPath expression.  Same as
+        getroot().findall(path).
+
+        The optional ``namespaces`` argument accepts a
+        prefix-to-namespace mapping that allows the usage of XPath
+        prefixes in the path expression.
+        """
+        self._assertHasRoot()
+        start = self.getroot()
+        # a string path starting with "/" gets "." prepended
+        if _isString(path) and path[:1] == "/":
+            path = "." + path
+        return start.findall(path, namespaces)
+
+    def iterfind(self, path, namespaces=None):
+        u"""iterfind(self, path, namespaces=None)
+
+        Iterates over all elements matching the ElementPath expression.
+        Same as getroot().iterfind(path).
+
+        The optional ``namespaces`` argument accepts a
+        prefix-to-namespace mapping that allows the usage of XPath
+        prefixes in the path expression.
+        """
+        self._assertHasRoot()
+        start = self.getroot()
+        # a string path starting with "/" gets "." prepended
+        if _isString(path) and path[:1] == "/":
+            path = "." + path
+        return start.iterfind(path, namespaces)
+
+    def xpath(self, _path, *, namespaces=None, extensions=None,
+              smart_strings=True, **_variables):
+        u"""xpath(self, _path, namespaces=None, extensions=None, smart_strings=True, **_variables)
+
+        XPath evaluate in context of document.
+
+        ``namespaces`` is an optional dictionary with prefix to namespace URI
+        mappings, used by XPath.  ``extensions`` defines additional extension
+        functions.
+
+        Returns a list (nodeset), or bool, float or string.
+
+        In case of a list result, return Element for element nodes,
+        string for text and attribute values.
+
+        Note: if you are going to apply multiple XPath expressions
+        against the same document, it is more efficient to use
+        XPathEvaluator directly.
+        """
+        self._assertHasRoot()
+        # a one-shot evaluator is created for this single call
+        return XPathDocumentEvaluator(
+            self, namespaces=namespaces, extensions=extensions,
+            smart_strings=smart_strings)(_path, **_variables)
+
+    def xslt(self, _xslt, extensions=None, access_control=None, **_kw):
+        u"""xslt(self, _xslt, extensions=None, access_control=None, **_kw)
+
+        Transform this document using other document.
+
+        xslt is a tree that should be XSLT
+        keyword parameters are XSLT transformation parameters.
+
+        Returns the transformed tree.
+
+        Note: if you are going to apply the same XSLT stylesheet against
+        multiple documents, it is more efficient to use the XSLT
+        class directly.
+        """
+        self._assertHasRoot()
+        # a fresh XSLT object is built for every call
+        transform = XSLT(
+            _xslt, extensions=extensions, access_control=access_control)
+        return transform(self, **_kw)
+
+    def relaxng(self, relaxng):
+        u"""relaxng(self, relaxng)
+
+        Validate this document using other document.
+
+        The relaxng argument is a tree that should contain a Relax NG schema.
+
+        Returns True or False, depending on whether validation
+        succeeded.
+
+        Note: if you are going to apply the same Relax NG schema against
+        multiple documents, it is more efficient to use the RelaxNG
+        class directly.
+        """
+        self._assertHasRoot()
+        # the schema object is built anew for every call
+        return RelaxNG(relaxng).validate(self)
+
+    def xmlschema(self, xmlschema):
+        u"""xmlschema(self, xmlschema)
+
+        Validate this document using other document.
+
+        The xmlschema argument is a tree that should contain an XML Schema.
+
+        Returns True or False, depending on whether validation
+        succeeded.
+
+        Note: If you are going to apply the same XML Schema against
+        multiple documents, it is more efficient to use the XMLSchema
+        class directly.
+        """
+        self._assertHasRoot()
+        # the schema object is built anew for every call
+        return XMLSchema(xmlschema).validate(self)
+
+    def xinclude(self):
+        u"""xinclude(self)
+
+        Process the XInclude nodes in this document and include the
+        referenced XML fragments.
+
+        There is support for loading files through the file system, HTTP and
+        FTP.
+
+        Note that XInclude does not support custom resolvers in Python space
+        due to restrictions of libxml2 <= 2.6.29.
+        """
+        self._assertHasRoot()
+        # processing is applied to the root element
+        XInclude()(self._context_node)
+
+    def write_c14n(self, file, *, exclusive=False, with_comments=True,
+                   compression=0, inclusive_ns_prefixes=None):
+        u"""write_c14n(self, file, exclusive=False, with_comments=True,
+                       compression=0, inclusive_ns_prefixes=None)
+
+        C14N write of document. Always writes UTF-8.
+
+        The ``compression`` option enables GZip compression level 1-9.
+
+        The ``inclusive_ns_prefixes`` should be a list of namespace strings
+        (i.e. ['xs', 'xsi']) that will be promoted to the top-level element
+        during exclusive C14N serialisation.  This parameter is ignored if
+        exclusive mode=False.
+
+        If exclusive=True and no list is provided, a namespace will only be
+        rendered if it is used by the immediate parent or one of its attributes
+        and its prefix and values have not already been rendered by an ancestor
+        of the namespace node's parent element.
+        """
+        self._assertHasRoot()
+        _assertValidNode(self._context_node)
+        # None and negative levels are treated as 0
+        if compression is None or compression < 0:
+            compression = 0
+
+        _tofilelikeC14N(file, self._context_node, exclusive, with_comments,
+                        compression, inclusive_ns_prefixes)
+
+cdef _ElementTree _elementTreeFactory(_Document doc, _Element context_node):
+    # Shortcut for _newElementTree() with the plain _ElementTree class.
+    return _newElementTree(doc, context_node, _ElementTree)
+
+cdef _ElementTree _newElementTree(_Document doc, _Element context_node,
+                                  object baseclass):
+    u"""Instantiate ``baseclass`` and attach a root element or document.
+
+    When no context node is given, the root of ``doc`` is used if there
+    is one.  The document itself is stored on the new tree only when no
+    root element could be determined.
+    """
+    cdef _ElementTree new_tree = baseclass()
+    if context_node is None and doc is not None:
+        context_node = doc.getroot()
+    if context_node is not None:
+        _assertValidNode(context_node)
+    else:
+        _assertValidDoc(doc)
+        new_tree._doc = doc
+    new_tree._context_node = context_node
+    return new_tree
+
+
+@cython.final
+@cython.freelist(16)
+cdef class _Attrib:
+    u"""A dict-like proxy for the ``Element.attrib`` property.
+
+    Every method first checks that the proxied element is still valid
+    and then works directly on that element's attributes.
+    """
+    cdef _Element _element
+    def __cinit__(self, _Element element not None):
+        _assertValidNode(element)
+        self._element = element
+
+    # MANIPULATORS
+    def __setitem__(self, key, value):
+        _assertValidNode(self._element)
+        _setAttributeValue(self._element, key, value)
+
+    def __delitem__(self, key):
+        _assertValidNode(self._element)
+        _delAttribute(self._element, key)
+
+    def update(self, sequence_or_dict):
+        _assertValidNode(self._element)
+        # dicts and other proxies contribute their items; anything else
+        # must already be an iterable of (key, value) pairs
+        if isinstance(sequence_or_dict, (dict, _Attrib)):
+            pairs = sequence_or_dict.items()
+        else:
+            pairs = sequence_or_dict
+        for name, value in pairs:
+            _setAttributeValue(self._element, name, value)
+
+    def pop(self, key, *default):
+        if len(default) > 1:
+            raise TypeError, u"pop expected at most 2 arguments, got %d" % (
+                len(default)+1)
+        _assertValidNode(self._element)
+        found = _getAttributeValue(self._element, key, None)
+        if found is not None:
+            _delAttribute(self._element, key)
+            return found
+        # missing attribute: fall back to the default or fail like a dict
+        if not default:
+            raise KeyError, key
+        return default[0]
+
+    def clear(self):
+        _assertValidNode(self._element)
+        cdef xmlNode* c_element = self._element._c_node
+        # keep removing the head of the property list until it is empty
+        while c_element.properties is not NULL:
+            tree.xmlRemoveProp(c_element.properties)
+
+    # ACCESSORS
+    def __repr__(self):
+        _assertValidNode(self._element)
+        snapshot = dict(_collectAttributes(self._element._c_node, 3))
+        return repr(snapshot)
+
+    def __copy__(self):
+        # copies are plain dicts, detached from the element
+        _assertValidNode(self._element)
+        return dict(_collectAttributes(self._element._c_node, 3))
+
+    def __deepcopy__(self, memo):
+        # same as __copy__; 'memo' is not used
+        _assertValidNode(self._element)
+        return dict(_collectAttributes(self._element._c_node, 3))
+
+    def __getitem__(self, key):
+        _assertValidNode(self._element)
+        found = _getAttributeValue(self._element, key, None)
+        if found is not None:
+            return found
+        raise KeyError, key
+
+    def __bool__(self):
+        _assertValidNode(self._element)
+        cdef xmlAttr* c_attr = self._element._c_node.properties
+        # skip ahead to the first real attribute node, if any
+        while c_attr is not NULL and c_attr.type != tree.XML_ATTRIBUTE_NODE:
+            c_attr = c_attr.next
+        return 1 if c_attr is not NULL else 0
+
+    def __len__(self):
+        _assertValidNode(self._element)
+        cdef xmlAttr* c_attr = self._element._c_node.properties
+        cdef Py_ssize_t count = 0
+        # only entries of attribute node type are counted
+        while c_attr is not NULL:
+            if c_attr.type == tree.XML_ATTRIBUTE_NODE:
+                count += 1
+            c_attr = c_attr.next
+        return count
+
+    def get(self, key, default=None):
+        _assertValidNode(self._element)
+        return _getAttributeValue(self._element, key, default)
+
+    # the last argument of _collectAttributes() selects the result:
+    # 1 for keys(), 2 for values(), 3 for items()
+    def keys(self):
+        _assertValidNode(self._element)
+        return _collectAttributes(self._element._c_node, 1)
+
+    def __iter__(self):
+        _assertValidNode(self._element)
+        return iter(_collectAttributes(self._element._c_node, 1))
+
+    def iterkeys(self):
+        _assertValidNode(self._element)
+        return iter(_collectAttributes(self._element._c_node, 1))
+
+    def values(self):
+        _assertValidNode(self._element)
+        return _collectAttributes(self._element._c_node, 2)
+
+    def itervalues(self):
+        _assertValidNode(self._element)
+        return iter(_collectAttributes(self._element._c_node, 2))
+
+    def items(self):
+        _assertValidNode(self._element)
+        return _collectAttributes(self._element._c_node, 3)
+
+    def iteritems(self):
+        _assertValidNode(self._element)
+        return iter(_collectAttributes(self._element._c_node, 3))
+
+    def has_key(self, key):
+        _assertValidNode(self._element)
+        return key in self
+
+    def __contains__(self, key):
+        _assertValidNode(self._element)
+        cdef xmlNode* c_element
+        href, name = _getNsTag(key)
+        c_element = self._element._c_node
+        # a NULL href is passed for names without a namespace part
+        c_href = <const_xmlChar*>NULL if href is None else _xcstr(href)
+        return 1 if tree.xmlHasNsProp(c_element, _xcstr(name), c_href) else 0
+
+    def __richcmp__(one, other, int op):
+        # compare as dicts; operands that cannot be converted are
+        # reported as not comparable
+        try:
+            if not isinstance(one, dict):
+                one = dict(one)
+            if not isinstance(other, dict):
+                other = dict(other)
+        except (TypeError, ValueError):
+            return NotImplemented
+        return python.PyObject_RichCompare(one, other, op)
+
+
+@cython.final
+@cython.internal
+cdef class _AttribIterator:
+    u"""Attribute iterator - for internal use only!
+    """
+    # XML attributes must not be removed while running!
+    cdef _Element _node
+    cdef xmlAttr* _c_attr
+    cdef int _keysvalues # 1 - keys, 2 - values, 3 - items (key, value)
+    def __iter__(self):
+        return self
+
+    def __next__(self):
+        cdef xmlAttr* c_current
+        cdef int mode
+        if self._node is None:
+            raise StopIteration
+        # skip list entries that are not attribute nodes
+        c_current = self._c_attr
+        while c_current is not NULL and c_current.type != tree.XML_ATTRIBUTE_NODE:
+            c_current = c_current.next
+        if c_current is NULL:
+            # exhausted: drop the element reference
+            self._node = None
+            raise StopIteration
+
+        # remember where to continue before building the result
+        self._c_attr = c_current.next
+        mode = self._keysvalues
+        if mode == 2:
+            return _attributeValue(self._node._c_node, c_current)
+        name = _namespacedName(<xmlNode*>c_current)
+        if mode == 1:
+            return name
+        return (name, _attributeValue(self._node._c_node, c_current))
+
+cdef object _attributeIteratorFactory(_Element element, int keysvalues):
+    u"""Return an iterator over the attributes of ``element``.
+
+    ``keysvalues`` selects the output: 1 - keys, 2 - values, 3 - items.
+    An element without any properties gets the shared empty iterator.
+    """
+    cdef _AttribIterator iterator
+    cdef xmlAttr* c_first = element._c_node.properties
+    if c_first is NULL:
+        return ITER_EMPTY
+    iterator = _AttribIterator()
+    iterator._node = element
+    iterator._c_attr = c_first
+    iterator._keysvalues = keysvalues
+    return iterator
+
+
+cdef public class _ElementTagMatcher [ object LxmlElementTagMatcher,
+                                       type LxmlElementTagMatcherType ]:
+    """
+    Dead but public. :)
+
+    Holds a single tag selection as a node type plus optional C strings
+    for namespace and name.
+    """
+    # result of _getNsTag(); the C strings below are taken from its items
+    # (presumably it is stored to keep them alive -- confirm against _cstr)
+    cdef object _pystrings
+    # node type to match, 0 when the tag is None
+    cdef int _node_type
+    # namespace and name to match; NULL when not set
+    cdef char* _href
+    cdef char* _name
+    cdef _initTagMatch(self, tag):
+        # Translate 'tag' (None, one of the node factories, or a tag
+        # name) into the fields above.
+        self._href = NULL
+        self._name = NULL
+        if tag is None:
+            self._node_type = 0
+        elif tag is Comment:
+            self._node_type = tree.XML_COMMENT_NODE
+        elif tag is ProcessingInstruction:
+            self._node_type = tree.XML_PI_NODE
+        elif tag is Entity:
+            self._node_type = tree.XML_ENTITY_REF_NODE
+        elif tag is Element:
+            self._node_type = tree.XML_ELEMENT_NODE
+        else:
+            # anything else is treated as an element tag name
+            self._node_type = tree.XML_ELEMENT_NODE
+            self._pystrings = _getNsTag(tag)
+            if self._pystrings[0] is not None:
+                self._href = _cstr(self._pystrings[0])
+            self._name = _cstr(self._pystrings[1])
+            # a name of exactly "*" is stored as NULL
+            if self._name[0] == c'*' and self._name[1] == c'\0':
+                self._name = NULL
+
+cdef public class _ElementIterator(_ElementTagMatcher) [
+    object LxmlElementIterator, type LxmlElementIteratorType ]:
+    """
+    Dead but public. :)
+
+    Iterator skeleton: ``_node`` is the element returned by the next
+    ``__next__()`` call and ``_next_element`` is the C function that
+    steps from one node to the following candidate.
+    """
+    # we keep Python references here to control GC
+    cdef _Element _node
+    cdef _node_to_node_function _next_element
+    def __iter__(self):
+        return self
+
+    cdef void _storeNext(self, _Element node):
+        # Advance from 'node' to the next matching node and store its
+        # proxy in self._node (None when the traversal is finished).
+        cdef xmlNode* c_next = self._next_element(node._c_node)
+        if self._node_type != 0:
+            # a selection is active: skip over non-matching candidates
+            while c_next is not NULL and (
+                    <tree.xmlElementType>self._node_type != c_next.type or
+                    not _tagMatches(c_next, <const_xmlChar*>self._href,
+                                    <const_xmlChar*>self._name)):
+                c_next = self._next_element(c_next)
+        if c_next is not NULL:
+            # Python ref:
+            self._node = _elementFactory(node._doc, c_next)
+        else:
+            self._node = None
+
+    def __next__(self):
+        cdef _Element current_node
+        if self._node is None:
+            raise StopIteration
+        # Python ref:
+        current_node = self._node
+        # look up the successor before handing out the current element
+        self._storeNext(current_node)
+        return current_node
+
+@cython.final
+@cython.internal
+cdef class _MultiTagMatcher:
+    """
+    Match an xmlNode against a list of tags.
+    """
+    cdef list _py_tags
+    cdef qname* _cached_tags
+    cdef size_t _tag_count
+    cdef size_t _cached_size
+    cdef _Document _cached_doc
+    cdef int _node_types
+
+    def __cinit__(self, tags):
+        # start from an empty state with no tag cache, then store 'tags'
+        self._cached_tags = NULL
+        self._cached_size = 0
+        self._tag_count = 0
+        self._node_types = 0
+        self._py_tags = []
+        self.initTagMatch(tags)
+
+    def __dealloc__(self):
+        # release the C-level tag cache
+        self._clear()
+
+    cdef bint rejectsAll(self):
+        # true when neither a tag nor a node type is selected
+        return not self._tag_count and not self._node_types
+
+    cdef bint rejectsAllAttributes(self):
+        return not self._tag_count
+
+    cdef bint matchesType(self, int node_type):
+        if node_type == tree.XML_ELEMENT_NODE and self._tag_count:
+            return True
+        return self._node_types & (1 << node_type)
+
+    cdef void _clear(self):
+        cdef size_t i, count
+        count = self._tag_count
+        self._tag_count = 0
+        if self._cached_tags:
+            for i in xrange(count):
+                cpython.ref.Py_XDECREF(self._cached_tags[i].href)
+            cpython.mem.PyMem_Free(self._cached_tags)
+            self._cached_tags = NULL
+
+    cdef initTagMatch(self, tags):
+        self._cached_doc = None
+        del self._py_tags[:]
+        self._clear()
+        if tags is None or tags == ():
+            # no selection in tags argument => match anything
+            self._node_types = (
+                1 << tree.XML_COMMENT_NODE |
+                1 << tree.XML_PI_NODE |
+                1 << tree.XML_ENTITY_REF_NODE |
+                1 << tree.XML_ELEMENT_NODE)
+        else:
+            self._node_types = 0
+            self._storeTags(tags, set())
+
+    cdef _storeTags(self, tag, set seen):
+        if tag is Comment:
+            self._node_types |= 1 << tree.XML_COMMENT_NODE
+        elif tag is ProcessingInstruction:
+            self._node_types |= 1 << tree.XML_PI_NODE
+        elif tag is Entity:
+            self._node_types |= 1 << tree.XML_ENTITY_REF_NODE
+        elif tag is Element:
+            self._node_types |= 1 << tree.XML_ELEMENT_NODE
+        elif python._isString(tag):
+            if tag in seen:
+                return
+            seen.add(tag)
+            if tag in ('*', '{*}*'):
+                self._node_types |= 1 << tree.XML_ELEMENT_NODE
+            else:
+                href, name = _getNsTag(tag)
+                if name == b'*':
+                    name = None
+                if href is None:
+                    href = b''  # no namespace
+                elif href == b'*':
+                    href = None  # wildcard: any namespace, including none
+                self._py_tags.append((href, name))
+        else:
+            # support a sequence of tags
+            for item in tag:
+                self._storeTags(item, seen)
+
+    cdef inline int cacheTags(self, _Document doc, bint force_into_dict=False) except -1:
+        """
+        Look up the tag names in the doc dict to enable string pointer comparisons.
+        """
+        cdef size_t dict_size = tree.xmlDictSize(doc._c_doc.dict)
+        if doc is self._cached_doc and dict_size == self._cached_size:
+            # doc and dict didn't change => names already cached
+            return 0
+        self._tag_count = 0
+        if not self._py_tags:
+            self._cached_doc = doc
+            self._cached_size = dict_size
+            return 0
+        if not self._cached_tags:
+            self._cached_tags = <qname*>cpython.mem.PyMem_Malloc(len(self._py_tags) * sizeof(qname))
+            if not self._cached_tags:
+                self._cached_doc = None
+                raise MemoryError()
+        self._tag_count = <size_t>_mapTagsToQnameMatchArray(
+            doc._c_doc, self._py_tags, self._cached_tags, force_into_dict)
+        self._cached_doc = doc
+        self._cached_size = dict_size
+        return 0
+
+    cdef inline bint matches(self, xmlNode* c_node):
+        cdef qname* c_qname
+        if self._node_types & (1 << c_node.type):
+            return True
+        elif c_node.type == tree.XML_ELEMENT_NODE:
+            for c_qname in self._cached_tags[:self._tag_count]:
+                if _tagMatchesExactly(c_node, c_qname):
+                    return True
+        return False
+
+    cdef inline bint matchesNsTag(self, const_xmlChar* c_href,
+                                  const_xmlChar* c_name):
+        cdef qname* c_qname
+        if self._node_types & (1 << tree.XML_ELEMENT_NODE):
+            return True
+        for c_qname in self._cached_tags[:self._tag_count]:
+            if _nsTagMatchesExactly(c_href, c_name, c_qname):
+                return True
+        return False
+
+    cdef inline bint matchesAttribute(self, xmlAttr* c_attr):
+        """Attribute matches differ from Element matches in that they do
+        not care about node types.
+        """
+        cdef qname* c_qname
+        for c_qname in self._cached_tags[:self._tag_count]:
+            if _tagMatchesExactly(<xmlNode*>c_attr, c_qname):
+                return True
+        return False
+
+cdef class _ElementMatchIterator:
+    # Base class of the tag-filtering iterators below.  Subclasses set
+    # '_next_element' (the traversal step) and the first '_node'.
+    cdef _Element _node
+    cdef _node_to_node_function _next_element
+    cdef _MultiTagMatcher _matcher
+
+    @cython.final
+    cdef _initTagMatcher(self, tags):
+        # build the matcher for the user provided tag selection
+        self._matcher = _MultiTagMatcher(tags)
+
+    def __iter__(self):
+        return self
+
+    @cython.final
+    cdef int _storeNext(self, _Element node) except -1:
+        # Step from 'node' to the next node accepted by the matcher and
+        # remember it in 'self._node' (None when there is none left).
+        cdef xmlNode* c_candidate
+        self._matcher.cacheTags(node._doc)
+        c_candidate = self._next_element(node._c_node)
+        while c_candidate is not NULL:
+            if self._matcher.matches(c_candidate):
+                break
+            c_candidate = self._next_element(c_candidate)
+        # keep a Python reference to the upcoming node so that it stays alive
+        if c_candidate is NULL:
+            self._node = None
+        else:
+            self._node = _elementFactory(node._doc, c_candidate)
+        return 0
+
+    def __next__(self):
+        cdef _Element result = self._node
+        if result is None:
+            raise StopIteration
+        # look ahead before handing out the current node
+        self._storeNext(result)
+        return result
+
+cdef class ElementChildIterator(_ElementMatchIterator):
+    u"""ElementChildIterator(self, node, tag=None, reversed=False)
+    Iterates over the children of an element.
+
+    You can pass the boolean keyword ``reversed`` to iterate backwards.
+    """
+    def __cinit__(self, _Element node not None, tag=None, *, bint reversed=False):
+        cdef xmlNode* c_child
+        _assertValidNode(node)
+        self._initTagMatcher(tag)
+        # select the starting child together with the matching step function
+        if not reversed:
+            c_child = _findChildForwards(node._c_node, 0)
+            self._next_element = _nextElement
+        else:
+            c_child = _findChildBackwards(node._c_node, 0)
+            self._next_element = _previousElement
+        self._matcher.cacheTags(node._doc)
+        # skip ahead to the first child that the matcher accepts
+        while c_child is not NULL:
+            if self._matcher.matches(c_child):
+                break
+            c_child = self._next_element(c_child)
+        # keep a Python reference to the first result so that it stays alive
+        if c_child is NULL:
+            self._node = None
+        else:
+            self._node = _elementFactory(node._doc, c_child)
+
+cdef class SiblingsIterator(_ElementMatchIterator):
+    u"""SiblingsIterator(self, node, tag=None, preceding=False)
+    Iterates over the siblings of an element.
+
+    By default, the siblings that follow the element are returned.  Pass
+    the boolean keyword ``preceding`` to walk in the opposite direction.
+    """
+    def __cinit__(self, _Element node not None, tag=None, *, bint preceding=False):
+        _assertValidNode(node)
+        self._initTagMatcher(tag)
+        # choose the traversal direction
+        if not preceding:
+            self._next_element = _nextElement
+        else:
+            self._next_element = _previousElement
+        # the start node itself is not part of the result
+        self._storeNext(node)
+
+cdef class AncestorsIterator(_ElementMatchIterator):
+    u"""AncestorsIterator(self, node, tag=None)
+    Iterates over the ancestors of an element (from parent to parent).
+
+    The element itself is not included in the result.
+    """
+    def __cinit__(self, _Element node not None, tag=None):
+        _assertValidNode(node)
+        # each step moves one level up in the tree
+        self._next_element = _parentElement
+        self._initTagMatcher(tag)
+        self._storeNext(node)
+
+cdef class ElementDepthFirstIterator:
+    u"""ElementDepthFirstIterator(self, node, tag=None, inclusive=True)
+    Iterates over an element and its sub-elements in document order (depth
+    first pre-order).
+
+    Note that this also includes comments, entities and processing
+    instructions.  To filter them out, check if the ``tag`` property
+    of the returned element is a string (i.e. not None and not a
+    factory function), or pass the ``Element`` factory for the ``tag``
+    argument to receive only Elements.
+
+    If the optional ``tag`` argument is not None, the iterator returns only
+    the elements that match the respective name and namespace.
+
+    The optional boolean argument 'inclusive' defaults to True and can be set
+    to False to exclude the start element itself.
+
+    Note that the behaviour of this iterator is completely undefined if the
+    tree it traverses is modified during iteration.
+    """
+    # we keep Python references here to control GC
+    # keep the next Element after the one we return, and the (s)top node
+    cdef _Element _next_node
+    cdef _Element _top_node
+    cdef _MultiTagMatcher _matcher
+    def __cinit__(self, _Element node not None, tag=None, *, bint inclusive=True):
+        _assertValidNode(node)
+        self._top_node  = node
+        self._next_node = node
+        self._matcher = _MultiTagMatcher(tag)
+        self._matcher.cacheTags(node._doc)
+        # the start node is only the first result if it is requested
+        # ('inclusive') and accepted by the matcher; otherwise, skip it
+        if not inclusive or not self._matcher.matches(node._c_node):
+            # find start node (this cannot raise StopIteration, self._next_node != None)
+            next(self)
+
+    def __iter__(self):
+        return self
+
+    def __next__(self):
+        # Returns the node found by the previous call and looks up its
+        # successor, which is kept as a Python reference in '_next_node'.
+        cdef xmlNode* c_node
+        cdef _Element current_node = self._next_node
+        if current_node is None:
+            raise StopIteration
+        c_node = current_node._c_node
+        # refresh the tag cache on each step (cheap if nothing changed)
+        self._matcher.cacheTags(current_node._doc)
+        if not self._matcher._tag_count:
+            # no tag name was found in the dict => not in document either
+            # try to match by node type
+            c_node = self._nextNodeAnyTag(c_node)
+        else:
+            c_node = self._nextNodeMatchTag(c_node)
+        if c_node is NULL:
+            self._next_node = None
+        else:
+            self._next_node = _elementFactory(current_node._doc, c_node)
+        return current_node
+
+    @cython.final
+    cdef xmlNode* _nextNodeAnyTag(self, xmlNode* c_node):
+        # Find the next node after 'c_node' whose node type is selected in
+        # the matcher's type mask.  Returns NULL if there is none.
+        cdef int node_types = self._matcher._node_types
+        if not node_types:
+            return NULL
+        # NOTE(review): traversal macro defined elsewhere; presumably walks
+        # the subtree below '_top_node' starting after 'c_node' (last
+        # argument 0 = do not visit the start node itself) -- confirm
+        tree.BEGIN_FOR_EACH_ELEMENT_FROM(self._top_node._c_node, c_node, 0)
+        if node_types & (1 << c_node.type):
+            return c_node
+        tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+        return NULL
+
+    @cython.final
+    cdef xmlNode* _nextNodeMatchTag(self, xmlNode* c_node):
+        # Same traversal as _nextNodeAnyTag(), but uses the full matcher
+        # (node types and cached tag names).  Returns NULL if nothing matches.
+        tree.BEGIN_FOR_EACH_ELEMENT_FROM(self._top_node._c_node, c_node, 0)
+        if self._matcher.matches(c_node):
+            return c_node
+        tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+        return NULL
+
+cdef class ElementTextIterator:
+    u"""ElementTextIterator(self, element, tag=None, with_tail=True)
+    Iterates over the text content of a subtree.
+
+    You can pass the ``tag`` keyword argument to restrict text content to a
+    specific tag name.
+
+    You can set the ``with_tail`` keyword argument to ``False`` to skip over
+    tail text (e.g. if you know that it's only whitespace from pretty-printing).
+
+    The tail text of the start element itself is never returned.
+    """
+    cdef object _nextEvent
+    cdef _Element _start_element
+    def __cinit__(self, _Element element not None, tag=None, *, bint with_tail=True):
+        _assertValidNode(element)
+        # "end" events are only needed to collect tail text
+        events = (u"start", u"end") if with_tail else (u"start",)
+        self._start_element = element
+        self._nextEvent = iterwalk(element, events=events, tag=tag).__next__
+
+    def __iter__(self):
+        return self
+
+    def __next__(self):
+        cdef _Element element
+        while True:
+            event, element = self._nextEvent() # raises StopIteration
+            if event == u"start":
+                text = element.text
+            elif element is not self._start_element:
+                text = element.tail
+            else:
+                # "end" of the start element: its tail is outside the subtree
+                continue
+            if text is not None:
+                return text
+
+cdef xmlNode* _createElement(xmlDoc* c_doc, object name_utf) except NULL:
+    # Create a new element node named 'name_utf' (no namespace, no content)
+    # in the context of 'c_doc'.
+    return tree.xmlNewDocNode(c_doc, NULL, _xcstr(name_utf), NULL)
+
+cdef xmlNode* _createComment(xmlDoc* c_doc, const_xmlChar* text):
+    # Create a new comment node with the given text in the context of 'c_doc'.
+    return tree.xmlNewDocComment(c_doc, text)
+
+cdef xmlNode* _createPI(xmlDoc* c_doc, const_xmlChar* target, const_xmlChar* text):
+    # Create a new processing instruction node (target + text) in the
+    # context of 'c_doc'.
+    return tree.xmlNewDocPI(c_doc, target, text)
+
+cdef xmlNode* _createEntity(xmlDoc* c_doc, const_xmlChar* name):
+    # Create a new entity reference node for 'name' in the context of 'c_doc'.
+    return tree.xmlNewReference(c_doc, name)
+
+# module-level API for ElementTree
+
+def Element(_tag, attrib=None, nsmap=None, **_extra):
+    u"""Element(_tag, attrib=None, nsmap=None, **_extra)
+
+    Element factory.  This function returns an object implementing the
+    Element interface.
+
+    Also look at the `_Element.makeelement()` and
+    `_BaseParser.makeelement()` methods, which provide a faster way to
+    create an Element within a specific document or parser context.
+    """
+    # Delegates to _makeElement() without passing any existing document or
+    # parser context (the NULL/None arguments); only the tag, the attributes
+    # ('attrib' plus the '_extra' keyword arguments) and 'nsmap' are passed on.
+    return _makeElement(_tag, NULL, None, None, None, None,
+                        attrib, nsmap, _extra)
+
+def Comment(text=None):
+    u"""Comment(text=None)
+
+    Comment element factory. This factory function creates a special element that will
+    be serialized as an XML comment.
+
+    A missing ``text`` results in an empty comment.
+    """
+    cdef _Document owner_doc
+    cdef xmlNode*  c_comment
+    cdef xmlDoc*   c_new_doc
+    text = b'' if text is None else _utf8(text)
+    # the comment lives in a fresh document of its own
+    c_new_doc = _newXMLDoc()
+    owner_doc = _documentFactory(c_new_doc, None)
+    c_comment = _createComment(c_new_doc, _xcstr(text))
+    tree.xmlAddChild(<xmlNode*>c_new_doc, c_comment)
+    return _elementFactory(owner_doc, c_comment)
+
+def ProcessingInstruction(target, text=None):
+    u"""ProcessingInstruction(target, text=None)
+
+    ProcessingInstruction element factory. This factory function creates a
+    special element that will be serialized as an XML processing instruction.
+
+    A missing ``text`` results in a processing instruction with empty content.
+    """
+    cdef _Document owner_doc
+    cdef xmlNode*  c_pi
+    cdef xmlDoc*   c_new_doc
+    target = _utf8(target)
+    text = b'' if text is None else _utf8(text)
+    # the processing instruction lives in a fresh document of its own
+    c_new_doc = _newXMLDoc()
+    owner_doc = _documentFactory(c_new_doc, None)
+    c_pi = _createPI(c_new_doc, _xcstr(target), _xcstr(text))
+    tree.xmlAddChild(<xmlNode*>c_new_doc, c_pi)
+    return _elementFactory(owner_doc, c_pi)
+
+# short alias for the factory above
+PI = ProcessingInstruction
+
+cdef class CDATA:
+    u"""CDATA(data)
+
+    CDATA factory.  This factory creates an opaque data object that
+    can be used to set Element text.  The usual way to use it is::
+
+        >>> el = Element('content')
+        >>> el.text = CDATA('a string')
+
+        >>> print(el.text)
+        a string
+        >>> print(tostring(el, encoding="unicode"))
+        <content><![CDATA[a string]]></content>
+    """
+    # the wrapped data, converted to a byte string by _utf8()
+    cdef bytes _utf8_data
+    def __cinit__(self, data):
+        # conversion happens once, at construction time
+        self._utf8_data = _utf8(data)
+
+def Entity(name):
+    u"""Entity(name)
+
+    Entity factory.  This factory function creates a special element
+    that will be serialized as an XML entity reference or character
+    reference.  Note, however, that entities will not be automatically
+    declared in the document.  A document that uses entity references
+    requires a DTD to define the entities.
+
+    Raises ValueError if ``name`` is neither a valid character reference
+    (starting with '#') nor a valid XML name.
+    """
+    cdef _Document owner_doc
+    cdef xmlNode*  c_entity
+    cdef xmlDoc*   c_new_doc
+    name_utf = _utf8(name)
+    c_name = _xcstr(name_utf)
+    if c_name[0] == c'#':
+        # character reference: validate the part after the '#'
+        if not _characterReferenceIsValid(c_name + 1):
+            raise ValueError(u"Invalid character reference: '%s'" % name)
+    elif not _xmlNameIsValid(c_name):
+        raise ValueError(u"Invalid entity reference: '%s'" % name)
+    # the entity reference lives in a fresh document of its own
+    c_new_doc = _newXMLDoc()
+    owner_doc = _documentFactory(c_new_doc, None)
+    c_entity = _createEntity(c_new_doc, c_name)
+    tree.xmlAddChild(<xmlNode*>c_new_doc, c_entity)
+    return _elementFactory(owner_doc, c_entity)
+
+def SubElement(_Element _parent not None, _tag,
+               attrib=None, nsmap=None, **_extra):
+    u"""SubElement(_parent, _tag, attrib=None, nsmap=None, **_extra)
+
+    Subelement factory.  This function creates an element instance, and
+    appends it to an existing element.
+    """
+    # all of the work is done by _makeSubElement(); the two None arguments
+    # are optional values that this factory does not provide
+    return _makeSubElement(_parent, _tag, None, None, attrib, nsmap, _extra)
+
+def ElementTree(_Element element=None, *, file=None, _BaseParser parser=None):
+    u"""ElementTree(element=None, file=None, parser=None)
+
+    ElementTree wrapper class.
+
+    If ``element`` is given, the tree wraps the document of that element
+    and ``file`` is ignored.  Otherwise, if ``file`` is given, it is parsed
+    using ``parser``.  If neither is given, a new empty document is created.
+
+    If the parser uses a parser target, the result of the target is
+    returned instead of an ElementTree.
+    """
+    cdef xmlDoc*  c_doc
+    cdef _Document doc
+
+    if element is not None:
+        doc  = element._doc
+    elif file is not None:
+        try:
+            doc = _parseDocument(file, parser, None)
+        except _TargetParserResult as result_container:
+            # the parser target produced its own result object
+            return result_container.result
+    else:
+        c_doc = _newXMLDoc()
+        doc = _documentFactory(c_doc, parser)
+
+    return _elementTreeFactory(doc, element)
+
+def HTML(text, _BaseParser parser=None, *, base_url=None):
+    u"""HTML(text, parser=None, base_url=None)
+
+    Parses an HTML document from a string constant.  Returns the root
+    node (or the result returned by a parser target).  This function
+    can be used to embed "HTML literals" in Python code.
+
+    To override the parser with a different ``HTMLParser`` you can pass it to
+    the ``parser`` keyword argument.  Without it, the current default parser
+    is used if it is an ``HTMLParser``, otherwise the default HTML parser.
+
+    The ``base_url`` keyword argument allows to set the original base URL of
+    the document to support relative Paths when looking up external entities
+    (DTD, XInclude, ...).
+    """
+    cdef _Document parsed_doc
+    if parser is None:
+        parser = __GLOBAL_PARSER_CONTEXT.getDefaultParser()
+        if not isinstance(parser, HTMLParser):
+            # the configured default cannot parse HTML, fall back
+            parser = __DEFAULT_HTML_PARSER
+    try:
+        parsed_doc = _parseMemoryDocument(text, base_url, parser)
+        return parsed_doc.getroot()
+    except _TargetParserResult as target_result:
+        # a parser target provides its own return value
+        return target_result.result
+
+def XML(text, _BaseParser parser=None, *, base_url=None):
+    u"""XML(text, parser=None, base_url=None)
+
+    Parses an XML document or fragment from a string constant.
+    Returns the root node (or the result returned by a parser target).
+    This function can be used to embed "XML literals" in Python code,
+    like in
+
+       >>> root = XML("<root><test/></root>")
+       >>> print(root.tag)
+       root
+
+    To override the parser with a different ``XMLParser`` you can pass it to
+    the ``parser`` keyword argument.  Without it, the current default parser
+    is used if it is an ``XMLParser``, otherwise the default XML parser.
+
+    The ``base_url`` keyword argument allows to set the original base URL of
+    the document to support relative Paths when looking up external entities
+    (DTD, XInclude, ...).
+    """
+    cdef _Document parsed_doc
+    if parser is None:
+        parser = __GLOBAL_PARSER_CONTEXT.getDefaultParser()
+        if not isinstance(parser, XMLParser):
+            # the configured default is not an XML parser, fall back
+            parser = __DEFAULT_XML_PARSER
+    try:
+        parsed_doc = _parseMemoryDocument(text, base_url, parser)
+        return parsed_doc.getroot()
+    except _TargetParserResult as target_result:
+        # a parser target provides its own return value
+        return target_result.result
+
+def fromstring(text, _BaseParser parser=None, *, base_url=None):
+    u"""fromstring(text, parser=None, base_url=None)
+
+    Parses an XML document or fragment from a string.  Returns the
+    root node (or the result returned by a parser target).
+
+    To override the default parser with a different parser you can pass it to
+    the ``parser`` keyword argument.
+
+    The ``base_url`` keyword argument allows to set the original base URL of
+    the document to support relative Paths when looking up external entities
+    (DTD, XInclude, ...).
+    """
+    cdef _Document doc
+    try:
+        # 'parser' is passed on as is (possibly None); selecting a default
+        # parser is left to _parseMemoryDocument()
+        doc = _parseMemoryDocument(text, base_url, parser)
+        return doc.getroot()
+    except _TargetParserResult as result_container:
+        # a parser target provides its own return value
+        return result_container.result
+
+def fromstringlist(strings, _BaseParser parser=None):
+    u"""fromstringlist(strings, parser=None)
+
+    Parses an XML document from a sequence of strings.  Returns the
+    root node (or the result returned by a parser target).
+
+    To override the default parser with a different parser you can pass it to
+    the ``parser`` keyword argument.
+
+    Raises ValueError if a single (byte or unicode) string is passed
+    instead of a sequence of strings.
+    """
+    if isinstance(strings, (bytes, unicode)):
+        raise ValueError("passing a single string into fromstringlist() is not"
+                         " efficient, use fromstring() instead")
+    if parser is None:
+        parser = __GLOBAL_PARSER_CONTEXT.getDefaultParser()
+    # use the feed parser interface: feed() each chunk, close() builds the result
+    feed = parser.feed
+    for data in strings:
+        feed(data)
+    return parser.close()
+
+def iselement(element):
+    u"""iselement(element)
+
+    Checks if an object appears to be a valid element object.
+    """
+    # valid means: an _Element instance that still refers to a C node
+    return isinstance(element, _Element) and (<_Element>element)._c_node is not NULL
+
+def dump(_Element elem not None, *, bint pretty_print=True, with_tail=True):
+    u"""dump(elem, pretty_print=True, with_tail=True)
+
+    Writes an element tree or element structure to sys.stdout. This function
+    should be used for debugging only.
+
+    Without ``pretty_print``, a line break is appended to the output.
+    """
+    # request text output on Python 3, the tostring() default otherwise
+    if python.IS_PYTHON3:
+        output_encoding = u'unicode'
+    else:
+        output_encoding = None
+    serialised = tostring(elem, pretty_print=pretty_print, with_tail=with_tail,
+                          encoding=output_encoding)
+    if not pretty_print:
+        serialised += '\n'
+    sys.stdout.write(serialised)
+
+def tostring(element_or_tree, *, encoding=None, method=u"xml",
+             xml_declaration=None, bint pretty_print=False, bint with_tail=True,
+             standalone=None, doctype=None,
+             bint exclusive=False, bint with_comments=True, inclusive_ns_prefixes=None):
+    u"""tostring(element_or_tree, encoding=None, method="xml",
+                 xml_declaration=None, pretty_print=False, with_tail=True,
+                 standalone=None, doctype=None,
+                 exclusive=False, with_comments=True, inclusive_ns_prefixes=None)
+
+    Serialize an element to an encoded string representation of its XML
+    tree.
+
+    Defaults to ASCII encoding without XML declaration.  This
+    behaviour can be configured with the keyword arguments 'encoding'
+    (string) and 'xml_declaration' (bool).  Note that changing the
+    encoding to a non UTF-8 compatible encoding will enable a
+    declaration by default.
+
+    You can also serialise to a Unicode string without declaration by
+    passing the ``unicode`` function as encoding (or ``str`` in Py3),
+    or the name 'unicode'.  This changes the return value from a byte
+    string to an unencoded unicode string.
+
+    The keyword argument 'pretty_print' (bool) enables formatted XML.
+
+    The keyword argument 'method' selects the output method: 'xml',
+    'html', plain 'text' (text content without tags) or 'c14n'.
+    Default is 'xml'.
+
+    The ``exclusive`` and ``with_comments`` arguments are only used
+    with C14N output, where they request exclusive and uncommented
+    C14N serialisation respectively.
+
+    Passing a boolean value to the ``standalone`` option will output
+    an XML declaration with the corresponding ``standalone`` flag.
+
+    The ``doctype`` option allows passing in a plain string that will
+    be serialised before the XML tree.  Note that passing in non
+    well-formed content here will make the XML output non well-formed.
+    Also, an existing doctype in the document tree will not be removed
+    when serialising an ElementTree instance.
+
+    You can prevent the tail text of the element from being serialised
+    by passing the boolean ``with_tail`` option.  This has no impact
+    on the tail text of children, which will always be serialised.
+
+    Raises ValueError for unsupported option combinations and TypeError
+    if the object is neither an Element nor an ElementTree.
+    """
+    cdef bint write_declaration
+    cdef int is_standalone
+    # C14N serialisation
+    if method == 'c14n':
+        if encoding is not None:
+            raise ValueError("Cannot specify encoding with C14N")
+        if xml_declaration:
+            raise ValueError("Cannot enable XML declaration in C14N")
+        return _tostringC14N(element_or_tree, exclusive, with_comments, inclusive_ns_prefixes)
+    # all other methods always keep comments
+    if not with_comments:
+        raise ValueError("Can only discard comments in C14N serialisation")
+    # decide whether to write an XML declaration
+    if encoding is _unicode or (encoding is not None and encoding.upper() == 'UNICODE'):
+        # unicode output: normalise the encoding marker, never write a declaration
+        if xml_declaration:
+            raise ValueError, \
+                u"Serialisation to unicode must not request an XML declaration"
+        write_declaration = 0
+        encoding = _unicode
+    elif xml_declaration is None:
+        # by default, write an XML declaration only for non-standard encodings
+        write_declaration = encoding is not None and encoding.upper() not in \
+                            (u'ASCII', u'UTF-8', u'UTF8', u'US-ASCII')
+    else:
+        write_declaration = xml_declaration
+    if encoding is None:
+        encoding = u'ASCII'
+    # an explicit 'standalone' value always forces a declaration, even
+    # overriding the decision made above; -1 means "not specified"
+    if standalone is None:
+        is_standalone = -1
+    elif standalone:
+        write_declaration = 1
+        is_standalone = 1
+    else:
+        write_declaration = 1
+        is_standalone = 0
+
+    # the two calls differ only in the node that gets serialised and in the
+    # flag after 'write_declaration' (0 for an element, 1 for a tree)
+    if isinstance(element_or_tree, _Element):
+        return _tostring(<_Element>element_or_tree, encoding, doctype, method,
+                         write_declaration, 0, pretty_print, with_tail,
+                         is_standalone)
+    elif isinstance(element_or_tree, _ElementTree):
+        return _tostring((<_ElementTree>element_or_tree)._context_node,
+                         encoding, doctype, method, write_declaration, 1,
+                         pretty_print, with_tail, is_standalone)
+    else:
+        raise TypeError, u"Type '%s' cannot be serialized." % \
+            python._fqtypename(element_or_tree).decode('utf8')
+
+def tostringlist(element_or_tree, *args, **kwargs):
+    u"""tostringlist(element_or_tree, *args, **kwargs)
+
+    Serialize an element to an encoded string representation of its XML
+    tree, stored in a list of partial strings.
+
+    This is purely for ElementTree 1.3 compatibility.  The result is a
+    single string wrapped in a list.
+    """
+    # all arguments are passed through to tostring() unchanged
+    return [tostring(element_or_tree, *args, **kwargs)]
+
+def tounicode(element_or_tree, *, method=u"xml", bint pretty_print=False,
+              bint with_tail=True, doctype=None):
+    u"""tounicode(element_or_tree, method="xml", pretty_print=False,
+                  with_tail=True, doctype=None)
+
+    Serialize an element to the Python unicode representation of its XML
+    tree.
+
+    :deprecated: use ``tostring(el, encoding='unicode')`` instead.
+
+    Note that the result does not carry an XML encoding declaration and is
+    therefore not necessarily suited for serialization to byte streams without
+    further treatment.
+
+    The boolean keyword argument 'pretty_print' enables formatted XML.
+
+    The keyword argument 'method' selects the output method: 'xml',
+    'html' or plain 'text'.
+
+    You can prevent the tail text of the element from being serialised
+    by passing the boolean ``with_tail`` option.  This has no impact
+    on the tail text of children, which will always be serialised.
+
+    Raises TypeError if the object is neither an Element nor an ElementTree.
+    """
+    # unicode output never writes an XML declaration (0) and leaves the
+    # standalone flag unspecified (-1)
+    if isinstance(element_or_tree, _Element):
+        return _tostring(<_Element>element_or_tree, _unicode, doctype, method,
+                          0, 0, pretty_print, with_tail, -1)
+    elif isinstance(element_or_tree, _ElementTree):
+        return _tostring((<_ElementTree>element_or_tree)._context_node,
+                         _unicode, doctype, method, 0, 1, pretty_print,
+                         with_tail, -1)
+    else:
+        # report the plain type name, exactly like tostring() does
+        raise TypeError, u"Type '%s' cannot be serialized." % \
+            python._fqtypename(element_or_tree).decode('utf8')
+
+def parse(source, _BaseParser parser=None, *, base_url=None):
+    u"""parse(source, parser=None, base_url=None)
+
+    Return an ElementTree object loaded with source elements.  If no parser
+    is provided as second argument, the default parser is used.
+
+    The ``source`` can be any of the following:
+
+    - a file name/path
+    - a file object
+    - a file-like object
+    - a URL using the HTTP or FTP protocol
+
+    To parse from a string, use the ``fromstring()`` function instead.
+
+    Note that it is generally faster to parse from a file path or URL
+    than from an open file object or file-like object.  Transparent
+    decompression from gzip compressed sources is supported (unless
+    explicitly disabled in libxml2).
+
+    The ``base_url`` keyword allows setting a URL for the document
+    when parsing from a file-like object.  This is needed when looking
+    up external entities (DTD, XInclude, ...) with relative paths.
+    """
+    cdef _Document doc
+    try:
+        doc = _parseDocument(source, parser, base_url)
+        # wrap the document without an explicit context element
+        return _elementTreeFactory(doc, None)
+    except _TargetParserResult as result_container:
+        # a parser target provides its own return value instead of a tree
+        return result_container.result
+
+
+################################################################################
+# Include submodules
+
+include "readonlytree.pxi" # Read-only implementation of Element proxies
+include "classlookup.pxi"  # Element class lookup mechanisms
+include "nsclasses.pxi"    # Namespace implementation and registry
+include "docloader.pxi"    # Support for custom document loaders
+include "parser.pxi"       # XML and HTML parsers
+include "saxparser.pxi"    # SAX-like Parser interface and tree builder
+include "parsertarget.pxi" # ET Parser target
+include "serializer.pxi"   # XML output functions
+include "iterparse.pxi"    # incremental XML parsing
+include "xmlid.pxi"        # XMLID and IDDict
+include "xinclude.pxi"     # XInclude
+include "cleanup.pxi"      # Cleanup and recursive element removal functions
+
+
+################################################################################
+# Include submodules for XPath and XSLT
+
+include "extensions.pxi"   # XPath/XSLT extension functions
+include "xpath.pxi"        # XPath evaluation
+include "xslt.pxi"         # XSL transformations
+include "xsltext.pxi"      # XSL extension elements
+
+
+################################################################################
+# Validation
+
+class DocumentInvalid(LxmlError):
+    u"""Validation error.
+
+    Raised by all document validators when their ``assertValid(tree)``
+    method fails.
+    """
+
+cdef class _Validator:
+    u"""Base class for XML validators.
+
+    Validation itself is done by calling the validator object with the
+    tree to validate, which subclasses are expected to support.  Errors
+    are collected in a per-validator error log.
+    """
+    cdef _ErrorLog _error_log
+    def __cinit__(self):
+        self._error_log = _ErrorLog()
+
+    def validate(self, etree):
+        u"""validate(self, etree)
+
+        Validate the document using this schema.
+
+        Returns true if document is valid, false if not.
+        """
+        return self(etree)
+
+    def assertValid(self, etree):
+        u"""assertValid(self, etree)
+
+        Raises `DocumentInvalid` if the document does not comply with the schema.
+        """
+        if not self(etree):
+            raise DocumentInvalid(self._error_log._buildExceptionMessage(
+                    u"Document does not comply with schema"),
+                                  self._error_log)
+
+    def assert_(self, etree):
+        u"""assert_(self, etree)
+
+        Raises `AssertionError` if the document does not comply with the schema.
+        """
+        if not self(etree):
+            raise AssertionError, self._error_log._buildExceptionMessage(
+                u"Document does not comply with schema")
+
+    cpdef _append_log_message(self, int domain, int type, int level, int line,
+                              message, filename):
+        # add a single entry to the error log of this validator
+        self._error_log._receiveGeneric(domain, type, level, line, message,
+                                        filename)
+
+    cpdef _clear_error_log(self):
+        # discard all entries collected so far
+        self._error_log.clear()
+
+    property error_log:
+        u"The log of validation errors and warnings."
+        def __get__(self):
+            assert self._error_log is not None, "Validator not initialised"
+            # hand out a copy, not the internal log object
+            return self._error_log.copy()
+
+include "dtd.pxi"        # DTD
+include "relaxng.pxi"    # RelaxNG
+include "xmlschema.pxi"  # XMLSchema
+include "schematron.pxi" # Schematron (requires libxml2 2.6.21+)
+
+################################################################################
+# Public C API
+
+include "public-api.pxi"
+
+################################################################################
+# Other stuff
+
+include "debug.pxi"
diff --git a/lib/lxml/lxml.objectify.pyx b/lib/lxml/lxml.objectify.pyx
new file mode 100644
index 00000000..ff5f9dc3
--- /dev/null
+++ b/lib/lxml/lxml.objectify.pyx
@@ -0,0 +1,1985 @@
+u"""The ``lxml.objectify`` module implements a Python object API for
+XML.  It is based on `lxml.etree`.
+"""
+
+from __future__ import absolute_import
+
+cimport cython
+
+from lxml.includes.etreepublic cimport _Document, _Element, ElementBase, ElementClassLookup
+from lxml.includes.etreepublic cimport elementFactory, import_lxml__etree, textOf, pyunicode
+from lxml.includes.tree cimport xmlChar, const_xmlChar, _xcstr
+from lxml cimport python
+from lxml.includes cimport tree
+
+cimport lxml.includes.etreepublic as cetree
+cimport libc.string as cstring_h   # not to be confused with stdlib 'string'
+from libc.string cimport const_char
+
+__all__ = [u'BoolElement', u'DataElement', u'E', u'Element', u'ElementMaker',
+           u'FloatElement', u'IntElement', u'LongElement', u'NoneElement',
+           u'NumberElement', u'ObjectPath', u'ObjectifiedDataElement',
+           u'ObjectifiedElement', u'ObjectifyElementClassLookup',
+           u'PYTYPE_ATTRIBUTE', u'PyType', u'StringElement', u'SubElement',
+           u'XML', u'annotate', u'deannotate', u'dump', u'enable_recursive_str',
+           u'fromstring', u'getRegisteredTypes', u'makeparser', u'parse',
+           u'pyannotate', u'pytypename', u'set_default_parser',
+           u'set_pytype_attribute_tag', u'xsiannotate']
+
+cdef object etree
+from lxml import etree
+# initialize C-API of lxml.etree
+import_lxml__etree()
+
+__version__ = etree.__version__
+
+cdef object re
+import re
+
+cdef tuple IGNORABLE_ERRORS = (ValueError, TypeError)  # exception types grouped for use in except clauses
+cdef object is_special_method = re.compile(u'__.*__$').match  # matches names of the form "__xyz__"
+
+cdef object _typename(object t):  # name from python._fqtypename(t), cut down to the part after the last '.'
+    cdef const_char* c_name
+    c_name = python._fqtypename(t)
+    s = cstring_h.strrchr(c_name, c'.')  # position of the last dot, NULL if there is none
+    if s is not NULL:
+        c_name = s + 1  # skip past the dot
+    return pyunicode(<const_xmlChar*>c_name)
+
+# namespace/name for "pytype" hint attribute
+cdef object PYTYPE_NAMESPACE
+cdef bytes PYTYPE_NAMESPACE_UTF8
+cdef const_xmlChar* _PYTYPE_NAMESPACE
+
+cdef object PYTYPE_ATTRIBUTE_NAME
+cdef bytes PYTYPE_ATTRIBUTE_NAME_UTF8
+cdef const_xmlChar* _PYTYPE_ATTRIBUTE_NAME
+
+PYTYPE_ATTRIBUTE = None
+
+cdef unicode TREE_PYTYPE_NAME = u"TREE"
+
+cdef tuple _unicodeAndUtf8(s):  # returns the pair (s, s encoded as UTF-8 bytes)
+    return (s, python.PyUnicode_AsUTF8String(s))
+
+def set_pytype_attribute_tag(attribute_tag=None):
+    u"""set_pytype_attribute_tag(attribute_tag=None)
+
+    Change name and namespace of the XML attribute that holds Python type
+    information.  Do not use this unless you know what you are doing.
+
+    The tag is split into namespace and name by ``cetree.getNsTag()``.
+    Reset to the default by calling without argument (or with None).
+
+    Default: "{http://codespeak.net/lxml/objectify/pytype}pytype"
+    """
+    global PYTYPE_ATTRIBUTE, _PYTYPE_NAMESPACE, _PYTYPE_ATTRIBUTE_NAME
+    global PYTYPE_NAMESPACE, PYTYPE_NAMESPACE_UTF8
+    global PYTYPE_ATTRIBUTE_NAME, PYTYPE_ATTRIBUTE_NAME_UTF8
+    if attribute_tag is None:
+        PYTYPE_NAMESPACE, PYTYPE_NAMESPACE_UTF8 = \
+            _unicodeAndUtf8(u"http://codespeak.net/lxml/objectify/pytype")
+        PYTYPE_ATTRIBUTE_NAME, PYTYPE_ATTRIBUTE_NAME_UTF8 = \
+            _unicodeAndUtf8(u"pytype")
+    else:
+        PYTYPE_NAMESPACE_UTF8, PYTYPE_ATTRIBUTE_NAME_UTF8 = \
+            cetree.getNsTag(attribute_tag)
+        PYTYPE_NAMESPACE = PYTYPE_NAMESPACE_UTF8.decode('utf8')  # NOTE(review): assumes the tag carries a namespace - confirm
+        PYTYPE_ATTRIBUTE_NAME = PYTYPE_ATTRIBUTE_NAME_UTF8.decode('utf8')
+
+    _PYTYPE_NAMESPACE      = PYTYPE_NAMESPACE_UTF8  # C string pointers taken from the module-level bytes objects
+    _PYTYPE_ATTRIBUTE_NAME = PYTYPE_ATTRIBUTE_NAME_UTF8
+    PYTYPE_ATTRIBUTE = cetree.namespacedNameFromNsName(
+        _PYTYPE_NAMESPACE, _PYTYPE_ATTRIBUTE_NAME)
+
+set_pytype_attribute_tag()
+
+
+# namespaces for XML Schema and XML Schema instance: unicode, UTF-8 bytes and C string each
+cdef object XML_SCHEMA_NS, XML_SCHEMA_NS_UTF8
+XML_SCHEMA_NS, XML_SCHEMA_NS_UTF8 = \
+    _unicodeAndUtf8(u"http://www.w3.org/2001/XMLSchema")
+cdef const_xmlChar* _XML_SCHEMA_NS = _xcstr(XML_SCHEMA_NS_UTF8)
+
+cdef object XML_SCHEMA_INSTANCE_NS, XML_SCHEMA_INSTANCE_NS_UTF8
+XML_SCHEMA_INSTANCE_NS, XML_SCHEMA_INSTANCE_NS_UTF8 = \
+    _unicodeAndUtf8(u"http://www.w3.org/2001/XMLSchema-instance")
+cdef const_xmlChar* _XML_SCHEMA_INSTANCE_NS = _xcstr(XML_SCHEMA_INSTANCE_NS_UTF8)
+
+cdef object XML_SCHEMA_INSTANCE_NIL_ATTR = u"{%s}nil" % XML_SCHEMA_INSTANCE_NS  # "{ns}nil" attribute name
+cdef object XML_SCHEMA_INSTANCE_TYPE_ATTR = u"{%s}type" % XML_SCHEMA_INSTANCE_NS  # "{ns}type" attribute name
+
+
+# Forward declaration
+cdef class PyType
+
+################################################################################
+# Element class for the main API
+
+cdef class ObjectifiedElement(ElementBase):
+    u"""Main XML Element class.
+
+    Element children are accessed as object attributes.  Multiple children
+    with the same name are available through a list index.  Example::
+
+       >>> root = XML("<root><c1><c2>0</c2><c2>1</c2></c1></root>")
+       >>> second_c2 = root.c1.c2[1]
+       >>> print(second_c2.text)
+       1
+
+    Note that you cannot (and must not) instantiate this class or its
+    subclasses.
+    """
+    def __iter__(self):
+        u"""Iterate over this element and its siblings that share its tag.
+        """
+        parent_element = self.getparent()
+        if parent_element is not None:
+            return etree.ElementChildIterator(parent_element, tag=self.tag)
+        return iter([self])
+
+    def __str__(self):
+        # recursive dump when __RECURSIVE_STR is set, otherwise the text or u''
+        if not __RECURSIVE_STR:
+            return textOf(self._c_node) or u''
+        return _dump(self, 0)
+
+    # pickle support: serialise with etree.tostring(), rebuild by calling fromstring()
+    def __reduce__(self):
+        return (fromstring, (etree.tostring(self),))
+
+    property text:
+        def __get__(self):  # getter only; __setattr__ rejects assignments to 'text'
+            return textOf(self._c_node)
+
+    property __dict__:
+        u"""A fake implementation for __dict__ to support dir() etc.
+
+        Note that this only considers the first child with a given name.
+        """
+        def __get__(self):
+            cdef _Element child
+            cdef dict children
+            c_ns = tree._getNs(self._c_node)
+            tag = u"{%s}*" % pyunicode(c_ns) if c_ns is not NULL else None  # any name in our own namespace
+            children = {}
+            for child in etree.ElementChildIterator(self, tag=tag):
+                if c_ns is NULL and tree._getNs(child._c_node) is not NULL:
+                    continue  # self has no namespace: skip namespaced children
+                name = pyunicode(child._c_node.name)
+                if python.PyDict_GetItem(children, name) is NULL:
+                    children[name] = child  # keep only the first child of each name
+            return children
+
+    def __len__(self):
+        u"""Count self and siblings with the same tag (see _countSiblings()).
+        """
+        return _countSiblings(self._c_node)
+
+    def countchildren(self):
+        u"""countchildren(self)
+
+        Return the number of children of this element, regardless of their
+        name.
+        """
+        # same algorithm as in etree
+        cdef tree.xmlNode* c_child
+        cdef Py_ssize_t count = 0
+        c_child = self._c_node.children
+        while c_child is not NULL:
+            # only nodes accepted by tree._isElement() are counted
+            if tree._isElement(c_child):
+                count += 1
+            c_child = c_child.next
+        return count
+
+    def getchildren(self):
+        u"""getchildren(self)
+
+        Returns all direct children as a list, in document order.
+        """
+        cdef list children = []
+        cdef tree.xmlNode* c_child = self._c_node.children
+        # wrap every node that tree._isElement() accepts
+        while c_child is not NULL:
+            if tree._isElement(c_child):
+                child = cetree.elementFactory(self._doc, c_child)
+                children.append(child)
+            c_child = c_child.next
+        return children
+
+    def __getattr__(self, tag):
+        u"""Return the (first) child with the given tag name.  If no namespace
+        is provided, the child will be looked up in the same one as self.
+        """
+        if is_special_method(tag):  # names like "__foo__" are never looked up as children
+            return object.__getattr__(self, tag)  # NOTE(review): presumably relied on to raise AttributeError - confirm
+        return _lookupChildOrRaise(self, tag)
+
+    def __setattr__(self, tag, value):
+        u"""Set the value of the (first) child with the given tag name.  If no
+        namespace is provided, the child will be looked up in the same one as
+        self.
+        """
+        cdef _Element element
+        # properties are looked up /after/ __setattr__, so we must emulate them
+        if tag == u'text' or tag == u'pyval':
+            # read-only !
+            raise TypeError, u"attribute '%s' of '%s' objects is not writable" % \
+                            (tag, _typename(self))
+        elif tag == u'tail':
+            cetree.setTailText(self._c_node, value)
+            return
+        elif tag == u'tag':
+            ElementBase.tag.__set__(self, value)  # delegate to the inherited property setter
+            return
+        elif tag == u'base':
+            ElementBase.base.__set__(self, value)  # delegate to the inherited property setter
+            return
+        tag = _buildChildTag(self, tag)  # qualified tag; uses our namespace if none was given
+        element = _lookupChild(self, tag)
+        if element is None:
+            _appendValue(self, tag, value)  # no such child yet: append a new one
+        else:
+            _replaceElement(element, value)  # replace the first matching child
+
+    def __delattr__(self, tag):
+        # the lookup raises AttributeError if there is no such child
+        self.remove(_lookupChildOrRaise(self, tag))
+
+    def addattr(self, tag, value):
+        u"""addattr(self, tag, value)
+
+        Add a child value to the element.
+
+        As opposed to append(), it sets a data value, not an element.
+        """
+        _appendValue(self, _buildChildTag(self, tag), value)  # always appends, even if such a child exists
+
+    def __getitem__(self, key):
+        u"""Return a sibling, counting from the first child of the parent.  The
+        method behaves like both a dict and a sequence.
+
+        * If argument is an integer, returns the sibling at that position.
+
+        * If argument is a string, does the same as getattr().  This can be
+          used to provide namespaces for element lookup, or to look up
+          children with special names (``text`` etc.).
+
+        * If argument is a slice object, returns the matching slice.
+        """
+        cdef tree.xmlNode* c_self_node
+        cdef tree.xmlNode* c_parent
+        cdef tree.xmlNode* c_node
+        cdef Py_ssize_t c_index
+        if python._isString(key):
+            return _lookupChildOrRaise(self, key)
+        elif isinstance(key, slice):
+            return list(self)[key]  # list(self) is built by __iter__: self and same-tag siblings
+        # normal item access
+        c_index = key   # raises TypeError if necessary
+        c_self_node = self._c_node
+        c_parent = c_self_node.parent
+        if c_parent is NULL:  # without a parent, self is the only item
+            if c_index == 0:
+                return self
+            else:
+                raise IndexError, unicode(key)
+        if c_index < 0:
+            c_node = c_parent.last  # negative index: search backwards from the last child
+        else:
+            c_node = c_parent.children  # otherwise search forwards from the first child
+        c_node = _findFollowingSibling(
+            c_node, tree._getNs(c_self_node), c_self_node.name, c_index)
+        if c_node is NULL:
+            raise IndexError, unicode(key)
+        return elementFactory(self._doc, c_node)
+
+    def __setitem__(self, key, value):
+        u"""Set the value of a sibling, counting from the first child of the
+        parent.  Implements key assignment, item assignment and slice
+        assignment.
+
+        * If argument is an integer, sets the sibling at that position.
+
+        * If argument is a string, does the same as setattr().  This is used
+          to provide namespaces for element lookup.
+
+        * If argument is a slice object, assigns the items of ``value`` to
+          the siblings in that slice.
+        """
+        cdef _Element element
+        cdef tree.xmlNode* c_node
+        if python._isString(key):
+            key = _buildChildTag(self, key)
+            element = _lookupChild(self, key)
+            if element is None:
+                _appendValue(self, key, value)
+            else:
+                _replaceElement(element, value)
+            return
+
+        if self._c_node.parent is NULL:
+            # the 'root[i] = ...' case
+            raise TypeError, u"assignment to root element is invalid"
+
+        if isinstance(key, slice):
+            # slice assignment
+            _setSlice(key, self, value)
+        else:
+            # normal index assignment
+            if key < 0:
+                c_node = self._c_node.parent.last  # negative index: search backwards from the end
+            else:
+                c_node = self._c_node.parent.children
+            c_node = _findFollowingSibling(
+                c_node, tree._getNs(self._c_node), self._c_node.name, key)
+            if c_node is NULL:
+                raise IndexError, unicode(key)
+            element = elementFactory(self._doc, c_node)
+            _replaceElement(element, value)
+
+    def __delitem__(self, key):
+        # remove the sibling(s) selected by an index or a slice from the parent
+        parent = self.getparent()
+        if parent is None:
+            raise TypeError, u"deleting items not supported by root element"
+        if not isinstance(key, slice):
+            # normal index deletion
+            parent.remove(self.__getitem__(key))
+            return
+        # slice deletion: take a snapshot of the siblings, then remove them
+        doomed = list(self)[key]
+        remove_child = parent.remove
+        for sibling in doomed:
+            remove_child(sibling)
+
+    def descendantpaths(self, prefix=None):
+        u"""descendantpaths(self, prefix=None)
+
+        Returns a list of object path expressions for all descendants.
+        """
+        if prefix is not None and not python._isString(prefix):
+            prefix = u'.'.join(prefix)  # a non-string prefix is joined with dots
+        return _buildDescendantPaths(self._c_node, prefix)
+
+cdef inline bint _tagMatches(tree.xmlNode* c_node, const_xmlChar* c_href, const_xmlChar* c_name):
+    if c_node.name != c_name:  # compares the pointers, not the string contents
+        return 0
+    if c_href == NULL:  # a NULL namespace matches nodes in any namespace
+        return 1
+    c_node_href = tree._getNs(c_node)
+    if c_node_href == NULL:
+        return c_href[0] == c'\0'  # a node without namespace only matches the empty string
+    return tree.xmlStrcmp(c_node_href, c_href) == 0
+
+cdef Py_ssize_t _countSiblings(tree.xmlNode* c_start_node):
+    cdef tree.xmlNode* c_node
+    cdef Py_ssize_t count
+    c_tag  = c_start_node.name
+    c_href = tree._getNs(c_start_node)
+    count = 1  # the start node itself
+    c_node = c_start_node.next  # first pass: everything after the start node
+    while c_node is not NULL:
+        if c_node.type == tree.XML_ELEMENT_NODE and \
+               _tagMatches(c_node, c_href, c_tag):
+            count += 1
+        c_node = c_node.next
+    c_node = c_start_node.prev  # second pass: everything before the start node
+    while c_node is not NULL:
+        if c_node.type == tree.XML_ELEMENT_NODE and \
+               _tagMatches(c_node, c_href, c_tag):
+            count += 1
+        c_node = c_node.prev
+    return count
+
+cdef tree.xmlNode* _findFollowingSibling(tree.xmlNode* c_node,
+                                         const_xmlChar* href, const_xmlChar* name,
+                                         Py_ssize_t index):
+    cdef tree.xmlNode* (*next)(tree.xmlNode*)  # step function, chosen by the sign of index
+    if index >= 0:
+        next = cetree.nextElement
+    else:
+        index = -1 - index  # -1 -> 0, -2 -> 1, ...: number of matches to skip going backwards
+        next = cetree.previousElement
+    while c_node is not NULL:  # the start node itself is tested first
+        if c_node.type == tree.XML_ELEMENT_NODE and \
+               _tagMatches(c_node, href, name):
+            index = index - 1
+            if index < 0:
+                return c_node
+        c_node = next(c_node)
+    return NULL  # fewer matching nodes than requested
+
+cdef object _lookupChild(_Element parent, tag):
+    cdef tree.xmlNode* c_result
+    cdef tree.xmlNode* c_node
+    c_node = parent._c_node
+    ns, tag = cetree.getNsTagWithEmptyNs(tag)
+    c_tag = tree.xmlDictExists(
+        c_node.doc.dict, _xcstr(tag), python.PyBytes_GET_SIZE(tag))
+    if c_tag is NULL:
+        return None # not in the hash map => not in the tree
+    if ns is None:
+        # either inherit ns from parent or use empty (i.e. no) namespace
+        c_href = tree._getNs(c_node) or <tree.const_xmlChar*>''
+    else:
+        c_href = _xcstr(ns)
+    c_result = _findFollowingSibling(c_node.children, c_href, c_tag, 0)  # first matching child
+    if c_result is NULL:
+        return None  # a missing child is reported as None, not as an exception
+    return elementFactory(parent._doc, c_result)
+
+cdef object _lookupChildOrRaise(_Element parent, tag):
+    # like _lookupChild(), but a missing child raises AttributeError
+    child = _lookupChild(parent, tag)
+    if child is not None:
+        return child
+    raise AttributeError, u"no such child: " + _buildChildTag(parent, tag)
+
+cdef object _buildChildTag(_Element parent, tag):
+    ns, tag = cetree.getNsTag(tag)
+    c_tag = _xcstr(tag)
+    c_href = tree._getNs(parent._c_node) if ns is None else _xcstr(ns)  # no namespace given: use the parent's
+    return cetree.namespacedNameFromNsName(c_href, c_tag)
+
+cdef _replaceElement(_Element element, value):
+    cdef _Element new_element
+    if isinstance(value, _Element):
+        # deep copy the new element
+        new_element = cetree.deepcopyNodeToDocument(
+            element._doc, (<_Element>value)._c_node)
+        new_element.tag = element.tag  # the copy takes over the tag of the element it replaces
+    elif isinstance(value, (list, tuple)):
+        element[:] = value  # slice assignment on the element (see __setitem__)
+        return
+    else:
+        new_element = element.makeelement(element.tag)
+        _setElementValue(new_element, value)
+    element.getparent().replace(element, new_element)
+
+cdef _appendValue(_Element parent, tag, value):
+    cdef _Element new_element
+    if isinstance(value, _Element):
+        # deep copy the new element
+        new_element = cetree.deepcopyNodeToDocument(
+            parent._doc, (<_Element>value)._c_node)
+        new_element.tag = tag  # the copy is renamed to the requested tag
+        cetree.appendChildToElement(parent, new_element)
+    elif isinstance(value, (list, tuple)):
+        for item in value:
+            _appendValue(parent, tag, item)  # one child per item, all with the same tag
+    else:
+        new_element = cetree.makeElement(
+            tag, parent._doc, None, None, None, None, None)
+        _setElementValue(new_element, value)
+        cetree.appendChildToElement(parent, new_element)
+
+cdef _setElementValue(_Element element, value):
+    cdef python.PyObject* _pytype
+    if value is None:
+        cetree.setAttributeValue(
+            element, XML_SCHEMA_INSTANCE_NIL_ATTR, u"true")  # None is marked by the "{xsi}nil" attribute
+    elif isinstance(value, _Element):
+        _replaceElement(element, value)
+        return
+    else:
+        cetree.delAttributeFromNsName(
+            element._c_node, _XML_SCHEMA_INSTANCE_NS, <unsigned char*>"nil")
+        if python._isString(value):
+            pytype_name = u"str"
+            _pytype = python.PyDict_GetItem(_PYTYPE_DICT, pytype_name)
+        else:
+            pytype_name = _typename(value)
+            _pytype = python.PyDict_GetItem(_PYTYPE_DICT, pytype_name)
+            if _pytype is not NULL:
+                value = (<PyType>_pytype).stringify(value)  # registered type: use its own stringify
+            else:
+                value = unicode(value)
+        if _pytype is not NULL:
+            cetree.setAttributeValue(element, PYTYPE_ATTRIBUTE, pytype_name)
+        else:
+            cetree.delAttributeFromNsName(
+                element._c_node, _PYTYPE_NAMESPACE, _PYTYPE_ATTRIBUTE_NAME)
+    cetree.setNodeText(element._c_node, value)  # also reached with value None from the first branch
+
+cdef _setSlice(sliceobject, _Element target, items):
+    cdef _Element parent
+    cdef tree.xmlNode* c_node
+    cdef Py_ssize_t c_step, c_start, pos
+    cdef list new_items
+    # collect existing slice
+    if (<slice>sliceobject).step is None:
+        c_step = 1
+    else:
+        c_step = (<slice>sliceobject).step
+    if c_step == 0:
+        raise ValueError, u"Invalid slice"
+    del_items = target[sliceobject]  # the siblings currently covered by the slice
+
+    # collect new values
+    new_items = []
+    tag = target.tag
+    for item in items:
+        if isinstance(item, _Element):
+            # deep copy the new element
+            new_element = cetree.deepcopyNodeToDocument(
+                target._doc, (<_Element>item)._c_node)
+            new_element.tag = tag
+        else:
+            new_element = cetree.makeElement(
+                tag, target._doc, None, None, None, None, None)
+            _setElementValue(new_element, item)
+        new_items.append(new_element)
+
+    # sanity check - raise what a list would raise
+    if c_step != 1 and \
+            python.PyList_GET_SIZE(del_items) != python.PyList_GET_SIZE(new_items):
+        raise ValueError, \
+            u"attempt to assign sequence of size %d to extended slice of size %d" % (
+            python.PyList_GET_SIZE(new_items),
+            python.PyList_GET_SIZE(del_items))
+
+    # replace existing items
+    pos = 0
+    parent = target.getparent()
+    replace = parent.replace
+    while pos < python.PyList_GET_SIZE(new_items) and \
+            pos < python.PyList_GET_SIZE(del_items):
+        replace(del_items[pos], new_items[pos])
+        pos += 1
+    # remove leftover items
+    if pos < python.PyList_GET_SIZE(del_items):
+        remove = parent.remove
+        while pos < python.PyList_GET_SIZE(del_items):
+            remove(del_items[pos])
+            pos += 1
+    # append remaining new items
+    if pos < python.PyList_GET_SIZE(new_items):
+        # the sanity check above guarantees (step == 1)
+        if pos > 0:
+            item = new_items[pos-1]  # continue right after the last replaced item
+        else:
+            if (<slice>sliceobject).start > 0:  # NOTE(review): start may be None here (e.g. slice [:0]) - confirm
+                c_node = parent._c_node.children
+            else:
+                c_node = parent._c_node.last
+            c_node = _findFollowingSibling(
+                c_node, tree._getNs(target._c_node), target._c_node.name,
+                (<slice>sliceobject).start - 1)
+            if c_node is NULL:
+                while pos < python.PyList_GET_SIZE(new_items):
+                    cetree.appendChildToElement(parent, new_items[pos])
+                    pos += 1
+                return
+            item = cetree.elementFactory(parent._doc, c_node)
+        while pos < python.PyList_GET_SIZE(new_items):
+            add = item.addnext  # each new item goes directly after the previous one
+            item = new_items[pos]
+            add(item)
+            pos += 1
+
+################################################################################
+# Data type support in subclasses
+
+cdef class ObjectifiedDataElement(ObjectifiedElement):
+    u"""This is the base class for all data type Elements.  Subclasses should
+    override the 'pyval' property and possibly the __str__ method.
+    """
+    property pyval:
+        def __get__(self):
+            return textOf(self._c_node)  # the unparsed text, as returned by textOf()
+
+    def __str__(self):
+        return textOf(self._c_node) or u''
+
+    def __repr__(self):
+        return textOf(self._c_node) or u''  # same result as __str__ in this base class
+
+    def _setText(self, s):
+        u"""For use in subclasses only. Don't use unless you know what you are
+        doing.
+        """
+        cetree.setNodeText(self._c_node, s)
+
+cdef class NumberElement(ObjectifiedDataElement):
+    cdef object _parse_value  # callable applied to the element text by _parseNumber()
+    def _setValueParser(self, function):
+        u"""Set the function that parses the Python value from a string.
+
+        Do not use this unless you know what you are doing.
+        """
+        self._parse_value = function
+
+    property pyval:
+        def __get__(self):
+            return _parseNumber(self)
+
+    def __int__(self):
+        return int(_parseNumber(self))
+
+    def __long__(self):
+        return long(_parseNumber(self))
+
+    def __float__(self):
+        return float(_parseNumber(self))
+
+    def __complex__(self):
+        return complex(_parseNumber(self))
+
+    def __str__(self):
+        return unicode(_parseNumber(self))
+
+    def __repr__(self):
+        return repr(_parseNumber(self))
+
+    def __oct__(self):
+        return oct(_parseNumber(self))
+
+    def __hex__(self):
+        return hex(_parseNumber(self))
+
+    def __richcmp__(self, other, int op):
+        return _richcmpPyvals(self, other, op)
+
+    def __hash__(self):
+        return hash(_parseNumber(self))
+
+    def __add__(self, other):  # the operators below unwrap both operands via _numericValueOf()
+        return _numericValueOf(self) + _numericValueOf(other)
+
+    def __sub__(self, other):
+        return _numericValueOf(self) - _numericValueOf(other)
+
+    def __mul__(self, other):
+        return _numericValueOf(self) * _numericValueOf(other)
+
+    def __div__(self, other):
+        return _numericValueOf(self) / _numericValueOf(other)
+
+    def __truediv__(self, other):
+        return _numericValueOf(self) / _numericValueOf(other)
+
+    def __mod__(self, other):
+        return _numericValueOf(self) % _numericValueOf(other)
+
+    def __pow__(self, other, modulo):
+        if modulo is None:
+            return _numericValueOf(self) ** _numericValueOf(other)
+        else:
+            return pow(_numericValueOf(self), _numericValueOf(other), modulo)  # modulo is passed on as given
+
+    def __neg__(self):
+        return - _numericValueOf(self)
+
+    def __pos__(self):
+        return + _numericValueOf(self)
+
+    def __abs__(self):
+        return abs( _numericValueOf(self) )
+
+    def __nonzero__(self):
+        return bool(_numericValueOf(self))
+
+    def __invert__(self):
+        return ~ _numericValueOf(self)
+
+    def __lshift__(self, other):
+        return _numericValueOf(self) << _numericValueOf(other)
+
+    def __rshift__(self, other):
+        return _numericValueOf(self) >> _numericValueOf(other)
+
+    def __and__(self, other):
+        return _numericValueOf(self) & _numericValueOf(other)
+
+    def __or__(self, other):
+        return _numericValueOf(self) | _numericValueOf(other)
+
+    def __xor__(self, other):
+        return _numericValueOf(self) ^ _numericValueOf(other)
+
+cdef class IntElement(NumberElement):  # number element whose text is parsed with int()
+    def _init(self):
+        self._parse_value = int
+
+cdef class LongElement(NumberElement):  # number element whose text is parsed with long()
+    def _init(self):
+        self._parse_value = long
+
+cdef class FloatElement(NumberElement):  # number element whose text is parsed with float()
+    def _init(self):
+        self._parse_value = float
+
+cdef class StringElement(ObjectifiedDataElement):
+    u"""String data class.
+
+    Note that this class does *not* support the sequence protocol of strings:
+    len(), iter(), str_attr[0], str_attr[0:1], etc. are *not* supported.
+    Instead, use the .text attribute to get a 'real' string.
+    """
+    property pyval:
+        def __get__(self):
+            return textOf(self._c_node) or u''  # never None, unlike the base class pyval
+
+    def __repr__(self):
+        return repr(textOf(self._c_node) or u'')
+
+    def strlen(self):
+        text = textOf(self._c_node)
+        if text is None:
+            return 0  # no text counts as length zero
+        else:
+            return len(text)
+
+    def __nonzero__(self):
+        return bool(textOf(self._c_node))
+
+    def __richcmp__(self, other, int op):
+        return _richcmpPyvals(self, other, op)
+
+    def __hash__(self):
+        return hash(textOf(self._c_node) or u'')
+
+    def __add__(self, other):
+        text  = _strValueOf(self)
+        other = _strValueOf(other)
+        if text is None:
+            return other
+        if other is None:
+            return text
+        return text + other
+
+    def __mul__(self, other):
+        if isinstance(self, StringElement):  # either operand may be the StringElement
+            return textOf((<StringElement>self)._c_node) * _numericValueOf(other)
+        elif isinstance(other, StringElement):
+            return _numericValueOf(self) * textOf((<StringElement>other)._c_node)
+        else:
+            raise TypeError, u"invalid types for * operator"
+
+    def __mod__(self, other):
+        return _strValueOf(self) % other  # %-formatting with the text as the format string
+
+    def __int__(self):
+        return int(textOf(self._c_node))
+
+    def __long__(self):
+        return long(textOf(self._c_node))
+
+    def __float__(self):
+        return float(textOf(self._c_node))
+
+    def __complex__(self):
+        return complex(textOf(self._c_node))
+
+cdef class NoneElement(ObjectifiedDataElement):  # data element that behaves like None
+    def __str__(self):
+        return u"None"
+
+    def __repr__(self):
+        return u"None"
+
+    def __nonzero__(self):
+        return False
+
+    def __richcmp__(self, other, int op):
+        if other is None or self is None:
+            return python.PyObject_RichCompare(None, None, op)
+        if isinstance(self, NoneElement):  # compare None in place of whichever operand is the element
+            return python.PyObject_RichCompare(None, other, op)
+        else:
+            return python.PyObject_RichCompare(self, None, op)
+
+    def __hash__(self):
+        return hash(None)
+
+    property pyval:
+        def __get__(self):
+            return None
+
+cdef class BoolElement(IntElement):
+    u"""Boolean type based on string values: 'true' or 'false'.
+
+    Note that this inherits from IntElement to mimic the behaviour of
+    Python's bool type.
+    """
+    def _init(self):
+        self._parse_value = __parseBool
+
+    def __nonzero__(self):
+        return __parseBool(textOf(self._c_node))
+
+    def __richcmp__(self, other, int op):
+        return _richcmpPyvals(self, other, op)
+
+    def __hash__(self):
+        return hash(__parseBool(textOf(self._c_node)))
+
+    def __str__(self):
+        return unicode(__parseBool(textOf(self._c_node)))
+
+    def __repr__(self):
+        return repr(__parseBool(textOf(self._c_node)))
+
+    property pyval:
+        def __get__(self):
+            return __parseBool(textOf(self._c_node))  # __parseBool() also accepts '0' and '1'
+
+def __checkBool(s):
+    # raises ValueError unless s is one of the accepted boolean literals
+    if s is None:
+        raise ValueError
+    if __parseBoolAsInt(s) == -1:
+        raise ValueError
+
+cpdef bint __parseBool(s) except -1:
+    cdef int value
+    if s is None:
+        return False  # None is treated as False
+    value = __parseBoolAsInt(s)
+    if value == -1:  # -1 means: not one of the known literals
+        raise ValueError, u"Invalid boolean value: '%s'" % s
+    return value
+
+cdef inline int __parseBoolAsInt(text) except -2:
+    # Result codes:
+    #    0 - 'false' or '0'
+    #    1 - 'true' or '1'
+    #   -1 - not a boolean literal
+    if text == 'false' or text == '0':
+        return 0
+    if text == 'true' or text == '1':
+        return 1
+    return -1
+
+cdef object _parseNumber(NumberElement element):  # applies the element's parser to its text
+    return element._parse_value(textOf(element._c_node))
+
+cdef object _strValueOf(obj):
+    if python._isString(obj):
+        return obj  # strings pass through unchanged
+    if isinstance(obj, _Element):
+        return textOf((<_Element>obj)._c_node) or u''  # elements: their text, u'' if there is none
+    if obj is None:
+        return u''
+    return unicode(obj)
+
+cdef object _numericValueOf(obj):
+    # unwrap elements to their Python value; any other object passes through
+    if isinstance(obj, NumberElement):
+        return _parseNumber(<NumberElement>obj)
+    try:
+        # not always numeric, but Python will raise the right exception
+        return obj.pyval
+    except AttributeError:
+        return obj
+
+cdef _richcmpPyvals(left, right, int op):  # compares by .pyval where an operand has one
+    left  = getattr(left,  'pyval', left)
+    right = getattr(right, 'pyval', right)
+    return python.PyObject_RichCompare(left, right, op)
+
+
+################################################################################
+# Python type registry
+
+cdef class PyType:
+    u"""PyType(self, name, type_check, type_class, stringify=None)
+    User defined type.
+
+    Named type that contains a type check function and a type class that
+    inherits from ObjectifiedDataElement.  The type check must take a string
+    as argument and raise ValueError or TypeError if it cannot handle the
+    string value.  It may be None in which case it is not considered for type
+    guessing.
+
+    Example::
+
+        PyType('int', int, MyIntClass).register()
+
+    Note that the order in which types are registered matters.  The first
+    matching type will be used.
+    """
+    cdef readonly object name
+    cdef readonly object type_check
+    cdef readonly object stringify
+    cdef object _type
+    cdef list _schema_types
+    def __init__(self, name, type_check, type_class, stringify=None):
+        # validate the arguments first, then store them
+        if isinstance(name, bytes):
+            name = (<bytes>name).decode('ascii')
+        elif not isinstance(name, unicode):
+            raise TypeError, u"Type name must be a string"
+        if type_check is not None and not callable(type_check):
+            raise TypeError, u"Type check function must be callable (or None)"
+        # only the tree type may use a class that is not a data element class
+        if name != TREE_PYTYPE_NAME and \
+               not issubclass(type_class, ObjectifiedDataElement):
+            raise TypeError, \
+                u"Data classes must inherit from ObjectifiedDataElement"
+        self.name  = name
+        self._type = type_class
+        self.type_check = type_check
+        self.stringify = unicode if stringify is None else stringify
+        self._schema_types = []
+
+    def __repr__(self):  # shows the type name and the name of the element class
+        return u"PyType(%s, %s)" % (self.name, self._type.__name__)
+
+    def register(self, before=None, after=None):
+        u"""register(self, before=None, after=None)
+
+        Register the type.
+
+        The keyword arguments 'before' and 'after' accept a sequence of type
+        names.  The new type is placed before the types named in 'before' and
+        after those named in 'after' in the type list.  Unknown names are
+        ignored.  Raises ValueError if the dependencies cannot be fulfilled.
+        """
+        if self.name == TREE_PYTYPE_NAME:
+            raise ValueError, u"Cannot register tree type"
+        if self.type_check is not None:
+            for item in _TYPE_CHECKS:
+                if item[0] is self.type_check:
+                    _TYPE_CHECKS.remove(item)  # drop an existing entry with the same check function
+                    break
+            entry = (self.type_check, self)
+            first_pos = 0  # lowest allowed insert position (just past the last 'after' type)
+            last_pos = -1  # position of the first 'before' type, -1 if there is none
+            if before or after:
+                if before is None:
+                    before = ()
+                elif after is None:
+                    after = ()
+                for i, (check, pytype) in enumerate(_TYPE_CHECKS):
+                    if last_pos == -1 and pytype.name in before:
+                        last_pos = i
+                    if pytype.name in after:
+                        first_pos = i+1
+            if last_pos == -1:
+                _TYPE_CHECKS.append(entry)  # no 'before' constraint found: add at the end
+            elif first_pos > last_pos:
+                raise ValueError, u"inconsistent before/after dependencies"
+            else:
+                _TYPE_CHECKS.insert(last_pos, entry)
+
+        _PYTYPE_DICT[self.name] = self  # done even when there is no type check function
+        for xs_type in self._schema_types:
+            _SCHEMA_TYPE_DICT[xs_type] = self
+
+    def unregister(self):
+        u"unregister(self)"
+        if _PYTYPE_DICT.get(self.name) is self:
+            del _PYTYPE_DICT[self.name]
+        for xs_type, pytype in list(_SCHEMA_TYPE_DICT.items()):
+            if pytype is self:
+                del _SCHEMA_TYPE_DICT[xs_type]
+        if self.type_check is None:
+            return
+        try:
+            _TYPE_CHECKS.remove( (self.type_check, self) )
+        except ValueError:
+            pass
+
+    property xmlSchemaTypes:
+        u"""The list of XML Schema datatypes this Python type maps to.
+
+        Note that this must be set before registering the type!
+        """
+        def __get__(self):
+            return self._schema_types
+        def __set__(self, types):
+            self._schema_types = list(map(unicode, types))
+
+
+# type name => registered PyType
+cdef dict _PYTYPE_DICT = {}
+# XML Schema type name => registered PyType
+cdef dict _SCHEMA_TYPE_DICT = {}
+# ordered list of (type_check, PyType) tuples used for type guessing
+cdef list _TYPE_CHECKS = []
+
+def __lower_bool(b):
+    # lower-case text form of a truth value ("true" / "false")
+    if b:
+        return u"true"
+    return u"false"
+
+cdef _pytypename(obj):
+    # every string object maps to the "str" type name, anything else to
+    # the name reported by _typename()
+    if python._isString(obj):
+        return u"str"
+    return _typename(obj)
+
+def pytypename(obj):
+    u"""pytypename(obj)
+
+    Find the name of the corresponding PyType for a Python object.
+
+    String objects are reported as 'str'.
+    """
+    return _pytypename(obj)
+
+cdef _registerPyTypes():
+    # Register the built-in types.  The entries are registered top to bottom;
+    # for types with a check function this is also the order in which the
+    # checks end up in the type check list.
+    # Each entry: (name, type_check, type_class, stringify, XML Schema types)
+    builtin_specs = (
+        (u'int', int, IntElement, None,
+         (u"integer", u"int", u"short", u"byte", u"unsignedShort",
+          u"unsignedByte", u"nonPositiveInteger",
+          u"negativeInteger", u"long", u"nonNegativeInteger",
+          u"unsignedLong", u"unsignedInt", u"positiveInteger",)),
+        # 'long' type just for backwards compatibility
+        (u'long', None, IntElement, None, None),
+        (u'float', float, FloatElement, None,
+         (u"double", u"float")),
+        (u'bool', __checkBool, BoolElement, __lower_bool,
+         (u"boolean",)),
+        (u'str', None, StringElement, None,
+         (u"string", u"normalizedString", u"token", u"language",
+          u"Name", u"NCName", u"ID", u"IDREF", u"ENTITY",
+          u"NMTOKEN", )),
+        # since lxml 2.0
+        (u'NoneType', None, NoneElement, None, None),
+        # backwards compatibility
+        (u'none', None, NoneElement, None, None),
+    )
+    for type_name, check, element_class, to_text, schema_names in builtin_specs:
+        pytype = PyType(type_name, check, element_class, to_text)
+        if schema_names is not None:
+            pytype.xmlSchemaTypes = schema_names
+        pytype.register()
+
+# non-registered PyType for inner tree elements
+# kept outside the registries: register() refuses the tree type name
+cdef PyType TREE_PYTYPE = PyType(TREE_PYTYPE_NAME, None, ObjectifiedElement)
+
+# fill the type registries with the built-in types when the module is loaded
+_registerPyTypes()
+
+def getRegisteredTypes():
+    u"""getRegisteredTypes()
+
+    Returns a list of the currently registered PyType objects.
+
+    To add a new type, retrieve this list and call unregister() for all
+    entries.  Then add the new type at a suitable position (possibly replacing
+    an existing one) and call register() for all entries.
+
+    This is necessary if the new type interferes with the type check functions
+    of existing ones (normally only int/float/bool) and must be tried before
+    other types.  To add a type that is not yet parsable by the current type
+    check functions, you can simply register() it, which will append it to the
+    end of the type list.
+    """
+    cdef list types = []
+    cdef set known = set()
+    # types that take part in type guessing come first, in lookup order,
+    # followed by all other registered types; each name is reported once
+    candidates = [entry[1] for entry in _TYPE_CHECKS]
+    candidates.extend(_PYTYPE_DICT.values())
+    for pytype in candidates:
+        if pytype.name in known:
+            continue
+        known.add(pytype.name)
+        types.append(pytype)
+    return types
+
+cdef PyType _guessPyType(value, PyType defaulttype):
+    # Return the first registered PyType whose check accepts 'value',
+    # 'defaulttype' if none does, and None for a None value.
+    if value is None:
+        return None
+    for check, candidate in _TYPE_CHECKS:
+        try:
+            check(value)
+        except IGNORABLE_ERRORS:
+            # could not be parsed as the specified type => try the next one
+            continue
+        return <PyType>candidate
+    return defaulttype
+
+cdef object _guessElementClass(tree.xmlNode* c_node):
+    # Choose an element class from the text content of the node: None for
+    # missing text, StringElement for empty text, otherwise the class of the
+    # first registered type whose check accepts the text (None if no match).
+    text = textOf(c_node)
+    if text is None:
+        return None
+    if text == '':
+        return StringElement
+
+    for check, candidate in _TYPE_CHECKS:
+        try:
+            check(text)
+        except IGNORABLE_ERRORS:
+            continue
+        return (<PyType>candidate)._type
+    return None
+
+################################################################################
+# adapted ElementMaker supports registered PyTypes
+
+@cython.final
+@cython.internal
+cdef class _ObjectifyElementMakerCaller:
+    # Callable that builds one element for a fixed tag.  Instances are
+    # created and configured by ElementMaker._build_element_maker().
+    cdef object _tag
+    cdef object _nsmap
+    # optional user provided element factory, None for the default one
+    cdef object _element_factory
+    # whether to add a pytype attribute to elements without children
+    cdef bint _annotate
+
+    def __call__(self, *children, **attrib):
+        u"""__call__(self, *children, **attrib)
+
+        Build the element.  Keyword arguments become attributes.  Each
+        positional argument is handled according to its type: None, string,
+        Element, element maker, dict of attributes, or any other value that
+        is converted to text.
+        """
+        cdef _ObjectifyElementMakerCaller elementMaker
+        cdef _Element element
+        cdef _Element childElement
+        cdef bint has_children
+        cdef bint has_string_value
+        if self._element_factory is None:
+            element = _makeElement(self._tag, None, attrib, self._nsmap)
+        else:
+            element = self._element_factory(self._tag, attrib, self._nsmap)
+
+        # name of the type of the last non-string data value that was added
+        pytype_name = None
+        has_children = 0
+        has_string_value = 0
+        for child in children:
+            if child is None:
+                # a single None argument marks the element as xsi:nil,
+                # None among other arguments is skipped
+                if python.PyTuple_GET_SIZE(children) == 1:
+                    cetree.setAttributeValue(
+                        element, XML_SCHEMA_INSTANCE_NIL_ATTR, u"true")
+            elif python._isString(child):
+                _add_text(element, child)
+                has_string_value = 1
+            elif isinstance(child, _Element):
+                cetree.appendChildToElement(element, <_Element>child)
+                has_children = 1
+            elif isinstance(child, _ObjectifyElementMakerCaller):
+                # an element maker that was passed without being called
+                # (e.g. 'M.br') creates an empty child element
+                elementMaker = <_ObjectifyElementMakerCaller>child
+                if elementMaker._element_factory is None:
+                    cetree.makeSubElement(element, elementMaker._tag,
+                                          None, None, None, None)
+                else:
+                    childElement = elementMaker._element_factory(
+                        elementMaker._tag)
+                    cetree.appendChildToElement(element, childElement)
+                has_children = 1
+            elif isinstance(child, dict):
+                # a dict provides additional attributes
+                for name, value in child.items():
+                    # keyword arguments in attrib take precedence
+                    if name in attrib:
+                        continue
+                    pytype = _PYTYPE_DICT.get(_typename(value))
+                    if pytype is not None:
+                        value = (<PyType>pytype).stringify(value)
+                    elif not python._isString(value):
+                        value = unicode(value)
+                    cetree.setAttributeValue(element, name, value)
+            else:
+                # any other value is added as text
+                if pytype_name is not None:
+                    # concatenation always makes the result a string
+                    has_string_value = 1
+                pytype_name = _typename(child)
+                pytype = _PYTYPE_DICT.get(_typename(child))
+                if pytype is not None:
+                    _add_text(element, (<PyType>pytype).stringify(child))
+                else:
+                    # no registered type for this value => plain string
+                    has_string_value = 1
+                    child = unicode(child)
+                    _add_text(element, child)
+
+        # only elements without children get a pytype annotation
+        if self._annotate and not has_children:
+            if has_string_value:
+                cetree.setAttributeValue(element, PYTYPE_ATTRIBUTE, u"str")
+            elif pytype_name is not None:
+                cetree.setAttributeValue(element, PYTYPE_ATTRIBUTE, pytype_name)
+
+        return element
+
+cdef _add_text(_Element elem, text):
+    # Append 'text' to the tree under construction: to the tail of the child
+    # found by searching backwards, or to the text of 'elem' itself if there
+    # is no child.  Existing text is kept and extended.
+    cdef tree.xmlNode* c_last
+    c_last = cetree.findChildBackwards(elem._c_node, 0)
+    if c_last is NULL:
+        existing = cetree.textOf(elem._c_node)
+        if existing is not None:
+            text = existing + text
+        cetree.setNodeText(elem._c_node, text)
+        return
+    existing = cetree.tailOf(c_last)
+    if existing is not None:
+        text = existing + text
+    cetree.setTailText(c_last, text)
+
+cdef class ElementMaker:
+    u"""ElementMaker(self, namespace=None, nsmap=None, annotate=True, makeelement=None)
+
+    An ElementMaker that can be used for constructing trees.
+
+    Example::
+
+      >>> M = ElementMaker(annotate=False)
+      >>> attributes = {'class': 'par'}
+      >>> html = M.html( M.body( M.p('hello', attributes, M.br, 'objectify', style="font-weight: bold") ) )
+
+      >>> from lxml.etree import tostring
+      >>> print(tostring(html, method='html').decode('ascii'))
+      <html><body><p style="font-weight: bold" class="par">hello<br>objectify</p></body></html>
+
+    To create tags that are not valid Python identifiers, call the factory
+    directly and pass the tag name as first argument::
+
+      >>> root = M('tricky-tag', 'some text')
+      >>> print(root.tag)
+      tricky-tag
+      >>> print(root.text)
+      some text
+
+    All constructor arguments are keyword-only:
+
+    - ``namespace``: namespace URI that is prepended (as ``{uri}``) to tags
+      that do not already start with ``{``
+    - ``nsmap``: prefix mapping for new elements; if not given, the module
+      default mapping is used when ``annotate`` is true, an empty one
+      otherwise
+    - ``annotate``: whether to add pytype annotations to the elements
+    - ``makeelement``: optional callable that replaces the default element
+      factory; it is called as ``makeelement(tag, attrib, nsmap)`` for the
+      element itself and as ``makeelement(tag)`` for empty child elements
+
+    Note that this module has a predefined ElementMaker instance called ``E``.
+    """
+    cdef object _makeelement
+    cdef object _namespace
+    cdef object _nsmap
+    cdef bint _annotate
+    # tag name => element maker, cleared when it grows beyond 200 entries
+    cdef dict _cache
+    def __init__(self, *, namespace=None, nsmap=None, annotate=True,
+                 makeelement=None):
+        if nsmap is None:
+            nsmap = _DEFAULT_NSMAP if annotate else {}
+        self._nsmap = nsmap
+        self._namespace = None if namespace is None else u"{%s}" % namespace
+        self._annotate = annotate
+        if makeelement is not None:
+            assert callable(makeelement)
+            self._makeelement = makeelement
+        else:
+            self._makeelement = None
+        self._cache = {}
+
+    @cython.final
+    cdef _build_element_maker(self, tag):
+        # create, configure and cache the element maker for 'tag'
+        cdef _ObjectifyElementMakerCaller element_maker
+        element_maker = _ObjectifyElementMakerCaller.__new__(_ObjectifyElementMakerCaller)
+        if self._namespace is not None and tag[0] != u"{":
+            element_maker._tag = self._namespace + tag
+        else:
+            element_maker._tag = tag
+        element_maker._nsmap = self._nsmap
+        element_maker._annotate = self._annotate
+        element_maker._element_factory = self._makeelement
+        # keep the cache from growing without bounds
+        if len(self._cache) > 200:
+            self._cache.clear()
+        self._cache[tag] = element_maker
+        return element_maker
+
+    def __getattr__(self, tag):
+        element_maker = self._cache.get(tag, None)
+        if element_maker is None:
+            if is_special_method(tag):
+                # Names rejected by is_special_method() must not become
+                # element makers.  'object' has no __getattr__ to delegate
+                # to, so raise the AttributeError explicitly instead of
+                # triggering one with a misleading message.
+                raise AttributeError, tag
+            return self._build_element_maker(tag)
+        return element_maker
+
+    def __call__(self, tag, *args, **kwargs):
+        element_maker = self._cache.get(tag, None)
+        if element_maker is None:
+            element_maker = self._build_element_maker(tag)
+        return element_maker(*args, **kwargs)
+
+################################################################################
+# Recursive element dumping
+
+# module-wide switch that is set by enable_recursive_str()
+cdef bint __RECURSIVE_STR = 0 # default: off
+
+def enable_recursive_str(on=True):
+    u"""enable_recursive_str(on=True)
+
+    Enable a recursively generated tree representation for str(element),
+    based on objectify.dump(element).
+
+    Pass a false value to switch it off again.
+    """
+    global __RECURSIVE_STR
+    __RECURSIVE_STR = on
+
+def dump(_Element element not None):
+    u"""dump(_Element element not None)
+
+    Return a recursively generated string representation of an element.
+
+    The result has one line per element and attribute and does not end
+    with a newline.
+    """
+    # start at indentation level 0
+    return _dump(element, 0)
+
+cdef object _dump(_Element element, int indent):
+    # Render 'element', its attributes and (recursively) its children, one
+    # line each, indented by four spaces per nesting level.
+    padding = u"    " * indent
+    if isinstance(element, ObjectifiedDataElement):
+        shown = repr(element)
+    else:
+        shown = textOf(element._c_node)
+        if shown is not None:
+            # whitespace-only text is displayed like missing text
+            shown = repr(shown) if shown.strip() else None
+    chunks = [u"%s%s = %s [%s]\n" % (padding, element.tag,
+                                     shown, _typename(element))]
+    xsi_prefix    = u"{%s}" % XML_SCHEMA_INSTANCE_NS
+    pytype_prefix = u"{%s}" % PYTYPE_NAMESPACE
+    for attr_name, attr_value in cetree.iterattributes(element, 3):
+        if u'{' in attr_name:
+            if attr_name == PYTYPE_ATTRIBUTE:
+                # the tree type annotation is not shown at all
+                if attr_value == TREE_PYTYPE_NAME:
+                    continue
+                attr_name = attr_name.replace(pytype_prefix, u'py:')
+            attr_name = attr_name.replace(xsi_prefix, u'xsi:')
+        chunks.append(u"%s  * %s = %r\n" % (padding, attr_name, attr_value))
+
+    for child in element.iterchildren():
+        chunks.append(_dump(child, indent + 1))
+    text = u"".join(chunks)
+    if indent == 0:
+        return text[:-1] # strip last '\n'
+    return text
+
+
+################################################################################
+# Pickle support for objectified ElementTree
+
+def __unpickleElementTree(data):
+    # rebuild the ElementTree by parsing the serialised data with
+    # this module's fromstring()
+    return etree.ElementTree(fromstring(data))
+
+cdef _setupPickle(elementTreeReduceFunction):
+    # register reduce/unpickle support for etree._ElementTree with the
+    # copy registry module of the running Python version
+    if not python.IS_PYTHON3:
+        import copy_reg as copyreg
+    else:
+        import copyreg
+    copyreg.pickle(
+        etree._ElementTree, elementTreeReduceFunction, __unpickleElementTree)
+
+def pickleReduceElementTree(obj):
+    # reduce the tree to its serialised form plus the function that
+    # parses it back
+    return (__unpickleElementTree, (etree.tostring(obj),))
+
+# install the pickle support, then drop the module level name of the
+# reduce function
+_setupPickle(pickleReduceElementTree)
+del pickleReduceElementTree
+
+################################################################################
+# Element class lookup
+
+cdef class ObjectifyElementClassLookup(ElementClassLookup):
+    u"""ObjectifyElementClassLookup(self, tree_class=None, empty_data_class=None)
+    Element class lookup method that uses the objectify classes.
+    """
+    cdef object empty_data_class
+    cdef object tree_class
+    def __init__(self, tree_class=None, empty_data_class=None):
+        u"""Lookup mechanism for objectify.
+
+        The default Element classes can be replaced by passing subclasses of
+        ObjectifiedElement and ObjectifiedDataElement as keyword arguments.
+        'tree_class' defines inner tree classes (defaults to
+        ObjectifiedElement), 'empty_data_class' defines the default class for
+        empty data elements (defaults to StringElement).
+        """
+        self._lookup_function = _lookupElementClass
+        self.tree_class = (
+            ObjectifiedElement if tree_class is None else tree_class)
+        self.empty_data_class = (
+            StringElement if empty_data_class is None else empty_data_class)
+
+cdef object _lookupElementClass(state, _Document doc, tree.xmlNode* c_node):
+    # Select the element class for 'c_node'.  The checks run in this order:
+    # children, xsi:nil, pytype attribute, xsi:type attribute, text content,
+    # and finally the configured defaults.  'state' is the
+    # ObjectifyElementClassLookup that installed this function.
+    cdef ObjectifyElementClassLookup lookup
+    cdef python.PyObject* dict_result
+    lookup = <ObjectifyElementClassLookup>state
+    # if element has children => no data class
+    if cetree.hasChild(c_node):
+        return lookup.tree_class
+
+    # if element is defined as xsi:nil, return NoneElement class
+    if u"true" == cetree.attributeValueFromNsName(
+        c_node, _XML_SCHEMA_INSTANCE_NS, <unsigned char*>"nil"):
+        return NoneElement
+
+    # check for Python type hint
+    value = cetree.attributeValueFromNsName(
+        c_node, _PYTYPE_NAMESPACE, _PYTYPE_ATTRIBUTE_NAME)
+    if value is not None:
+        if value == TREE_PYTYPE_NAME:
+            return lookup.tree_class
+        dict_result = python.PyDict_GetItem(_PYTYPE_DICT, value)
+        if dict_result is not NULL:
+            return (<PyType>dict_result)._type
+        # unknown 'pytype' => try to figure it out ourself, just go on
+
+    # check for XML Schema type hint
+    value = cetree.attributeValueFromNsName(
+        c_node, _XML_SCHEMA_INSTANCE_NS, <unsigned char*>"type")
+
+    if value is not None:
+        dict_result = python.PyDict_GetItem(_SCHEMA_TYPE_DICT, value)
+        if dict_result is NULL and u':' in value:
+            # retry without the namespace prefix
+            prefix, value = value.split(u':', 1)
+            dict_result = python.PyDict_GetItem(_SCHEMA_TYPE_DICT, value)
+        if dict_result is not NULL:
+            return (<PyType>dict_result)._type
+
+    # otherwise determine class based on text content type
+    el_class = _guessElementClass(c_node)
+    if el_class is not None:
+        return el_class
+
+    # if element is a root node => default to tree node
+    if c_node.parent is NULL or not tree._isElement(c_node.parent):
+        return lookup.tree_class
+
+    return lookup.empty_data_class
+
+
+################################################################################
+# Type annotations
+
+cdef PyType _check_type(tree.xmlNode* c_node, PyType pytype):
+    # Return 'pytype' if its type check accepts the text of the node,
+    # None otherwise (also for a None 'pytype').
+    if pytype is None:
+        return None
+    text = textOf(c_node)
+    try:
+        pytype.type_check(text)
+    except IGNORABLE_ERRORS:
+        # could not be parsed as the specified type => ignore
+        return None
+    return pytype
+
+def pyannotate(element_or_tree, *, ignore_old=False, ignore_xsi=False,
+             empty_pytype=None):
+    u"""pyannotate(element_or_tree, ignore_old=False, ignore_xsi=False, empty_pytype=None)
+
+    Recursively annotates the elements of an XML tree with 'pytype'
+    attributes.
+
+    If the 'ignore_old' keyword argument is True, current 'pytype'
+    attributes will be ignored and replaced.  Otherwise (the default), they
+    will be checked and only replaced if they no longer fit the current text
+    value.
+
+    Setting the keyword argument ``ignore_xsi`` to True makes the function
+    additionally ignore existing ``xsi:type`` annotations.  The default is to
+    use them as a type hint.
+
+    The default annotation of empty elements can be set with the
+    ``empty_pytype`` keyword argument.  The default is not to annotate empty
+    elements.  Pass 'str', for example, to make string values the default.
+    """
+    cdef _Element  element
+    element = cetree.rootNodeOrRaise(element_or_tree)
+    # annotate pytype only (annotate_xsi=0, annotate_pytype=1)
+    _annotate(element, 0, 1, ignore_xsi, ignore_old, None, empty_pytype)
+
+def xsiannotate(element_or_tree, *, ignore_old=False, ignore_pytype=False,
+                empty_type=None):
+    u"""xsiannotate(element_or_tree, ignore_old=False, ignore_pytype=False, empty_type=None)
+
+    Recursively annotates the elements of an XML tree with 'xsi:type'
+    attributes.
+
+    If the 'ignore_old' keyword argument is True, current 'xsi:type'
+    attributes will be ignored and replaced.  Otherwise (the default), they
+    will be checked and only replaced if they no longer fit the current text
+    value.
+
+    Note that the mapping from Python types to XSI types is usually ambiguous.
+    Currently, only the first XSI type name in the corresponding PyType
+    definition will be used for annotation.  Thus, you should consider naming
+    the widest type first if you define additional types.
+
+    Setting the keyword argument ``ignore_pytype`` to True makes the function
+    additionally ignore existing ``pytype`` annotations.  The default is to
+    use them as a type hint.
+
+    The default annotation of empty elements can be set with the
+    ``empty_type`` keyword argument.  The default is not to annotate empty
+    elements.  Pass 'string', for example, to make string values the default.
+    """
+    cdef _Element  element
+    element = cetree.rootNodeOrRaise(element_or_tree)
+    # annotate xsi:type only (annotate_xsi=1, annotate_pytype=0);
+    # 'ignore_old' refers to the existing xsi:type attributes here
+    _annotate(element, 1, 0, ignore_old, ignore_pytype, empty_type, None)
+
+def annotate(element_or_tree, *, ignore_old=True, ignore_xsi=False,
+             empty_pytype=None, empty_type=None, annotate_xsi=0,
+             annotate_pytype=1):
+    u"""annotate(element_or_tree, ignore_old=True, ignore_xsi=False, empty_pytype=None, empty_type=None, annotate_xsi=0, annotate_pytype=1)
+
+    Recursively annotates the elements of an XML tree with 'xsi:type'
+    and/or 'py:pytype' attributes.
+
+    If the 'ignore_old' keyword argument is True (the default), current
+    'py:pytype' attributes will be ignored for the type annotation.  Set to
+    False if you want to reuse existing 'py:pytype' information (iff
+    appropriate for the element text value).
+
+    If the 'ignore_xsi' keyword argument is False (the default), existing
+    'xsi:type' attributes will be used for the type annotation, if they fit the
+    element text values.
+
+    Note that the mapping from Python types to XSI types is usually ambiguous.
+    Currently, only the first XSI type name in the corresponding PyType
+    definition will be used for annotation.  Thus, you should consider naming
+    the widest type first if you define additional types.
+
+    The default 'py:pytype' annotation of empty elements can be set with the
+    ``empty_pytype`` keyword argument.  Pass 'str', for example, to make
+    string values the default.
+
+    The default 'xsi:type' annotation of empty elements can be set with the
+    ``empty_type`` keyword argument.  The default is not to annotate empty
+    elements.  Pass 'string', for example, to make string values the default.
+
+    The keyword arguments 'annotate_xsi' (default: 0) and 'annotate_pytype'
+    (default: 1) control which kind(s) of annotation to use.
+    """
+    cdef _Element  element
+    element = cetree.rootNodeOrRaise(element_or_tree)
+    # 'ignore_old' refers to the existing py:pytype attributes here
+    _annotate(element, annotate_xsi, annotate_pytype, ignore_xsi,
+              ignore_old, empty_type, empty_pytype)
+
+
+cdef _annotate(_Element element, bint annotate_xsi, bint annotate_pytype,
+               bint ignore_xsi, bint ignore_pytype,
+               empty_type_name, empty_pytype_name):
+    # Shared implementation of annotate(), pyannotate() and xsiannotate():
+    # resolves the default type for empty elements once and then calls
+    # _annotate_element() for the element nodes of the traversal.
+    cdef _Document doc
+    cdef tree.xmlNode* c_node
+    cdef PyType empty_pytype, StrType, NoneType
+
+    if not annotate_xsi and not annotate_pytype:
+        # nothing to do
+        return
+
+    # Byte string names are decoded as ASCII before the lookup.  Note that
+    # an XML Schema type name takes precedence: the pytype name is only
+    # looked up if no 'empty_type_name' was given.
+    if empty_type_name is not None:
+        if isinstance(empty_type_name, bytes):
+            empty_type_name = (<bytes>empty_type_name).decode("ascii")
+        dict_result = python.PyDict_GetItem(_SCHEMA_TYPE_DICT, empty_type_name)
+    elif empty_pytype_name is not None:
+        if isinstance(empty_pytype_name, bytes):
+            empty_pytype_name = (<bytes>empty_pytype_name).decode("ascii")
+        dict_result = python.PyDict_GetItem(_PYTYPE_DICT, empty_pytype_name)
+    else:
+        dict_result = NULL
+    if dict_result is not NULL:
+        empty_pytype = <PyType>dict_result
+    else:
+        # unknown or missing name => no default type for empty elements
+        empty_pytype = None
+
+    # both are None if the respective type is not currently registered
+    StrType  = _PYTYPE_DICT.get(u'str')
+    NoneType = _PYTYPE_DICT.get(u'NoneType')
+
+    doc = element._doc
+    c_node = element._c_node
+    # NOTE(review): traversal macro pair, presumably visiting c_node and the
+    # nodes below it -- confirm against the macro definition
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        _annotate_element(c_node, doc, annotate_xsi, annotate_pytype,
+                          ignore_xsi, ignore_pytype,
+                          empty_type_name, empty_pytype, StrType, NoneType)
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+
+cdef int _annotate_element(tree.xmlNode* c_node, _Document doc,
+                           bint annotate_xsi, bint annotate_pytype,
+                           bint ignore_xsi, bint ignore_pytype,
+                           empty_type_name, PyType empty_pytype,
+                           PyType StrType, PyType NoneType) except -1:
+    # Determine the type of a single element and write (or remove) its
+    # xsi:type and/or pytype attributes.  The type is taken from, in this
+    # order: xsi:nil, an existing valid xsi:type, an existing valid pytype,
+    # guessing from the text content, and the defaults for empty elements.
+    # Returns 0 on success; -1 signals an exception.
+    cdef tree.xmlNs*   c_ns
+    cdef python.PyObject* dict_result
+    cdef PyType pytype = None
+    typename = None
+    istree = 0
+
+    # if element is defined as xsi:nil, represent it as None
+    if cetree.attributeValueFromNsName(
+        c_node, _XML_SCHEMA_INSTANCE_NS, <unsigned char*>"nil") == "true":
+        pytype = NoneType
+
+    if  pytype is None and not ignore_xsi:
+        # check that old xsi type value is valid
+        typename = cetree.attributeValueFromNsName(
+            c_node, _XML_SCHEMA_INSTANCE_NS, <unsigned char*>"type")
+        if typename is not None:
+            dict_result = python.PyDict_GetItem(
+                _SCHEMA_TYPE_DICT, typename)
+            if dict_result is NULL and u':' in typename:
+                # retry without the namespace prefix
+                prefix, typename = typename.split(u':', 1)
+                dict_result = python.PyDict_GetItem(
+                    _SCHEMA_TYPE_DICT, typename)
+            if dict_result is not NULL:
+                pytype = <PyType>dict_result
+                if pytype is not StrType:
+                    # StrType does not have a typecheck but is the default
+                    # anyway, so just accept it if given as type
+                    # information
+                    pytype = _check_type(c_node, pytype)
+                    if pytype is None:
+                        typename = None
+
+    if pytype is None and not ignore_pytype:
+        # check that old pytype value is valid
+        old_pytypename = cetree.attributeValueFromNsName(
+            c_node, _PYTYPE_NAMESPACE, _PYTYPE_ATTRIBUTE_NAME)
+        if old_pytypename is not None:
+            if old_pytypename == TREE_PYTYPE_NAME:
+                if not cetree.hasChild(c_node):
+                    # only case where we should keep it,
+                    # everything else is clear enough
+                    pytype = TREE_PYTYPE
+            else:
+                if old_pytypename == 'none':
+                    # transition from lxml 1.x
+                    old_pytypename = "NoneType"
+                dict_result = python.PyDict_GetItem(
+                    _PYTYPE_DICT, old_pytypename)
+                if dict_result is not NULL:
+                    pytype = <PyType>dict_result
+                    if pytype is not StrType:
+                        # StrType does not have a typecheck but is the
+                        # default anyway, so just accept it if given as
+                        # type information
+                        pytype = _check_type(c_node, pytype)
+
+    if pytype is None:
+        # try to guess type
+        if not cetree.hasChild(c_node):
+            # element has no children => data class
+            pytype = _guessPyType(textOf(c_node), StrType)
+        else:
+            istree = 1
+
+    if pytype is None:
+        # use default type for empty elements
+        if cetree.hasText(c_node):
+            pytype = StrType
+        else:
+            pytype = empty_pytype
+            if typename is None:
+                typename = empty_type_name
+
+    if pytype is not None:
+        if typename is None:
+            if not istree:
+                if python.PyList_GET_SIZE(pytype._schema_types) > 0:
+                    # pytype->xsi:type is a 1:n mapping
+                    # simply take the first
+                    typename = pytype._schema_types[0]
+        # NOTE(review): unlike the branch above, this one does not check for
+        # an empty '_schema_types' list before indexing it -- looks like an
+        # unknown xsi:type combined with a type that has no schema types
+        # would raise IndexError here; confirm
+        elif typename not in pytype._schema_types:
+            typename = pytype._schema_types[0]
+
+    if annotate_xsi:
+        if typename is None or istree:
+            # no xsi:type to set => delete attribute if it exists
+            cetree.delAttributeFromNsName(
+                c_node, _XML_SCHEMA_INSTANCE_NS, <unsigned char*>"type")
+        else:
+            # update or create attribute
+            typename_utf8 = cetree.utf8(typename)
+            c_ns = cetree.findOrBuildNodeNsPrefix(
+                doc, c_node, _XML_SCHEMA_NS, <unsigned char*>'xsd')
+            if c_ns is not NULL:
+                # make the prefix of the type name agree with the prefix
+                # that the XML Schema namespace has on this node
+                if b':' in typename_utf8:
+                    prefix, name = typename_utf8.split(b':', 1)
+                    if c_ns.prefix is NULL or c_ns.prefix[0] == c'\0':
+                        typename_utf8 = name
+                    elif tree.xmlStrcmp(_xcstr(prefix), c_ns.prefix) != 0:
+                        typename_utf8 = (<unsigned char*>c_ns.prefix) + b':' + name
+                elif c_ns.prefix is not NULL and c_ns.prefix[0] != c'\0':
+                    typename_utf8 = (<unsigned char*>c_ns.prefix) + b':' + typename_utf8
+            c_ns = cetree.findOrBuildNodeNsPrefix(
+                doc, c_node, _XML_SCHEMA_INSTANCE_NS, <unsigned char*>'xsi')
+            tree.xmlSetNsProp(c_node, c_ns, <unsigned char*>"type", _xcstr(typename_utf8))
+
+    if annotate_pytype:
+        if pytype is None:
+            # delete attribute if it exists
+            cetree.delAttributeFromNsName(
+                c_node, _PYTYPE_NAMESPACE, _PYTYPE_ATTRIBUTE_NAME)
+        else:
+            # update or create attribute
+            c_ns = cetree.findOrBuildNodeNsPrefix(
+                doc, c_node, _PYTYPE_NAMESPACE, <unsigned char*>'py')
+            pytype_name = cetree.utf8(pytype.name)
+            tree.xmlSetNsProp(c_node, c_ns, _PYTYPE_ATTRIBUTE_NAME,
+                              _xcstr(pytype_name))
+            if pytype is NoneType:
+                # None values additionally carry xsi:nil="true"
+                c_ns = cetree.findOrBuildNodeNsPrefix(
+                    doc, c_node, _XML_SCHEMA_INSTANCE_NS, <unsigned char*>'xsi')
+                tree.xmlSetNsProp(c_node, c_ns, <unsigned char*>"nil", <unsigned char*>"true")
+
+    return 0
+
+# module level references to the etree helpers used by deannotate()
+cdef object _strip_attributes = etree.strip_attributes
+cdef object _cleanup_namespaces = etree.cleanup_namespaces
+
+def deannotate(element_or_tree, *, bint pytype=True, bint xsi=True,
+               bint xsi_nil=False, bint cleanup_namespaces=False):
+    u"""deannotate(element_or_tree, pytype=True, xsi=True, xsi_nil=False, cleanup_namespaces=False)
+
+    Recursively de-annotate the elements of an XML tree by removing
+    'py:pytype', 'xsi:type' and/or 'xsi:nil' attributes.
+
+    'py:pytype' attributes are removed if the 'pytype' keyword argument is
+    True (the default), 'xsi:type' attributes if the 'xsi' keyword argument
+    is True (the default), and 'xsi:nil' attributes if the 'xsi_nil' keyword
+    argument is True (default: False).
+
+    Note that this does not touch the namespace declarations by
+    default.  If you want to remove unused namespace declarations from
+    the tree, pass the option ``cleanup_namespaces=True``.
+    """
+    cdef list attribute_names
+    # collect the attributes that were selected for removal
+    attribute_names = [
+        attr_name
+        for selected, attr_name in ((pytype, PYTYPE_ATTRIBUTE),
+                                    (xsi, XML_SCHEMA_INSTANCE_TYPE_ATTR),
+                                    (xsi_nil, XML_SCHEMA_INSTANCE_NIL_ATTR))
+        if selected
+    ]
+
+    _strip_attributes(element_or_tree, *attribute_names)
+    if cleanup_namespaces:
+        _cleanup_namespaces(element_or_tree)
+
+################################################################################
+# Module level parser setup
+
+cdef object __DEFAULT_PARSER  # parser created at import time; set_default_parser() resets to it
+__DEFAULT_PARSER = etree.XMLParser(remove_blank_text=True)
+__DEFAULT_PARSER.set_element_class_lookup( ObjectifyElementClassLookup() )
+
+cdef object objectify_parser  # parser currently used as default by the factory functions below
+objectify_parser = __DEFAULT_PARSER
+
+def set_default_parser(new_parser = None):
+    u"""set_default_parser(new_parser = None)
+
+    Install ``new_parser`` as the default parser that objectify's
+    Element() and fromstring() functions use.
+
+    The argument must be an etree.XMLParser, otherwise TypeError is raised.
+
+    Calling this without an argument restores the original parser.
+    """
+    global objectify_parser
+    if new_parser is None:
+        # no argument: go back to the parser that was created at import time
+        new_parser = __DEFAULT_PARSER
+    elif not isinstance(new_parser, etree.XMLParser):
+        raise TypeError, u"parser must inherit from lxml.etree.XMLParser"
+    objectify_parser = new_parser
+
+def makeparser(**kw):
+    u"""makeparser(remove_blank_text=True, **kw)
+
+    Build a fresh XML parser that creates objectify trees.
+
+    All keyword arguments accepted by ``etree.XMLParser()`` are passed
+    through.  Blank text removal is switched on by default here; pass
+    the ``remove_blank_text`` boolean keyword option yourself to
+    override that.
+    """
+    # only fill in the default when the caller did not decide explicitly
+    kw.setdefault('remove_blank_text', True)
+    new_parser = etree.XMLParser(**kw)
+    new_parser.set_element_class_lookup( ObjectifyElementClassLookup() )
+    return new_parser
+
+cdef _Element _makeElement(tag, text, attrib, nsmap):  # shared element factory of Element() and DataElement()
+    return cetree.makeElement(tag, None, objectify_parser, text, None, attrib, nsmap)  # always uses the current default parser
+
+################################################################################
+# Module level factory functions
+
+cdef object _fromstring
+_fromstring = etree.fromstring
+
+SubElement = etree.SubElement
+
+def fromstring(xml, parser=None, *, base_url=None):
+    u"""fromstring(xml, parser=None, base_url=None)
+
+    Parse an XML string with the objectify parser; this is the objectify
+    specific version of the lxml.etree fromstring() function.
+
+    A different parser can be passed as second argument.
+
+    The ``base_url`` keyword argument sets the original base URL of the
+    document, which supports relative paths when looking up external
+    entities (DTD, XInclude, ...).
+    """
+    # without an explicit parser, fall back to the objectify default
+    chosen = objectify_parser if parser is None else parser
+    return _fromstring(xml, chosen, base_url=base_url)
+
+def XML(xml, parser=None, *, base_url=None):
+    u"""XML(xml, parser=None, base_url=None)
+
+    Literal factory that parses with the objectify parser; this is the
+    objectify specific version of the lxml.etree XML() function.
+
+    A different parser can be passed as second argument.
+
+    The ``base_url`` keyword argument sets the original base URL of the
+    document, which supports relative paths when looking up external
+    entities (DTD, XInclude, ...).
+    """
+    # same code path as fromstring(): default to the objectify parser
+    active_parser = parser if parser is not None else objectify_parser
+    return _fromstring(xml, active_parser, base_url=base_url)
+
+cdef object _parse
+_parse = etree.parse
+
+def parse(f, parser=None, *, base_url=None):
+    u"""parse(f, parser=None, base_url=None)
+
+    Parse a file or file-like object, by default with the objectify parser.
+
+    A different parser can be passed as second argument.
+
+    The ``base_url`` keyword sets a URL for the document when parsing
+    from a file-like object.  It is needed for looking up external
+    entities (DTD, XInclude, ...) that are given as relative paths.
+    """
+    # an explicitly passed parser wins over the module default
+    selected = objectify_parser if parser is None else parser
+    return _parse(f, selected, base_url=base_url)
+
+cdef dict _DEFAULT_NSMAP = {  # prefix -> namespace URI; used by Element()/DataElement() when nsmap is None
+    "py"  : PYTYPE_NAMESPACE,
+    "xsi" : XML_SCHEMA_INSTANCE_NS,
+    "xsd" : XML_SCHEMA_NS
+}
+
+E = ElementMaker()
+
+def Element(_tag, attrib=None, nsmap=None, *, _pytype=None, **_attributes):
+    u"""Element(_tag, attrib=None, nsmap=None, _pytype=None, **_attributes)
+
+    Objectify specific version of the lxml.etree Element() factory that
+    always creates a structural (tree) element.  Keyword attributes override
+    entries of ``attrib``; the ``attrib`` mapping itself is never modified.
+    NOTE: requires parser based element class lookup activated in lxml.etree!
+    """
+    if attrib is not None:
+        # copy: py:pytype is added below and must not leak into the caller's dict
+        attrib = dict(attrib)
+        attrib.update(_attributes)
+        _attributes = attrib
+    if _pytype is None:
+        _pytype = TREE_PYTYPE_NAME
+    if nsmap is None:
+        nsmap = _DEFAULT_NSMAP
+    _attributes[PYTYPE_ATTRIBUTE] = _pytype
+    return _makeElement(_tag, None, _attributes, nsmap)
+
+def DataElement(_value, attrib=None, nsmap=None, *, _pytype=None, _xsi=None,
+                **_attributes):
+    u"""DataElement(_value, attrib=None, nsmap=None, _pytype=None, _xsi=None, **_attributes)
+
+    Create a new element from a Python value and XML attributes taken from
+    keyword arguments or a dictionary passed as second argument.
+
+    Automatically adds a 'pytype' attribute for the Python type of the value,
+    if the type can be identified.  If '_pytype' or '_xsi' are among the
+    keyword arguments, they will be used instead.
+
+    If the _value argument is an ObjectifiedDataElement instance, its py:pytype,
+    xsi:type and other attributes and nsmap are reused unless they are redefined
+    in attrib and/or keyword arguments.  The attrib mapping is never modified.
+    """
+    cdef python.PyObject* dict_result
+    if nsmap is None:
+        nsmap = _DEFAULT_NSMAP
+    if attrib is not None and attrib:
+        # always copy: type attributes are added below, keep the caller's dict intact
+        attrib = dict(attrib)
+        attrib.update(_attributes)
+        _attributes = attrib
+    if isinstance(_value, ObjectifiedElement):
+        if _pytype is None:
+            if _xsi is None and not _attributes and nsmap is _DEFAULT_NSMAP:
+                # special case: no change!
+                return _value.__copy__()
+    if isinstance(_value, ObjectifiedDataElement):
+        # reuse existing nsmap unless redefined in nsmap parameter
+        temp = _value.nsmap
+        if temp is not None and temp:
+            temp = dict(temp)
+            temp.update(nsmap)
+            nsmap = temp
+        # reuse existing attributes unless redefined in attrib/_attributes
+        temp = _value.attrib
+        if temp is not None and temp:
+            temp = dict(temp)
+            temp.update(_attributes)
+            _attributes = temp
+        # reuse existing xsi:type or py:pytype attributes, unless provided as
+        # arguments
+        if _xsi is None and _pytype is None:
+            dict_result = python.PyDict_GetItem(_attributes,
+                                                XML_SCHEMA_INSTANCE_TYPE_ATTR)
+            if dict_result is not NULL:
+                _xsi = <object>dict_result
+            dict_result = python.PyDict_GetItem(_attributes, PYTYPE_ATTRIBUTE)
+            if dict_result is not NULL:
+                _pytype = <object>dict_result
+
+    if _xsi is not None:
+        if u':' in _xsi:
+            prefix, name = _xsi.split(u':', 1)
+            ns = nsmap.get(prefix)
+            if ns != XML_SCHEMA_NS:  # an explicit prefix must map to the XSD namespace
+                raise ValueError, u"XSD types require the XSD namespace"
+        elif nsmap is _DEFAULT_NSMAP:
+            name = _xsi
+            _xsi = u'xsd:' + _xsi  # the default nsmap binds XSD to the 'xsd' prefix
+        else:
+            name = _xsi
+            for prefix, ns in nsmap.items():  # find the prefix bound to the XSD namespace
+                if ns == XML_SCHEMA_NS:
+                    if prefix is not None and prefix:
+                        _xsi = prefix + u':' + _xsi
+                    break
+            else:
+                raise ValueError, u"XSD types require the XSD namespace"
+        _attributes[XML_SCHEMA_INSTANCE_TYPE_ATTR] = _xsi
+        if _pytype is None:
+            # allow using unregistered or even wrong xsi:type names
+            dict_result = python.PyDict_GetItem(_SCHEMA_TYPE_DICT, _xsi)
+            if dict_result is NULL:
+                dict_result = python.PyDict_GetItem(_SCHEMA_TYPE_DICT, name)
+            if dict_result is not NULL:
+                _pytype = (<PyType>dict_result).name
+
+    if _pytype is None:
+        _pytype = _pytypename(_value)
+
+    if _value is None and _pytype != u"str":
+        _pytype = _pytype or u"NoneType"
+        strval = None
+    elif python._isString(_value):
+        strval = _value
+    elif isinstance(_value, bool):
+        if _value:
+            strval = u"true"
+        else:
+            strval = u"false"
+    else:
+        stringify = unicode  # fallback for pytypes without a registered PyType
+        dict_result = python.PyDict_GetItem(_PYTYPE_DICT, _pytype)
+        if dict_result is not NULL:
+            stringify = (<PyType>dict_result).stringify
+        strval = stringify(_value)
+
+    if _pytype is not None:
+        if _pytype == u"NoneType" or _pytype == u"none":
+            strval = None
+            _attributes[XML_SCHEMA_INSTANCE_NIL_ATTR] = u"true"
+        else:
+            # check if type information from arguments is valid
+            dict_result = python.PyDict_GetItem(_PYTYPE_DICT, _pytype)
+            if dict_result is not NULL:
+                type_check = (<PyType>dict_result).type_check
+                if type_check is not None:
+                    type_check(strval)
+
+                _attributes[PYTYPE_ATTRIBUTE] = _pytype
+
+    return _makeElement(u"value", strval, _attributes, nsmap)
+
+
+################################################################################
+# ObjectPath
+
+include "objectpath.pxi"
diff --git a/lib/lxml/lxml_endian.h b/lib/lxml/lxml_endian.h
new file mode 100644
index 00000000..f53cb7ad
--- /dev/null
+++ b/lib/lxml/lxml_endian.h
@@ -0,0 +1,14 @@
+#ifndef PY_BIG_ENDIAN  /* everything below is skipped when PY_BIG_ENDIAN is already defined */
+
+#ifdef _MSC_VER
+typedef unsigned __int32 uint32_t;  /* MSVC branch: declare uint32_t without including <stdint.h> */
+#else
+#include <stdint.h>
+#endif
+
+static CYTHON_INLINE int _lx__is_big_endian(void) {  /* byte order probe, evaluated at run time */
+    union {uint32_t i; char c[4];} x = {0x01020304};  /* view the 32 bit value as four bytes */
+    return x.c[0] == 1;  /* the most significant byte (0x01) comes first only on big-endian layouts */
+}
+#define PY_BIG_ENDIAN _lx__is_big_endian()
+#endif  /* !PY_BIG_ENDIAN */
diff --git a/lib/lxml/nsclasses.pxi b/lib/lxml/nsclasses.pxi
new file mode 100644
index 00000000..b592951e
--- /dev/null
+++ b/lib/lxml/nsclasses.pxi
@@ -0,0 +1,239 @@
+# module-level API for namespace implementations
+
+class LxmlRegistryError(LxmlError):
+    u"""Base class of lxml registry errors (see NamespaceRegistryError).
+    """
+    pass
+
+class NamespaceRegistryError(LxmlRegistryError):
+    u"""Error registering a namespace extension (raised by registry __setitem__).
+    """
+    pass
+
+
+@cython.internal
+cdef class _NamespaceRegistry:
+    u"Dictionary-like namespace registry"
+    cdef object _ns_uri  # the namespace URI exactly as passed in (None allowed)
+    cdef bytes _ns_uri_utf  # _utf8() form of the URI, None if no URI was given
+    cdef dict _entries  # registered items, keyed by _utf8(name) or by None
+    cdef char* _c_ns_uri_utf  # C string obtained from _ns_uri_utf, NULL if no URI was given
+    def __cinit__(self, ns_uri):
+        self._ns_uri = ns_uri
+        if ns_uri is None:
+            self._ns_uri_utf = None
+            self._c_ns_uri_utf = NULL
+        else:
+            self._ns_uri_utf = _utf8(ns_uri)
+            self._c_ns_uri_utf = _cstr(self._ns_uri_utf)  # presumably points into the bytes object stored above - TODO confirm
+        self._entries = {}
+
+    def update(self, class_dict_iterable):
+        u"""update(self, class_dict_iterable)
+
+        Forgivingly update the registry.
+
+        ``class_dict_iterable`` may be a dict or some other iterable
+        that yields (name, value) pairs.
+
+        If a value does not match the required type for this registry,
+        or if the name starts with '_', it will be silently discarded.
+        This allows registrations at the module or class level using
+        vars(), globals() etc."""
+        if hasattr(class_dict_iterable, u'items'):
+            class_dict_iterable = class_dict_iterable.items()  # mapping: iterate its (name, value) pairs
+        for name, item in class_dict_iterable:
+            if (name is None or name[:1] != '_') and callable(item):  # NOTE(review): only callable() is tested; a subclass __setitem__ may still raise
+                self[name] = item  # goes through the __setitem__ that subclasses define
+
+    def __getitem__(self, name):
+        if name is not None:
+            name = _utf8(name)  # None is kept as-is and used as key directly
+        return self._get(name)
+
+    def __delitem__(self, name):
+        if name is not None:
+            name = _utf8(name)
+        del self._entries[name]  # raises the dict's own KeyError for unknown names
+
+    cdef object _get(self, object name):
+        cdef python.PyObject* dict_result
+        dict_result = python.PyDict_GetItem(self._entries, name)  # NULL (no exception set) when the key is missing
+        if dict_result is NULL:
+            raise KeyError, u"Name not registered."
+        return <object>dict_result
+
+    cdef object _getForString(self, char* name):  # same as _get(), but for a C string key
+        cdef python.PyObject* dict_result
+        dict_result = python.PyDict_GetItem(self._entries, name)
+        if dict_result is NULL:
+            raise KeyError, u"Name not registered."
+        return <object>dict_result
+
+    def __iter__(self):
+        return iter(self._entries)  # iterates over the stored keys
+
+    def items(self):
+        return list(self._entries.items())  # list copy of the (key, item) pairs
+
+    def iteritems(self):
+        return iter(self._entries.items())
+
+    def clear(self):
+        self._entries.clear()  # drops all registered items
+
+@cython.final
+@cython.internal
+cdef class _ClassNamespaceRegistry(_NamespaceRegistry):
+    u"Dictionary-like registry for namespace implementation classes"
+    def __setitem__(self, name, item):
+        if not python.PyType_Check(item) or not issubclass(item, ElementBase):  # only classes derived from ElementBase are accepted
+            raise NamespaceRegistryError, \
+                u"Registered element classes must be subtypes of ElementBase"
+        if name is not None:
+            name = _utf8(name)  # a None name is stored under the None key
+        self._entries[name] = item
+
+    def __repr__(self):
+        return u"Namespace(%r)" % self._ns_uri
+
+
+cdef class ElementNamespaceClassLookup(FallbackElementClassLookup):
+    u"""ElementNamespaceClassLookup(self, fallback=None)
+
+    Element class lookup scheme that searches the Element class in the
+    Namespace registry.
+    """
+    cdef dict _namespace_registries  # _utf8(ns_uri) or None -> _ClassNamespaceRegistry
+    def __cinit__(self):
+        self._namespace_registries = {}
+
+    def __init__(self, ElementClassLookup fallback=None):
+        FallbackElementClassLookup.__init__(self, fallback)
+        self._lookup_function = _find_nselement_class  # module-level lookup function for this scheme
+
+    def get_namespace(self, ns_uri):
+        u"""get_namespace(self, ns_uri)
+
+        Retrieve the namespace object associated with the given URI.
+        Pass None for the empty namespace.
+
+        Creates a new namespace object if it does not yet exist."""
+        if ns_uri:
+            ns_utf = _utf8(ns_uri)
+        else:
+            ns_utf = None  # any false URI (None, empty string) maps to the None key
+        try:
+            return self._namespace_registries[ns_utf]
+        except KeyError:
+            registry = self._namespace_registries[ns_utf] = \
+                       _ClassNamespaceRegistry(ns_uri)
+            return registry  # newly created registry, now stored for later calls
+
+cdef object _find_nselement_class(state, _Document doc, xmlNode* c_node):  # lookup function installed by ElementNamespaceClassLookup
+    cdef python.PyObject* dict_result
+    cdef ElementNamespaceClassLookup lookup
+    cdef _NamespaceRegistry registry
+    if state is None:
+        return _lookupDefaultElementClass(None, doc, c_node)  # no lookup object: use the default lookup
+
+    lookup = <ElementNamespaceClassLookup>state
+    if c_node.type != tree.XML_ELEMENT_NODE:
+        return _callLookupFallback(lookup, doc, c_node)  # non-element nodes always go to the fallback
+
+    c_namespace_utf = _getNs(c_node)
+    if c_namespace_utf is not NULL:
+        dict_result = python.PyDict_GetItem(
+            lookup._namespace_registries, <unsigned char*>c_namespace_utf)
+    else:
+        dict_result = python.PyDict_GetItem(
+            lookup._namespace_registries, None)  # elements without namespace use the None registry
+    if dict_result is not NULL:
+        registry = <_NamespaceRegistry>dict_result
+        classes = registry._entries
+
+        if c_node.name is not NULL:
+            dict_result = python.PyDict_GetItem(
+                classes, <unsigned char*>c_node.name)  # first choice: class registered for this tag name
+        else:
+            dict_result = NULL
+
+        if dict_result is NULL:
+            dict_result = python.PyDict_GetItem(classes, None)  # second choice: class registered under None
+
+        if dict_result is not NULL:
+            return <object>dict_result
+    return _callLookupFallback(lookup, doc, c_node)  # nothing registered: delegate to the fallback
+
+
+################################################################################
+# XPath extension functions
+
+cdef dict __FUNCTION_NAMESPACE_REGISTRIES
+__FUNCTION_NAMESPACE_REGISTRIES = {}
+
+def FunctionNamespace(ns_uri):
+    u"""FunctionNamespace(ns_uri)
+
+    Return the function namespace object that belongs to the given URI.
+    A false URI (None or empty) selects the registry stored under None.
+
+    The object is created and remembered on first request.  A function
+    namespace can only be used to register extension functions."""
+    key = _utf8(ns_uri) if ns_uri else None
+    known = __FUNCTION_NAMESPACE_REGISTRIES.get(key)
+    if known is not None:
+        return known
+    fresh = _XPathFunctionNamespaceRegistry(ns_uri)
+    __FUNCTION_NAMESPACE_REGISTRIES[key] = fresh
+    return fresh
+
+@cython.internal
+cdef class _FunctionNamespaceRegistry(_NamespaceRegistry):  # registry whose items are callables
+    def __setitem__(self, name, item):
+        if not callable(item):
+            raise NamespaceRegistryError, \
+                u"Registered functions must be callable."
+        if not name:  # unlike class registries, None or empty names are rejected
+            raise ValueError, \
+                u"extensions must have non empty names"
+        self._entries[_utf8(name)] = item
+
+    def __repr__(self):
+        return u"FunctionNamespace(%r)" % self._ns_uri
+
+@cython.final
+@cython.internal
+cdef class _XPathFunctionNamespaceRegistry(_FunctionNamespaceRegistry):
+    cdef object _prefix  # prefix as set by the user, None if not configured
+    cdef bytes _prefix_utf  # _utf8() form of _prefix, None if not configured
+
+    property prefix:
+        u"Namespace prefix for extension functions."
+        def __del__(self):
+            self._prefix = None # no prefix configured
+            self._prefix_utf = None
+        def __get__(self):
+            if self._prefix is None:
+                return ''  # an unset prefix reads back as the empty string
+            else:
+                return self._prefix
+        def __set__(self, prefix):
+            if prefix == '':
+                prefix = None # empty prefix
+            if prefix is None:
+                self._prefix_utf = None
+            else:
+                self._prefix_utf = _utf8(prefix)
+            self._prefix = prefix  # assigned last, after _utf8() accepted the value
+
+cdef list _find_all_extension_prefixes():
+    u"Collect (prefix, namespace URI) pairs of all prefixed function namespaces."
+    cdef _XPathFunctionNamespaceRegistry ns_registry
+    cdef list found = []
+    for ns_registry in __FUNCTION_NAMESPACE_REGISTRIES.itervalues():
+        # only registries that have both a prefix and a namespace URI count
+        if ns_registry._prefix_utf is None or ns_registry._ns_uri_utf is None:
+            continue
+        found.append((ns_registry._prefix_utf, ns_registry._ns_uri_utf))
+    return found
diff --git a/lib/lxml/objectpath.pxi b/lib/lxml/objectpath.pxi
new file mode 100644
index 00000000..0a51984f
--- /dev/null
+++ b/lib/lxml/objectpath.pxi
@@ -0,0 +1,330 @@
+################################################################################
+# ObjectPath
+
+ctypedef struct _ObjectPath:  # one compiled path segment
+    const_xmlChar* href  # namespace URI of the segment, NULL if the segment has none
+    const_xmlChar* name  # tag name of the segment, NULL for the relative root segment
+    Py_ssize_t index  # child index; a negative value starts the lookup at the last child
+
+
+cdef class ObjectPath:
+    u"""ObjectPath(path)
+    Immutable object that represents a compiled object path.
+
+    Example for a path: 'root.child[1].{other}child[25]'
+    """
+    cdef readonly object find  # bound __call__, exposed as a public alias
+    cdef object _path  # list of (ns, name, index) tuples produced by the path parsers
+    cdef object _path_str  # string form of the path, returned by str()
+    cdef _ObjectPath*  _c_path  # C array built from _path, released in __dealloc__
+    cdef Py_ssize_t _path_len  # number of segments in _path and _c_path
+    def __init__(self, path):
+        if python._isString(path):
+            self._path = _parseObjectPathString(path)
+            self._path_str = path
+        else:
+            self._path = _parseObjectPathList(path)  # non-strings are treated as a sequence of segment strings
+            self._path_str = u'.'.join(path)
+        self._path_len = python.PyList_GET_SIZE(self._path)
+        self._c_path = _buildObjectPathSegments(self._path)
+        self.find = self.__call__
+
+    def __dealloc__(self):
+        if self._c_path is not NULL:  # may still be NULL if __init__ failed before building it
+            python.PyMem_Free(self._c_path)
+
+    def __str__(self):
+        return self._path_str
+
+    def __call__(self, _Element root not None, *default):
+        u"""Follow the attribute path in the object structure and return the
+        target attribute value.
+
+        If it is not found, either returns a default value (if one was passed
+        as second argument) or raises AttributeError.
+        """
+        cdef Py_ssize_t use_default
+        use_default = python.PyTuple_GET_SIZE(default)  # number of extra positional arguments
+        if use_default == 1:
+            default = python.PyTuple_GET_ITEM(default, 0)  # unpack the single default value
+            python.Py_INCREF(default)  # NOTE(review): presumably balances the borrowed reference fetched above - confirm against the cimport declaration
+            use_default = 1
+        elif use_default > 1:
+            raise TypeError, u"invalid number of arguments: needs one or two"
+        return _findObjectPath(root, self._c_path, self._path_len,
+                               default, use_default)
+
+    def hasattr(self, _Element root not None):
+        u"hasattr(self, root)"
+        try:
+            _findObjectPath(root, self._c_path, self._path_len, None, 0)  # no default: a missing child raises AttributeError
+        except AttributeError:
+            return False
+        return True
+
+    def setattr(self, _Element root not None, value):
+        u"""setattr(self, root, value)
+
+        Set the value of the target element in a subtree.
+
+        If any of the children on the path does not exist, it is created.
+        """
+        _createObjectPath(root, self._c_path, self._path_len, 1, value)  # 1 = replace an existing target
+
+    def addattr(self, _Element root not None, value):
+        u"""addattr(self, root, value)
+
+        Append a value to the target element in a subtree.
+
+        If any of the children on the path does not exist, it is created.
+        """
+        _createObjectPath(root, self._c_path, self._path_len, 0, value)  # 0 = add next to an existing target
+
+cdef object __MATCH_PATH_SEGMENT  # match() of the regex for one segment; groups: dot, namespace, name, index
+__MATCH_PATH_SEGMENT = re.compile(
+    ur"(\.?)\s*(?:\{([^}]*)\})?\s*([^.{}\[\]\s]+)\s*(?:\[\s*([-0-9]+)\s*\])?",
+    re.U).match
+
+cdef object _RELATIVE_PATH_SEGMENT  # (ns, name, index) placeholder for a path that starts with '.'
+_RELATIVE_PATH_SEGMENT = (None, None, 0)
+
+cdef _parseObjectPathString(path):
+    u"""Parse object path string into a (ns, name, index) list.
+    """
+    cdef bint has_dot
+    cdef list new_path = []
+    if isinstance(path, bytes):
+        path = (<bytes>path).decode('ascii')  # byte strings must be plain ASCII
+    path = path.strip()
+    if path == u'.':
+        return [_RELATIVE_PATH_SEGMENT]  # a lone '.' yields just the relative root segment
+    path_pos = 0
+    while python.PyUnicode_GET_SIZE(path) > 0:  # for a non-empty path the loop is left via 'break' or an exception
+        match = __MATCH_PATH_SEGMENT(path, path_pos)
+        if match is None:
+            break  # no further segment at this position; leftovers are rejected after the loop
+
+        dot, ns, name, index = match.groups()
+        if index is None or not index:
+            index = 0  # no '[n]' suffix means index 0
+        else:
+            index = int(index)
+        has_dot = dot == u'.'
+        if python.PyList_GET_SIZE(new_path) == 0:
+            if has_dot:
+                # path '.child' => ignore root
+                new_path.append(_RELATIVE_PATH_SEGMENT)
+            elif index != 0:
+                raise ValueError, u"index not allowed on root node"
+        elif not has_dot:  # every segment after the first must be introduced by '.'
+            raise ValueError, u"invalid path"
+        if ns is not None:
+            ns = python.PyUnicode_AsUTF8String(ns)
+        name = python.PyUnicode_AsUTF8String(name)
+        new_path.append( (ns, name, index) )  # ns and name are stored as UTF-8 byte strings
+
+        path_pos = match.end()
+    if python.PyList_GET_SIZE(new_path) == 0 or \
+           python.PyUnicode_GET_SIZE(path) > path_pos:
+        raise ValueError, u"invalid path"  # nothing parsed, or unparsed text left at the end
+    return new_path
+
+cdef _parseObjectPathList(path):
+    u"""Parse object path sequence into a (ns, name, index) list.
+    """
+    cdef list new_path = []
+    for item in path:
+        item = item.strip()
+        if python.PyList_GET_SIZE(new_path) == 0 and item == u'':
+            # path '.child' => ignore root
+            ns = name = None
+            index = 0
+        else:
+            ns, name = cetree.getNsTag(item)
+            c_name = _xcstr(name)
+            index_pos = tree.xmlStrchr(c_name, c'[')  # position of an optional '[index]' suffix in the name
+            if index_pos is NULL:
+                index = 0
+            else:
+                index_end = tree.xmlStrchr(index_pos + 1, c']')
+                if index_end is NULL:
+                    raise ValueError, u"index must be enclosed in []"
+                index = int(index_pos[1:index_end - index_pos])  # the text between '[' and ']'
+                if python.PyList_GET_SIZE(new_path) == 0 and index != 0:
+                    raise ValueError, u"index not allowed on root node"
+                name = <bytes>c_name[:index_pos - c_name]  # keep only the part in front of '['
+        new_path.append( (ns, name, index) )
+    if python.PyList_GET_SIZE(new_path) == 0:
+        raise ValueError, u"invalid path"  # an empty sequence is not a valid path
+    return new_path
+
+cdef _ObjectPath* _buildObjectPathSegments(path_list) except NULL:  # result is released with PyMem_Free (see ObjectPath.__dealloc__)
+    cdef _ObjectPath* c_path
+    cdef _ObjectPath* c_path_segments
+    c_path_segments = <_ObjectPath*>python.PyMem_Malloc(
+        sizeof(_ObjectPath) * python.PyList_GET_SIZE(path_list))  # one struct per (href, name, index) tuple
+    if c_path_segments is NULL:
+        raise MemoryError()
+    c_path = c_path_segments  # write cursor; c_path_segments keeps the start of the array
+    for href, name, index in path_list:
+        c_path[0].href = _xcstr(href) if href is not None else NULL  # presumably points into the bytes object held by path_list - TODO confirm
+        c_path[0].name = _xcstr(name) if name is not None else NULL
+        c_path[0].index = index
+        c_path += 1
+    return c_path_segments
+
+cdef _findObjectPath(_Element root, _ObjectPath* c_path, Py_ssize_t c_path_len,
+                     default_value, int use_default):
+    u"""Follow the path to find the target element.
+    """
+    cdef tree.xmlNode* c_node
+    cdef Py_ssize_t c_index
+    c_node = root._c_node
+    c_name = c_path[0].name
+    c_href = c_path[0].href
+    if c_href is NULL or c_href[0] == c'\0':
+        c_href = tree._getNs(c_node)  # first segment without namespace: use the root node's own
+    if not cetree.tagMatches(c_node, c_href, c_name):
+        if use_default:
+            return default_value
+        else:
+            raise ValueError, \
+                u"root element does not match: need %s, got %s" % \
+                (cetree.namespacedNameFromNsName(c_href, c_name), root.tag)
+
+    while c_node is not NULL:
+        c_path_len -= 1
+        if c_path_len <= 0:
+            break  # all segments consumed: c_node is the target
+
+        c_path += 1
+        if c_path[0].href is not NULL:
+            c_href = c_path[0].href # otherwise: keep parent namespace
+        c_name = tree.xmlDictExists(c_node.doc.dict, c_path[0].name, -1)  # look the name up in the document's string dictionary
+        if c_name is NULL:
+            c_name = c_path[0].name  # name unknown to the dictionary: treated as "no such child"
+            c_node = NULL
+            break
+        c_index = c_path[0].index
+        c_node = c_node.last if c_index < 0 else c_node.children  # negative indexes start from the last child
+        c_node = _findFollowingSibling(c_node, c_href, c_name, c_index)
+
+    if c_node is not NULL:
+        return cetree.elementFactory(root._doc, c_node)
+    elif use_default:
+        return default_value
+    else:
+        tag = cetree.namespacedNameFromNsName(c_href, c_name)  # name of the first segment that could not be resolved
+        raise AttributeError, u"no such child: " + tag
+
+cdef _createObjectPath(_Element root, _ObjectPath* c_path,
+                       Py_ssize_t c_path_len, int replace, value):
+    u"""Follow the path to find the target element, build the missing children
+    as needed and set the target element to 'value'.  If replace is true, an
+    existing value is replaced, otherwise the new value is added.
+    """
+    cdef _Element child
+    cdef tree.xmlNode* c_node
+    cdef tree.xmlNode* c_child
+    cdef Py_ssize_t c_index
+    if c_path_len == 1:
+        raise TypeError, u"cannot update root node"  # a single-segment path names the root itself
+
+    c_node = root._c_node
+    c_name = c_path[0].name
+    c_href = c_path[0].href
+    if c_href is NULL or c_href[0] == c'\0':
+        c_href = tree._getNs(c_node)  # first segment without namespace: use the root node's own
+    if not cetree.tagMatches(c_node, c_href, c_name):
+        raise ValueError, \
+            u"root element does not match: need %s, got %s" % \
+            (cetree.namespacedNameFromNsName(c_href, c_name), root.tag)
+
+    while c_path_len > 1:
+        c_path_len -= 1
+        c_path += 1
+        if c_path[0].href is not NULL:
+            c_href = c_path[0].href # otherwise: keep parent namespace
+        c_index = c_path[0].index
+        c_name = tree.xmlDictExists(c_node.doc.dict, c_path[0].name, -1)  # look the name up in the document's string dictionary
+        if c_name is NULL:
+            c_name = c_path[0].name  # name unknown to the dictionary: treated as "no such child"
+            c_child = NULL
+        else:
+            c_child = c_node.last if c_index < 0 else c_node.children
+            c_child = _findFollowingSibling(c_child, c_href, c_name, c_index)
+
+        if c_child is not NULL:
+            c_node = c_child  # segment exists: descend into it
+        elif c_index != 0:
+            raise TypeError, \
+                u"creating indexed path attributes is not supported"
+        elif c_path_len == 1:  # last segment is missing: create it directly from the value
+            _appendValue(cetree.elementFactory(root._doc, c_node),
+                         cetree.namespacedNameFromNsName(c_href, c_name),
+                         value)
+            return
+        else:  # intermediate segment is missing: create an empty child and continue below it
+            child = cetree.makeSubElement(
+                cetree.elementFactory(root._doc, c_node),
+                cetree.namespacedNameFromNsName(c_href, c_name),
+                None, None, None, None)
+            c_node = child._c_node
+
+    # if we get here, the entire path was already there
+    if replace:
+        element = cetree.elementFactory(root._doc, c_node)
+        _replaceElement(element, value)
+    else:
+        _appendValue(cetree.elementFactory(root._doc, c_node.parent),
+                     cetree.namespacedName(c_node), value)  # add to the parent under the target's own tag
+
+cdef list _buildDescendantPaths(tree.xmlNode* c_node, prefix_string):
+    u"""Return the paths of c_node and of all elements below it as a list.
+    """
+    cdef list segments, collected
+    root_path = cetree.namespacedName(c_node)
+    if prefix_string:
+        # put the prefix in front, separated from the tag by exactly one '.'
+        if prefix_string[-1] != u'.':
+            prefix_string = prefix_string + u'.'
+        root_path = prefix_string + root_path
+    # 'segments' is the working stack of the recursion, 'collected' its output
+    segments = [root_path]
+    collected = []
+    _recursiveBuildDescendantPaths(c_node, segments, collected)
+    return collected
+
+cdef int _recursiveBuildDescendantPaths(tree.xmlNode* c_node,
+                                        list path, list path_list) except -1:
+    u"""Fills the list 'path_list' with all descendant paths, initial prefix
+    being in the list 'path'.
+    """
+    cdef python.PyObject* dict_result
+    cdef tree.xmlNode* c_child
+    cdef dict tags = {}  # tag -> index of its latest occurrence among the children of c_node
+    path_list.append( u'.'.join(path) )  # the path of c_node itself comes before those of its children
+    c_href = tree._getNs(c_node)
+    c_child = c_node.children
+    while c_child is not NULL:
+        while c_child.type != tree.XML_ELEMENT_NODE:  # skip over non-element siblings
+            c_child = c_child.next
+            if c_child is NULL:
+                return 0
+        if c_href is tree._getNs(c_child):  # pointer comparison - presumably relies on shared namespace strings, TODO confirm
+            tag = pyunicode(c_child.name)
+        elif c_href is not NULL and tree._getNs(c_child) is NULL:
+            # special case: parent has namespace, child does not
+            tag = u'{}' + pyunicode(c_child.name)
+        else:
+            tag = cetree.namespacedName(c_child)
+        dict_result = python.PyDict_GetItem(tags, tag)
+        count = (<object>dict_result) + 1 if dict_result is not NULL else 0  # 0 for the first child with this tag
+        tags[tag] = count
+        if count > 0:
+            tag += u'[%d]' % count  # only repeated tags get an explicit index
+        path.append(tag)
+        _recursiveBuildDescendantPaths(c_child, path, path_list)
+        del path[-1]  # restore the prefix for the next sibling
+        c_child = c_child.next
+    return 0
diff --git a/lib/lxml/parser.pxi b/lib/lxml/parser.pxi
new file mode 100644
index 00000000..fbcff6fa
--- /dev/null
+++ b/lib/lxml/parser.pxi
@@ -0,0 +1,1780 @@
+# Parsers for XML and HTML
+
+from lxml.includes cimport xmlparser
+from lxml.includes cimport htmlparser
+
+cdef class _ParserContext(_ResolverContext)
+cdef class _SaxParserContext(_ParserContext)
+cdef class _TargetParserContext(_SaxParserContext)
+cdef class _ParserSchemaValidationContext
+cdef class _Validator
+cdef class XMLSchema(_Validator)
+
+class ParseError(LxmlSyntaxError):
+    u"""Syntax error raised when an XML document cannot be parsed.
+
+    Instances carry the numeric error ``code`` and the ``position`` of
+    the error as a ``(line, column)`` tuple.
+
+    For compatibility with ElementTree 1.3 and later.
+    """
+    def __init__(self, message, code, line, column):
+        super(_ParseError, self).__init__(message)
+        self.code = code
+        self.position = (line, column)
+
+# module-level reference to the class, used by the super() call above
+cdef object _ParseError = ParseError
+
+class XMLSyntaxError(ParseError):
+    u"""Raised when a document that is being parsed is not well-formed XML.
+    """
+
+class ParserError(LxmlError):
+    u"""Raised on internal failures of the lxml parser machinery.
+    """
+
+@cython.final
+@cython.internal
+cdef class _ParserDictionaryContext:
+    # Global parser context to share the string dictionary.
+    #
+    # This class is a delegate singleton!
+    #
+    # It creates _ParserDictionaryContext objects for each thread to keep thread state,
+    # but those must never be used directly.  Always stick to using the static
+    # __GLOBAL_PARSER_CONTEXT as defined below the class.
+    #
+    # Every method that touches per-thread state first looks up the context
+    # object of the calling thread via _findThreadParserContext() and then
+    # operates on that object instead of 'self'.
+
+    # libxml2 string dictionary of this context, released in __dealloc__()
+    cdef tree.xmlDict* _c_dict
+    # default parser of this context, set up lazily by getDefaultParser()
+    cdef _BaseParser _default_parser
+    # stack of implied parser contexts, see push/popImpliedContext()
+    cdef list _implied_parser_contexts
+
+    def __cinit__(self):
+        self._c_dict = NULL
+        self._implied_parser_contexts = []
+
+    def __dealloc__(self):
+        # drop our reference to the dictionary, if we ever acquired one
+        if self._c_dict is not NULL:
+            xmlparser.xmlDictFree(self._c_dict)
+
+    cdef void initMainParserContext(self):
+        u"""Put the global context into the thread dictionary of the main
+        thread.  To be called once and only in the main thread."""
+        cdef python.PyObject* thread_dict
+        cdef python.PyObject* result
+        thread_dict = python.PyThreadState_GetDict()
+        # silently does nothing if there is no thread state dict
+        if thread_dict is not NULL:
+            (<dict>thread_dict)[u"_ParserDictionaryContext"] = self
+
+    cdef _ParserDictionaryContext _findThreadParserContext(self):
+        u"Find (or create) the _ParserDictionaryContext object for the current thread"
+        cdef python.PyObject* thread_dict
+        cdef python.PyObject* result
+        cdef _ParserDictionaryContext context
+        thread_dict = python.PyThreadState_GetDict()
+        if thread_dict is NULL:
+            # no thread state dict available => fall back to this object
+            return self
+        d = <dict>thread_dict
+        result = python.PyDict_GetItem(d, u"_ParserDictionaryContext")
+        if result is not NULL:
+            return <object>result
+        # first use in this thread: create a context and remember it in
+        # the thread state dict
+        context = _ParserDictionaryContext()
+        d[u"_ParserDictionaryContext"] = context
+        return context
+
+    cdef void setDefaultParser(self, _BaseParser parser):
+        u"Set the default parser for the current thread"
+        cdef _ParserDictionaryContext context
+        context = self._findThreadParserContext()
+        context._default_parser = parser
+
+    cdef _BaseParser getDefaultParser(self):
+        u"Return (or create) the default parser of the current thread"
+        cdef _ParserDictionaryContext context
+        context = self._findThreadParserContext()
+        if context._default_parser is None:
+            # make sure this object has a default parser of its own first
+            if self._default_parser is None:
+                self._default_parser = __DEFAULT_XML_PARSER._copy()
+            # a separate thread context gets its own copy of that parser
+            if context is not self:
+                context._default_parser = self._default_parser._copy()
+        return context._default_parser
+
+    cdef tree.xmlDict* _getThreadDict(self, tree.xmlDict* default):
+        u"Return the thread-local dict or create a new one if necessary."
+        cdef _ParserDictionaryContext context
+        context = self._findThreadParserContext()
+        if context._c_dict is NULL:
+            # thread dict not yet set up => use default or create a new one
+            if default is not NULL:
+                # adopt the caller's dict as the thread dict and take a
+                # reference for the context
+                context._c_dict = default
+                xmlparser.xmlDictReference(default)
+                return default
+            if self._c_dict is NULL:
+                self._c_dict = xmlparser.xmlDictCreate()
+            if context is not self:
+                # separate thread context => sub-dictionary of our own dict
+                context._c_dict = xmlparser.xmlDictCreateSub(self._c_dict)
+        return context._c_dict
+
+    cdef void initThreadDictRef(self, tree.xmlDict** c_dict_ref):
+        # Make 'c_dict_ref[0]' refer to the dict of the current thread.
+        # A different dict that was stored there before is freed and a
+        # reference to the thread dict is taken on behalf of the new owner.
+        cdef tree.xmlDict* c_dict
+        cdef tree.xmlDict* c_thread_dict
+        c_dict = c_dict_ref[0]
+        c_thread_dict = self._getThreadDict(c_dict)
+        if c_dict is c_thread_dict:
+            # already using the thread dict => nothing to do
+            return
+        if c_dict is not NULL:
+            xmlparser.xmlDictFree(c_dict)
+        c_dict_ref[0] = c_thread_dict
+        xmlparser.xmlDictReference(c_thread_dict)
+
+    cdef void initParserDict(self, xmlparser.xmlParserCtxt* pctxt):
+        u"Assure we always use the same string dictionary."
+        self.initThreadDictRef(&pctxt.dict)
+        pctxt.dictNames = 1
+
+    cdef void initXPathParserDict(self, xpath.xmlXPathContext* pctxt):
+        u"Assure we always use the same string dictionary."
+        self.initThreadDictRef(&pctxt.dict)
+
+    cdef void initDocDict(self, xmlDoc* result):
+        u"Store dict of last object parsed if no shared dict yet"
+        # XXX We also free the result dict here if there already was one.
+        # This case should only occur for new documents with empty dicts,
+        # otherwise we'd free data that's in use => segfault
+        self.initThreadDictRef(&result.dict)
+
+    cdef _ParserContext findImpliedContext(self):
+        u"""Return any current implied xml parser context for the current
+        thread.  This is used when the resolver functions are called
+        with an xmlParserCtxt that was generated from within libxml2
+        (i.e. without a _ParserContext) - which happens when parsing
+        schema and xinclude external references."""
+        cdef _ParserDictionaryContext context
+        cdef _ParserContext implied_context
+
+        # see if we have a current implied parser
+        context = self._findThreadParserContext()
+        if context._implied_parser_contexts:
+            # the most recently pushed context is the current one
+            implied_context = context._implied_parser_contexts[-1]
+            return implied_context
+        return None
+
+    cdef void pushImpliedContextFromParser(self, _BaseParser parser):
+        u"Push a new implied context object taken from the parser."
+        # a None entry is pushed for a None parser so that the matching
+        # popImpliedContext() call always finds an entry to remove
+        if parser is not None:
+            self.pushImpliedContext(parser._getParserContext())
+        else:
+            self.pushImpliedContext(None)
+
+    cdef void pushImpliedContext(self, _ParserContext parser_context):
+        u"Push a new implied context object."
+        cdef _ParserDictionaryContext context
+        context = self._findThreadParserContext()
+        context._implied_parser_contexts.append(parser_context)
+
+    cdef void popImpliedContext(self):
+        u"Pop the current implied context object."
+        cdef _ParserDictionaryContext context
+        context = self._findThreadParserContext()
+        context._implied_parser_contexts.pop()
+
+# The delegate singleton through which all per-thread parser state is
+# accessed.  It is created at module initialisation and registered in the
+# thread state dict of the initialising thread.
+cdef _ParserDictionaryContext __GLOBAL_PARSER_CONTEXT
+__GLOBAL_PARSER_CONTEXT = _ParserDictionaryContext()
+__GLOBAL_PARSER_CONTEXT.initMainParserContext()
+
+############################################################
+## support for Python unicode I/O
+############################################################
+
+# name of Python unicode encoding as known to libxml2
+# (stays NULL unless _setupPythonUnicode() finds a matching encoding handler)
+cdef const_char* _UNICODE_ENCODING = NULL
+
+cdef int _setupPythonUnicode() except -1:
+    u"""Sets _UNICODE_ENCODING to the internal encoding name of Python unicode
+    strings if libxml2 supports reading native Python unicode.  This depends
+    on iconv and the local Python installation, so we simply check if we find
+    a matching encoding handler.
+
+    Always returns 0; _UNICODE_ENCODING is left untouched if no encoding
+    name or no encoding handler could be found.
+    """
+    cdef tree.xmlCharEncodingHandler* enchandler
+    cdef Py_ssize_t l
+    cdef const_char* enc
+    # sample text '<test/>' stored as Py_UNICODE characters, inspected below
+    # byte by byte to find out how this Python build lays them out in memory
+    cdef Py_UNICODE *uchars = [c'<', c't', c'e', c's', c't', c'/', c'>']
+    cdef const_xmlChar* buffer = <const_xmlChar*>uchars
+    # apparently, libxml2 can't detect UTF-16 on some systems
+    if (buffer[0] == c'<' and buffer[1] == c'\0' and
+            buffer[2] == c't' and buffer[3] == c'\0'):
+        # two bytes per character, low byte first
+        enc = "UTF-16LE"
+    elif (buffer[0] == c'\0' and buffer[1] == c'<' and
+            buffer[2] == c'\0' and buffer[3] == c't'):
+        # two bytes per character, high byte first
+        enc = "UTF-16BE"
+    else:
+        # let libxml2 give it a try
+        enc = _findEncodingName(buffer, sizeof(Py_UNICODE) * 7)
+        if enc is NULL:
+            # not my fault, it's YOUR broken system :)
+            return 0
+    # only publish the encoding name if libxml2 has a handler for it
+    enchandler = tree.xmlFindCharEncodingHandler(enc)
+    if enchandler is not NULL:
+        global _UNICODE_ENCODING
+        # the handler was only needed for the lookup => close it again
+        tree.xmlCharEncCloseFunc(enchandler)
+        _UNICODE_ENCODING = enc
+    return 0
+
+cdef const_char* _findEncodingName(const_xmlChar* buffer, int size):
+    u"""Work around bug in libxml2: map the encoding that libxml2 detects
+    for 'buffer' to its iconv name on our own.
+
+    Returns NULL if libxml2 could not detect any encoding.
+    """
+    cdef tree.xmlCharEncoding enc
+    enc = tree.xmlDetectCharEncoding(buffer, size)
+    if enc == tree.XML_CHAR_ENCODING_NONE:
+        return NULL
+    if enc == tree.XML_CHAR_ENCODING_UTF16LE:
+        return "UTF-16LE"
+    if enc == tree.XML_CHAR_ENCODING_UTF16BE:
+        return "UTF-16BE"
+    if enc == tree.XML_CHAR_ENCODING_UCS4LE:
+        return "UCS-4LE"
+    if enc == tree.XML_CHAR_ENCODING_UCS4BE:
+        return "UCS-4BE"
+    # anything else: ask libxml2 for the name
+    # (returns a constant char*, no need to free it)
+    return tree.xmlGetCharEncodingName(enc)
+
+# run the detection once, when the module is initialised
+_setupPythonUnicode()
+
+############################################################
+## support for file-like objects
+############################################################
+
+@cython.final
+@cython.internal
+cdef class _FileReaderContext:
+    # Adapter that feeds the content of a Python file(-like) object into
+    # libxml2.  Data is either read directly from the underlying C FILE*
+    # (if PyFile_AsFile() provides one) or pulled through the object's
+    # .read() method by copyToBuffer().
+
+    # the object to read from; reset to None once it was closed by us
+    cdef object _filelike
+    # encoding name used for encoding unicode data and passed on to libxml2
+    cdef object _encoding
+    # encoded URL object that keeps the '_c_url' pointer alive
+    cdef object _url
+    # the chunk that was read last and is currently being copied out
+    cdef object _bytes
+    # receives exceptions that must not propagate through libxml2
+    cdef _ExceptionContext _exc_context
+    # offset of the next byte to copy from '_bytes', -1 after end of input
+    cdef Py_ssize_t _bytes_read
+    cdef char* _c_url
+    # whether _close_file() should actually close the file
+    cdef bint _close_file_after_read
+
+    def __cinit__(self, filelike, exc_context not None, url, encoding=None, bint close_file=False):
+        self._exc_context = exc_context
+        self._filelike = filelike
+        self._close_file_after_read = close_file
+        self._encoding = encoding
+        if url is None:
+            self._c_url = NULL
+        else:
+            url = _encodeFilename(url)
+            self._c_url = _cstr(url)
+        self._url = url
+        self._bytes  = b''
+        self._bytes_read = 0
+
+    cdef _close_file(self):
+        u"""Close the file if closing was requested on creation.
+
+        The reference to the file is dropped before close() is called,
+        so the file is closed at most once.  Objects without a close()
+        method are accepted.
+        """
+        if self._filelike is None or not self._close_file_after_read:
+            return
+        try:
+            close = self._filelike.close
+        except AttributeError:
+            close = None
+        finally:
+            self._filelike = None
+        if close is not None:
+            close()
+
+    cdef xmlparser.xmlParserInputBuffer* _createParserInputBuffer(self):
+        u"""Create a libxml2 input buffer that reads from the file.
+
+        Returns NULL if libxml2 fails to allocate the buffer.
+        """
+        cdef stdio.FILE* c_stream
+        cdef xmlparser.xmlParserInputBuffer* c_buffer
+        c_buffer = xmlparser.xmlAllocParserInputBuffer(0)
+        if c_buffer is NULL:
+            # allocation failed => report that to the caller instead of
+            # writing through a NULL pointer below
+            return NULL
+        c_stream = python.PyFile_AsFile(self._filelike)
+        if c_stream is NULL:
+            # no C-level FILE* available => read through the Python API
+            c_buffer.readcallback  = _readFilelikeParser
+            c_buffer.context = <python.PyObject*>self
+        else:
+            c_buffer.readcallback  = _readFileParser
+            c_buffer.context = c_stream
+        return c_buffer
+
+    cdef xmlparser.xmlParserInput* _createParserInput(
+            self, xmlparser.xmlParserCtxt* ctxt):
+        u"""Create a parser input stream for 'ctxt' that reads from the file.
+
+        Returns NULL if the input buffer could not be allocated.
+        """
+        cdef xmlparser.xmlParserInputBuffer* c_buffer
+        c_buffer = self._createParserInputBuffer()
+        if c_buffer is NULL:
+            return NULL
+        return xmlparser.xmlNewIOInputStream(ctxt, c_buffer, 0)
+
+    cdef tree.xmlDtd* _readDtd(self):
+        u"""Parse a DTD from the file.
+
+        Returns NULL if the input buffer could not be allocated.
+        """
+        cdef xmlparser.xmlParserInputBuffer* c_buffer
+        c_buffer = self._createParserInputBuffer()
+        if c_buffer is NULL:
+            return NULL
+        with nogil:
+            return xmlparser.xmlIOParseDTD(NULL, c_buffer, 0)
+
+    cdef xmlDoc* _readDoc(self, xmlparser.xmlParserCtxt* ctxt, int options):
+        u"""Parse an XML or HTML document (depending on 'ctxt.html') from
+        the file and return the libxml2 result.
+
+        Never raises: an exception raised while closing the file is
+        stored in the exception context instead.
+        """
+        cdef xmlDoc* result
+        cdef char* c_encoding
+        cdef stdio.FILE* c_stream
+        cdef xmlparser.xmlInputReadCallback c_read_callback
+        cdef xmlparser.xmlInputCloseCallback c_close_callback
+        cdef void* c_callback_context
+
+        if self._encoding is None:
+            c_encoding = NULL
+        else:
+            c_encoding = _cstr(self._encoding)
+
+        c_stream = python.PyFile_AsFile(self._filelike)
+        if c_stream is NULL:
+            # no C-level FILE* available => read through the Python API
+            c_read_callback  = _readFilelikeParser
+            c_callback_context = <python.PyObject*>self
+        else:
+            c_read_callback  = _readFileParser
+            c_callback_context = c_stream
+
+        orig_options = ctxt.options
+        with nogil:
+            if ctxt.html:
+                result = htmlparser.htmlCtxtReadIO(
+                        ctxt, c_read_callback, NULL, c_callback_context,
+                        self._c_url, c_encoding, options)
+                if result is not NULL:
+                    if _fixHtmlDictNames(ctxt.dict, result) < 0:
+                        tree.xmlFreeDoc(result)
+                        result = NULL
+            else:
+                result = xmlparser.xmlCtxtReadIO(
+                    ctxt, c_read_callback, NULL, c_callback_context,
+                    self._c_url, c_encoding, options)
+        ctxt.options = orig_options # work around libxml2 problem
+        try:
+            self._close_file()
+        except:
+            self._exc_context._store_raised()
+        finally:
+            return result  # swallow any exceptions
+
+    cdef int copyToBuffer(self, char* c_buffer, int c_requested):
+        u"""Copy up to 'c_requested' bytes of file data into 'c_buffer'.
+
+        Returns the number of bytes copied, 0 once the end of the input
+        was reached on an earlier call, or -1 on errors.  Never raises:
+        exceptions are stored in the exception context instead.
+        """
+        cdef int c_byte_count = 0
+        cdef char* c_start
+        cdef Py_ssize_t byte_count, remaining
+        if self._bytes_read < 0:
+            # end of input was already reached
+            return 0
+        try:
+            byte_count = python.PyBytes_GET_SIZE(self._bytes)
+            remaining  = byte_count - self._bytes_read
+            while c_requested > remaining:
+                # hand out the rest of the current chunk, then read more
+                c_start = _cstr(self._bytes) + self._bytes_read
+                cstring_h.memcpy(c_buffer, c_start, remaining)
+                c_byte_count += remaining
+                c_buffer += remaining
+                c_requested -= remaining
+
+                self._bytes = self._filelike.read(c_requested)
+                if not isinstance(self._bytes, bytes):
+                    if isinstance(self._bytes, unicode):
+                        if self._encoding is None:
+                            self._bytes = (<unicode>self._bytes).encode('utf8')
+                        else:
+                            self._bytes = python.PyUnicode_AsEncodedString(
+                                self._bytes, _cstr(self._encoding), NULL)
+                    else:
+                        self._close_file()
+                        raise TypeError, \
+                            u"reading from file-like objects must return byte strings or unicode strings"
+
+                remaining = python.PyBytes_GET_SIZE(self._bytes)
+                if remaining == 0:
+                    # empty read => end of input
+                    self._bytes_read = -1
+                    self._close_file()
+                    return c_byte_count
+                self._bytes_read = 0
+
+            if c_requested > 0:
+                # the current chunk holds enough data for what is missing
+                c_start = _cstr(self._bytes) + self._bytes_read
+                cstring_h.memcpy(c_buffer, c_start, c_requested)
+                c_byte_count += c_requested
+                self._bytes_read += c_requested
+        except:
+            c_byte_count = -1
+            self._exc_context._store_raised()
+            try:
+                self._close_file()
+            except:
+                self._exc_context._store_raised()
+        finally:
+            return c_byte_count  # swallow any exceptions
+
+cdef int _readFilelikeParser(void* ctxt, char* c_buffer, int c_size) with gil:
+    # libxml2 read callback for Python file-like objects: 'ctxt' is the
+    # _FileReaderContext that does the actual reading
+    cdef _FileReaderContext reader = <_FileReaderContext>ctxt
+    return reader.copyToBuffer(c_buffer, c_size)
+
+cdef int _readFileParser(void* ctxt, char* c_buffer, int c_size) nogil:
+    # libxml2 read callback for C-level files: 'ctxt' is the FILE* to read
+    cdef stdio.FILE* c_stream = <stdio.FILE*>ctxt
+    return stdio.fread(c_buffer, 1,  c_size, c_stream)
+
+############################################################
+## support for custom document loaders
+############################################################
+
+cdef xmlparser.xmlParserInput* _local_resolver(const_char* c_url, const_char* c_pubid,
+                                               xmlparser.xmlParserCtxt* c_context) with gil:
+    # External entity loader that lets the resolvers registered on the
+    # current parser context provide the input for 'c_url' / 'c_pubid'.
+    # Falls back to __DEFAULT_ENTITY_LOADER when there is no context, when
+    # no resolver provides a document or when no input could be created
+    # from the resolved document.  Returns NULL if a resolver raised an
+    # exception (which is stored in the context) or if there is no default
+    # loader to fall back to.
+    cdef _ResolverContext context
+    cdef xmlparser.xmlParserInput* c_input
+    cdef _InputDocument doc_ref
+    cdef _FileReaderContext file_context
+    # if there is no _ParserContext associated with the xmlParserCtxt
+    # passed, check to see if the thread state object has an implied
+    # context.
+    if c_context._private is not NULL:
+        context = <_ResolverContext>c_context._private
+    else:
+        context = __GLOBAL_PARSER_CONTEXT.findImpliedContext()
+
+    if context is None:
+        # no resolvers available => leave it all to the default loader
+        if __DEFAULT_ENTITY_LOADER is NULL:
+            return NULL
+        with nogil:
+            # free the GIL as we might do serious I/O here (e.g. HTTP)
+            c_input = __DEFAULT_ENTITY_LOADER(c_url, c_pubid, c_context)
+        return c_input
+
+    try:
+        if c_url is NULL:
+            url = None
+        else:
+            # parsing a related document (DTD etc.) => UTF-8 encoded URL?
+            url = _decodeFilename(<const_xmlChar*>c_url)
+        if c_pubid is NULL:
+            pubid = None
+        else:
+            pubid = funicode(<const_xmlChar*>c_pubid) # always UTF-8
+
+        doc_ref = context._resolvers.resolve(url, pubid, context)
+    except:
+        # exceptions must not pass through libxml2 => keep them for later
+        context._store_raised()
+        return NULL
+
+    if doc_ref is not None:
+        # 'data' is the Python object (if any) that backs the C input
+        if doc_ref._type == PARSER_DATA_STRING:
+            data = doc_ref._data_bytes
+            c_input = xmlparser.xmlNewInputStream(c_context)
+            if c_input is not NULL:
+                # let the input stream read directly from the byte string
+                c_input.base = _xcstr(data)
+                c_input.length = python.PyBytes_GET_SIZE(data)
+                c_input.cur = c_input.base
+                c_input.end = c_input.base + c_input.length
+        elif doc_ref._type == PARSER_DATA_FILENAME:
+            data = None
+            c_filename = _cstr(doc_ref._filename)
+            with nogil:
+                # free the GIL as we might do serious I/O here
+                c_input = xmlparser.xmlNewInputFromFile(
+                    c_context, c_filename)
+        elif doc_ref._type == PARSER_DATA_FILE:
+            file_context = _FileReaderContext(doc_ref._file, context, url,
+                                              None, doc_ref._close_file)
+            c_input = file_context._createParserInput(c_context)
+            data = file_context
+        else:
+            data = None
+            c_input = NULL
+
+        if data is not None:
+            # store a reference in the context's storage; presumably this
+            # keeps the object alive while libxml2 reads from it
+            context._storage.add(data)
+        if c_input is not NULL:
+            return c_input
+
+    if __DEFAULT_ENTITY_LOADER is NULL:
+        return NULL
+
+    with nogil:
+        # free the GIL as we might do serious I/O here (e.g. HTTP)
+        c_input = __DEFAULT_ENTITY_LOADER(c_url, c_pubid, c_context)
+    return c_input
+
+# remember the loader that libxml2 used before we replace it, so that
+# _local_resolver() can fall back to it
+cdef xmlparser.xmlExternalEntityLoader __DEFAULT_ENTITY_LOADER
+__DEFAULT_ENTITY_LOADER = xmlparser.xmlGetExternalEntityLoader()
+
+# from now on, external entity loading goes through _local_resolver()
+xmlparser.xmlSetExternalEntityLoader(<xmlparser.xmlExternalEntityLoader>_local_resolver)
+
+############################################################
+## Parsers
+############################################################
+
+@cython.internal
+cdef class _ParserContext(_ResolverContext):
+    # Python-level state that belongs to one libxml2 parser context:
+    # the error log, an optional schema validator, the lock that
+    # serialises use of the parser and the document being built.
+
+    cdef _ErrorLog _error_log
+    # may be None, so every use must be guarded by a None check
+    cdef _ParserSchemaValidationContext _validator
+    # the libxml2 parser context owned by this object (freed in __dealloc__)
+    cdef xmlparser.xmlParserCtxt* _c_ctxt
+    # NULL if threading support is disabled
+    cdef python.PyThread_type_lock _lock
+    cdef _Document _doc
+
+    def __cinit__(self):
+        self._c_ctxt = NULL
+        if not config.ENABLE_THREADING:
+            self._lock = NULL
+        else:
+            self._lock = python.PyThread_allocate_lock()
+        self._error_log = _ErrorLog()
+
+    def __dealloc__(self):
+        if config.ENABLE_THREADING and self._lock is not NULL:
+            python.PyThread_free_lock(self._lock)
+        if self._c_ctxt is not NULL:
+            xmlparser.xmlFreeParserCtxt(self._c_ctxt)
+
+    cdef _ParserContext _copy(self):
+        u"""Return a new context of the same class with copies of the
+        validator (if any) and the resolvers, but without a libxml2
+        parser context.
+        """
+        cdef _ParserContext context
+        context = self.__class__()
+        # '_validator' is optional.  Calling a cdef method on None is not
+        # checked by Cython, so it must be guarded explicitly.
+        if self._validator is not None:
+            context._validator = self._validator.copy()
+        _initParserContext(context, self._resolvers._copy(), NULL)
+        return context
+
+    cdef void _initParserContext(self, xmlparser.xmlParserCtxt* c_ctxt):
+        # link both sides: we keep the C context, and the C context points
+        # back to us through its '_private' field
+        self._c_ctxt = c_ctxt
+        c_ctxt._private = <void*>self
+
+    cdef void _resetParserContext(self):
+        u"Reset the libxml2 parser context (if any) for the next use."
+        if self._c_ctxt is not NULL:
+            if self._c_ctxt.html:
+                htmlparser.htmlCtxtReset(self._c_ctxt)
+                self._c_ctxt.disableSAX = 0 # work around bug in libxml2
+            else:
+                xmlparser.xmlClearParserCtxt(self._c_ctxt)
+
+    cdef int prepare(self) except -1:
+        u"""Acquire the parser lock and set the context up for a parser run.
+
+        Raises ParserError if the lock could not be acquired.
+        """
+        cdef int result
+        if config.ENABLE_THREADING and self._lock is not NULL:
+            with nogil:
+                result = python.PyThread_acquire_lock(
+                    self._lock, python.WAIT_LOCK)
+            if result == 0:
+                raise ParserError, u"parser locking failed"
+        self._error_log.clear()
+        self._doc = None
+        self._c_ctxt.sax.serror = _receiveParserError
+        if self._validator is not None:
+            self._validator.connect(self._c_ctxt, self._error_log)
+        return 0
+
+    cdef int cleanup(self) except -1:
+        u"Undo the setup done by prepare() and release the parser lock."
+        if self._validator is not None:
+            self._validator.disconnect()
+        self._resetParserContext()
+        self.clear()
+        self._doc = None
+        self._c_ctxt.sax.serror = NULL
+        if config.ENABLE_THREADING and self._lock is not NULL:
+            python.PyThread_release_lock(self._lock)
+        return 0
+
+    cdef object _handleParseResult(self, _BaseParser parser,
+                                   xmlDoc* result, filename):
+        u"""Check the parse result and return it as a document object.
+
+        Returns the document stored in 'self._doc' if it wraps the
+        resulting C document, and a newly created document otherwise.
+        """
+        c_doc = self._handleParseResultDoc(parser, result, filename)
+        if self._doc is not None and self._doc._c_doc is c_doc:
+            return self._doc
+        else:
+            return _documentFactory(c_doc, parser)
+
+    cdef xmlDoc* _handleParseResultDoc(self, _BaseParser parser,
+                                       xmlDoc* result, filename) except NULL:
+        u"Check the parse result and return the resulting C document."
+        recover = parser._parse_options & xmlparser.XML_PARSE_RECOVER
+        # a document that 'self._doc' refers to must not be freed on errors
+        return _handleParseResult(self, self._c_ctxt, result,
+                                  filename, recover,
+                                  free_doc=self._doc is None)
+
+cdef _initParserContext(_ParserContext context,
+                        _ResolverRegistry resolvers,
+                        xmlparser.xmlParserCtxt* c_ctxt):
+    # Set up the resolver part of 'context' and, if a libxml2 parser
+    # context is provided, attach that as well.
+    _initResolverContext(context, resolvers)
+    if c_ctxt is NULL:
+        return
+    context._initParserContext(c_ctxt)
+
+cdef void _forwardParserError(xmlparser.xmlParserCtxt* _parser_context, xmlerror.xmlError* error) with gil:
+    # pass the error on to the log of the _ParserContext that is stored in
+    # the '_private' field of the C parser context
+    cdef _ParserContext context = <_ParserContext>_parser_context._private
+    context._error_log._receive(error)
+
+cdef void _receiveParserError(void* c_context, xmlerror.xmlError* error) nogil:
+    # Structured error callback of the parser: errors are forwarded to the
+    # log of the owning _ParserContext if there is one and to the global
+    # error handling otherwise.  Nothing is forwarded unless __DEBUG is set.
+    cdef xmlparser.xmlParserCtxt* c_parser_ctxt = <xmlparser.xmlParserCtxt*>c_context
+    if not __DEBUG:
+        return
+    if c_parser_ctxt is not NULL and c_parser_ctxt._private is not NULL:
+        _forwardParserError(c_parser_ctxt, error)
+    else:
+        _forwardError(NULL, error)
+
+cdef int _raiseParseError(xmlparser.xmlParserCtxt* ctxt, filename,
+                          _ErrorLog error_log) except 0:
+    # Raise the exception that describes a failed parser run.  This
+    # function never returns normally; every branch raises:
+    #
+    # - IOError if a filename is known and the last libxml2 error is an
+    #   I/O error
+    # - otherwise an XMLSyntaxError, built from the error log if that is
+    #   non-empty, else from the last libxml2 error message, else without
+    #   a message
+    if filename is not None and \
+           ctxt.lastError.domain == xmlerror.XML_FROM_IO:
+        if isinstance(filename, bytes):
+            filename = _decodeFilenameWithLength(
+                <bytes>filename, len(<bytes>filename))
+        if ctxt.lastError.message is not NULL:
+            try:
+                message = (ctxt.lastError.message).decode('utf-8')
+            except UnicodeDecodeError:
+                # the filename may be in there => play safe
+                message = (ctxt.lastError.message).decode('iso8859-1')
+            message = u"Error reading file '%s': %s" % (
+                filename, message.strip())
+        else:
+            message = u"Error reading '%s'" % filename
+        raise IOError, message
+    elif error_log:
+        raise error_log._buildParseException(
+            XMLSyntaxError, u"Document is not well formed")
+    elif ctxt.lastError.message is not NULL:
+        # NOTE(review): unlike in the I/O branch above, the message is not
+        # decoded here before it is formatted - confirm that this is intended
+        message = (ctxt.lastError.message).strip()
+        code = ctxt.lastError.code
+        line = ctxt.lastError.line
+        column = ctxt.lastError.int2
+        if ctxt.lastError.line > 0:
+            message = u"line %d: %s" % (line, message)
+        raise XMLSyntaxError(message, code, line, column)
+    else:
+        raise XMLSyntaxError(None, xmlerror.XML_ERR_INTERNAL_ERROR, 0, 0)
+
+cdef xmlDoc* _handleParseResult(_ParserContext context,
+                                xmlparser.xmlParserCtxt* c_ctxt,
+                                xmlDoc* result, filename,
+                                bint recover, bint free_doc) except NULL:
+    # Check the outcome of a parser run and return the resulting document.
+    #
+    # 'context' may be None.  'result' is the document returned by libxml2
+    # (or NULL), 'recover' tells if the parser ran in recovery mode and
+    # 'free_doc' if a rejected document should be freed here.
+    #
+    # Raises the exception stored in the context if there is one, and
+    # otherwise the exception selected by _raiseParseError() if there is no
+    # acceptable document.
+    cdef bint well_formed
+    if result is not NULL:
+        __GLOBAL_PARSER_CONTEXT.initDocDict(result)
+
+    if c_ctxt.myDoc is not NULL:
+        # discard a document that the parser built but did not return
+        if c_ctxt.myDoc is not result:
+            __GLOBAL_PARSER_CONTEXT.initDocDict(c_ctxt.myDoc)
+            tree.xmlFreeDoc(c_ctxt.myDoc)
+        c_ctxt.myDoc = NULL
+
+    if result is not NULL:
+        # 'context' may be None (see the checks further down) and Cython
+        # does not check attribute access on None => guard it explicitly
+        if context is not None and context._validator is not None and \
+                not context._validator.isvalid():
+            well_formed = 0 # actually not 'valid', but anyway ...
+        elif recover or (c_ctxt.wellFormed and
+                         c_ctxt.lastError.level < xmlerror.XML_ERR_ERROR):
+            well_formed = 1
+        elif not c_ctxt.replaceEntities and not c_ctxt.validate \
+                 and context is not None:
+            # in this mode, we ignore errors about undefined entities
+            for error in context._error_log.filter_from_errors():
+                if error.type != ErrorTypes.WAR_UNDECLARED_ENTITY and \
+                       error.type != ErrorTypes.ERR_UNDECLARED_ENTITY:
+                    well_formed = 0
+                    break
+            else:
+                well_formed = 1
+        else:
+            well_formed = 0
+
+        if not well_formed:
+            if free_doc:
+                tree.xmlFreeDoc(result)
+            result = NULL
+
+    if context is not None and context._has_raised():
+        # an exception was stored during the parser run => it takes
+        # precedence over any result
+        if result is not NULL:
+            if free_doc:
+                tree.xmlFreeDoc(result)
+            result = NULL
+        context._raise_if_stored()
+
+    if result is NULL:
+        if context is not None:
+            _raiseParseError(c_ctxt, filename, context._error_log)
+        else:
+            _raiseParseError(c_ctxt, filename, None)
+    else:
+        if result.URL is NULL and filename is not None:
+            result.URL = tree.xmlStrdup(_xcstr(filename))
+        if result.encoding is NULL:
+            result.encoding = tree.xmlStrdup(<unsigned char*>"UTF-8")
+
+    if context is not None and context._validator is not None and \
+           context._validator._add_default_attributes:
+        # we currently need to do this here as libxml2 does not
+        # support inserting default attributes during parse-time
+        # validation
+        context._validator.inject_default_attributes(result)
+
+    return result
+
+cdef int _fixHtmlDictNames(tree.xmlDict* c_dict, xmlDoc* c_doc) nogil:
+    # Move the names of all elements in 'c_doc' and of their attributes
+    # into the dictionary 'c_dict'.  Returns 0 on success (also for a NULL
+    # document) and -1 if a dictionary lookup failed.
+    cdef xmlNode* c_node
+    if c_doc is NULL:
+        return 0
+    c_node = c_doc.children
+    # NOTE(review): the BEGIN/END macro pair presumably runs the statements
+    # in between for each node of the tree - confirm against its definition
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(<xmlNode*>c_doc, c_node, 1)
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        if _fixHtmlDictNodeNames(c_dict, c_node) < 0:
+            return -1
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+    return 0
+
+cdef int _fixHtmlDictSubtreeNames(tree.xmlDict* c_dict, xmlDoc* c_doc,
+                                  xmlNode* c_start_node) nogil:
+    """
+    Move names to the dict, iterating in document order, starting at
+    c_start_node. This is used in incremental parsing after each chunk.
+
+    Without a start node, the whole document is processed.  Returns 0 on
+    success (also for a NULL document) and -1 if a dictionary lookup failed.
+    """
+    cdef xmlNode* c_node
+    if not c_doc:
+        return 0
+    if not c_start_node:
+        return _fixHtmlDictNames(c_dict, c_doc)
+    c_node = c_start_node
+    # NOTE(review): the BEGIN/END macro pair presumably runs the statements
+    # in between for each node of the tree - confirm against its definition
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(<xmlNode*>c_doc, c_node, 1)
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        if _fixHtmlDictNodeNames(c_dict, c_node) < 0:
+            return -1
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+    return 0
+
+cdef inline int _fixHtmlDictNodeNames(tree.xmlDict* c_dict,
+                                      xmlNode* c_node) nogil:
+    # Replace the name of 'c_node' and the names of its attributes by the
+    # equal strings stored in 'c_dict', freeing the names they replace.
+    # Returns -1 if a dictionary lookup failed and 0 otherwise.
+    cdef xmlNode* c_attr
+    # the element name first ...
+    c_dict_name = tree.xmlDictLookup(c_dict, c_node.name, -1)
+    if c_dict_name is NULL:
+        return -1
+    if c_dict_name is not c_node.name:
+        tree.xmlFree(<char*>c_node.name)
+        c_node.name = c_dict_name
+    # ... then the name of each attribute
+    c_attr = <xmlNode*>c_node.properties
+    while c_attr is not NULL:
+        c_dict_name = tree.xmlDictLookup(c_dict, c_attr.name, -1)
+        if c_dict_name is NULL:
+            return -1
+        if c_dict_name is not c_attr.name:
+            tree.xmlFree(<char*>c_attr.name)
+            c_attr.name = c_dict_name
+        c_attr = c_attr.next
+    return 0
+
+@cython.internal
+cdef class _BaseParser:
+    cdef ElementClassLookup _class_lookup
+    cdef _ResolverRegistry _resolvers
+    cdef _ParserContext _parser_context
+    cdef _ParserContext _push_parser_context
+    cdef int _parse_options
+    cdef bint _for_html
+    cdef bint _remove_comments
+    cdef bint _remove_pis
+    cdef bint _strip_cdata
+    cdef XMLSchema _schema
+    cdef bytes _filename
+    cdef readonly object target
+    cdef object _default_encoding
+    cdef tuple _events_to_collect  # (event_types, tag)
+
+    def __init__(self, int parse_options, bint for_html, XMLSchema schema,
+                 remove_comments, remove_pis, strip_cdata, target, encoding):
+        # Store the parser configuration.  Only instances of XMLParser and
+        # HTMLParser (or subclasses) may be created.  A given 'encoding' is
+        # only accepted if libxml2 has an encoding handler for it.
+        cdef tree.xmlCharEncodingHandler* enchandler
+        if not isinstance(self, (XMLParser, HTMLParser)):
+            raise TypeError, u"This class cannot be instantiated"
+
+        self._parse_options = parse_options
+        self.target = target
+        self._for_html = for_html
+        self._remove_comments = remove_comments
+        self._remove_pis = remove_pis
+        self._strip_cdata = strip_cdata
+        self._schema = schema
+
+        self._resolvers = _ResolverRegistry()
+
+        if encoding is not None:
+            encoding = _utf8(encoding)
+            enchandler = tree.xmlFindCharEncodingHandler(_cstr(encoding))
+            if enchandler is NULL:
+                raise LookupError, u"unknown encoding: '%s'" % encoding
+            # the handler was only needed for the check
+            tree.xmlCharEncCloseFunc(enchandler)
+        self._default_encoding = encoding
+
+    cdef _setBaseURL(self, base_url):
+        # keep the base URL in its encoded form
+        encoded_url = _encodeFilename(base_url)
+        self._filename = encoded_url
+
+    cdef _collectEvents(self, event_types, tag):
+        # Remember which parse events to collect (and for which tag) as an
+        # (event_types, tag) tuple.  Duplicate event types are dropped.
+        if event_types is not None:
+            event_types = tuple(set(event_types))
+            _buildParseEventFilter(event_types)  # purely for validation
+        else:
+            event_types = ()
+        self._events_to_collect = (event_types, tag)
+
+    cdef _ParserContext _getParserContext(self):
+        # Return the parser context of this parser, creating and
+        # configuring it on first use.
+        cdef xmlparser.xmlParserCtxt* pctxt
+        if self._parser_context is not None:
+            return self._parser_context
+
+        self._parser_context = self._createContext(self.target, None)
+        if self._schema is not None:
+            self._parser_context._validator = \
+                self._schema._newSaxValidator(
+                    self._parse_options & xmlparser.XML_PARSE_DTDATTR)
+        pctxt = self._newParserCtxt()
+        _initParserContext(self._parser_context, self._resolvers, pctxt)
+        # node types that are to be dropped get their SAX callback removed
+        if self._remove_comments:
+            pctxt.sax.comment = NULL
+        if self._remove_pis:
+            pctxt.sax.processingInstruction = NULL
+        if self._strip_cdata:
+            # hard switch-off for CDATA nodes => makes them plain text
+            pctxt.sax.cdataBlock = NULL
+        return self._parser_context
+
+    cdef _ParserContext _getPushParserContext(self):  # context for the feed()/close() interface
+        cdef xmlparser.xmlParserCtxt* pctxt
+        if self._push_parser_context is None:  # built lazily on first use, then reused
+            self._push_parser_context = self._createContext(
+                self.target, self._events_to_collect)  # unlike the plain context, events may be collected
+            if self._schema is not None:
+                self._push_parser_context._validator = \
+                    self._schema._newSaxValidator(
+                        self._parse_options & xmlparser.XML_PARSE_DTDATTR)
+            pctxt = self._newPushParserCtxt()
+            _initParserContext(
+                self._push_parser_context, self._resolvers, pctxt)
+            if self._remove_comments:
+                pctxt.sax.comment = NULL  # clear the SAX callback for comments
+            if self._remove_pis:
+                pctxt.sax.processingInstruction = NULL  # clear the SAX callback for PIs
+            if self._strip_cdata:
+                # hard switch-off for CDATA nodes => makes them plain text
+                pctxt.sax.cdataBlock = NULL
+        return self._push_parser_context
+
+    cdef _ParserContext _createContext(self, target, events_to_collect):  # pick the context class to use
+        cdef _SaxParserContext sax_context
+        if target is not None:  # a parser target takes precedence
+            sax_context = _TargetParserContext(self)
+            (<_TargetParserContext>sax_context)._setTarget(target)
+        elif events_to_collect:  # no target, but events were requested
+            sax_context = _SaxParserContext(self)
+        else:
+            # nothing special to configure
+            return _ParserContext()
+        if events_to_collect:  # applies to both SAX-based context kinds above
+            events, tag = events_to_collect
+            sax_context._setEventFilter(events, tag)
+        return sax_context
+
+    cdef int _registerHtmlErrorHandler(self, xmlparser.xmlParserCtxt* c_ctxt) except -1:
+        cdef xmlparser.xmlSAXHandler* sax = c_ctxt.sax
+        if sax is not NULL and sax.initialized and sax.initialized != xmlparser.XML_SAX2_MAGIC:
+            # need to extend SAX1 context to SAX2 to get proper error reports
+            if <xmlparser.xmlSAXHandlerV1*>sax is &htmlparser.htmlDefaultSAXHandler:  # context still points at the shared default
+                sax = <xmlparser.xmlSAXHandler*> stdlib.malloc(sizeof(xmlparser.xmlSAXHandler))  # NOTE(review): plain malloc; confirm it matches how libxml2 frees ctxt.sax
+                if sax is NULL:
+                    raise MemoryError()
+                cstring_h.memcpy(sax, &htmlparser.htmlDefaultSAXHandler,
+                                 sizeof(htmlparser.htmlDefaultSAXHandler))  # copy size is that of the default handler struct
+                c_ctxt.sax = sax  # the context now uses the private copy
+            sax.initialized = xmlparser.XML_SAX2_MAGIC  # mark the handler as SAX2
+            sax.serror = _receiveParserError  # install the error callback
+            sax.startElementNs = NULL
+            sax.endElementNs = NULL
+            sax._private = NULL
+        return 0
+
+    cdef xmlparser.xmlParserCtxt* _newParserCtxt(self) except NULL:  # allocate the libxml2 context for non-push parsing
+        cdef xmlparser.xmlParserCtxt* c_ctxt
+        if self._for_html:
+            c_ctxt = htmlparser.htmlCreateMemoryParserCtxt('dummy', 5)  # placeholder buffer; real input is given per parse call
+            if c_ctxt is not NULL:
+                self._registerHtmlErrorHandler(c_ctxt)  # NOTE(review): c_ctxt is not freed here if this raises - confirm
+        else:
+            c_ctxt = xmlparser.xmlNewParserCtxt()
+        if c_ctxt is NULL:  # either creation function failed
+            raise MemoryError
+        return c_ctxt
+
+    cdef xmlparser.xmlParserCtxt* _newPushParserCtxt(self) except NULL:  # allocate the libxml2 context for feed()/close()
+        cdef xmlparser.xmlParserCtxt* c_ctxt
+        cdef char* c_filename = _cstr(self._filename) if self._filename is not None else NULL
+        if self._for_html:
+            c_ctxt = htmlparser.htmlCreatePushParserCtxt(
+                NULL, NULL, NULL, 0, c_filename, tree.XML_CHAR_ENCODING_NONE)  # no initial data chunk
+            if c_ctxt is not NULL:
+                self._registerHtmlErrorHandler(c_ctxt)  # NOTE(review): c_ctxt is not freed here if this raises - confirm
+                htmlparser.htmlCtxtUseOptions(c_ctxt, self._parse_options)
+        else:
+            c_ctxt = xmlparser.xmlCreatePushParserCtxt(
+                NULL, NULL, NULL, 0, c_filename)  # no initial data chunk
+            if c_ctxt is not NULL:
+                xmlparser.xmlCtxtUseOptions(c_ctxt, self._parse_options)
+        if c_ctxt is NULL:  # either creation function failed
+            raise MemoryError()
+        return c_ctxt
+
+    property error_log:
+        u"""The error log of the last parser run.
+        """
+        def __get__(self):
+            cdef _ParserContext context
+            context = self._getParserContext()  # the non-push context; see feed_error_log for feed()
+            return context._error_log.copy()  # callers receive a copy, not the live log
+
+    property resolvers:
+        u"The custom resolver registry of this parser."
+        def __get__(self):
+            return self._resolvers  # the registry object itself, not a copy
+
+    property version:
+        u"The version of the underlying XML parser."
+        def __get__(self):
+            return u"libxml2 %d.%d.%d" % LIBXML_VERSION  # LIBXML_VERSION supplies the three numbers
+
+    def setElementClassLookup(self, ElementClassLookup lookup = None):
+        u":deprecated: use ``parser.set_element_class_lookup(lookup)`` instead."
+        self.set_element_class_lookup(lookup)  # deprecated alias: simply forwards
+
+    def set_element_class_lookup(self, ElementClassLookup lookup = None):
+        u"""set_element_class_lookup(self, lookup = None)
+
+        Set a lookup scheme for element classes generated from this parser.
+
+        Reset it by passing None or nothing.
+        """
+        self._class_lookup = lookup  # None clears a previously configured lookup
+
+    cdef _BaseParser _copy(self):
+        u"Create a new parser with the same configuration."
+        cdef _BaseParser parser
+        parser = self.__class__()  # built with default arguments; settings are copied over below
+        parser._parse_options = self._parse_options
+        parser._for_html = self._for_html
+        parser._remove_comments = self._remove_comments
+        parser._remove_pis = self._remove_pis
+        parser._strip_cdata = self._strip_cdata
+        parser._filename = self._filename
+        parser._resolvers = self._resolvers  # same registry object, shared with the original
+        parser.target = self.target
+        parser._class_lookup  = self._class_lookup
+        parser._default_encoding = self._default_encoding
+        parser._schema = self._schema
+        parser._events_to_collect = self._events_to_collect
+        return parser  # parser contexts are not copied; the copy creates its own on demand
+
+    def copy(self):
+        u"""copy(self)
+
+        Create a new parser with the same configuration.
+        """
+        return self._copy()  # Python-visible wrapper around the C-level _copy()
+
+    def makeelement(self, _tag, attrib=None, nsmap=None, **_extra):
+        u"""makeelement(self, _tag, attrib=None, nsmap=None, **_extra)
+
+        Creates a new element associated with this parser.
+        """
+        return _makeElement(_tag, NULL, None, self, None, None,  # this parser instance is passed through
+                            attrib, nsmap, _extra)
+
+    # internal parser methods
+
+    cdef xmlDoc* _parseUnicodeDoc(self, utext, char* c_filename) except NULL:
+        u"""Parse unicode document, share dictionary if possible.
+        """
+        cdef _ParserContext context
+        cdef xmlDoc* result
+        cdef xmlparser.xmlParserCtxt* pctxt
+        cdef Py_ssize_t py_buffer_len
+        cdef int buffer_len, c_kind
+        cdef const_char* c_text
+        cdef const_char* c_encoding = _UNICODE_ENCODING  # used as-is for non-PEP393 strings
+        cdef bint is_pep393_string = (
+            python.PEP393_ENABLED and python.PyUnicode_IS_READY(utext))
+        if is_pep393_string:
+            c_text = <const_char*>python.PyUnicode_DATA(utext)
+            py_buffer_len = python.PyUnicode_GET_LENGTH(utext)  # length in characters, scaled to bytes below
+            c_kind = python.PyUnicode_KIND(utext)
+            if c_kind == 1:  # one byte per character
+                c_encoding = 'ISO-8859-1'
+            elif c_kind == 2:  # two bytes per character
+                py_buffer_len *= 2
+                if python.PY_BIG_ENDIAN:
+                    c_encoding = 'UTF-16BE'  # actually UCS-2
+                else:
+                    c_encoding = 'UTF-16LE'  # actually UCS-2
+            elif c_kind == 4:  # four bytes per character
+                py_buffer_len *= 4
+                if python.PY_BIG_ENDIAN:
+                    c_encoding = 'UCS-4BE'
+                else:
+                    c_encoding = 'UCS-4LE'
+            else:
+                assert False, "Illegal Unicode kind %d" % c_kind
+        else:
+            py_buffer_len = python.PyUnicode_GET_DATA_SIZE(utext)
+            c_text = python.PyUnicode_AS_DATA(utext)
+        assert py_buffer_len <= limits.INT_MAX  # the libxml2 read call below takes an int length
+        buffer_len = py_buffer_len
+
+        context = self._getParserContext()
+        context.prepare()
+        try:
+            pctxt = context._c_ctxt
+            __GLOBAL_PARSER_CONTEXT.initParserDict(pctxt)
+            orig_options = pctxt.options  # saved so it can be restored after the read call
+            with nogil:
+                if self._for_html:
+                    result = htmlparser.htmlCtxtReadMemory(
+                        pctxt, c_text, buffer_len, c_filename, c_encoding,
+                        self._parse_options)
+                    if result is not NULL:
+                        if _fixHtmlDictNames(pctxt.dict, result) < 0:  # fix-up failed: discard the document
+                            tree.xmlFreeDoc(result)
+                            result = NULL
+                else:
+                    result = xmlparser.xmlCtxtReadMemory(
+                        pctxt, c_text, buffer_len, c_filename, c_encoding,
+                        self._parse_options)
+            pctxt.options = orig_options # work around libxml2 problem
+
+            return context._handleParseResultDoc(self, result, None)
+        finally:
+            context.cleanup()  # always runs, pairing with prepare() above
+
+    cdef xmlDoc* _parseDoc(self, char* c_text, int c_len,
+                           char* c_filename) except NULL:
+        u"""Parse document, share dictionary if possible.
+        """
+        cdef _ParserContext context
+        cdef xmlDoc* result
+        cdef xmlparser.xmlParserCtxt* pctxt
+        cdef char* c_encoding
+        context = self._getParserContext()
+        context.prepare()
+        try:
+            pctxt = context._c_ctxt
+            __GLOBAL_PARSER_CONTEXT.initParserDict(pctxt)
+
+            if self._default_encoding is None:
+                c_encoding = NULL  # no override: libxml2 receives NULL as the encoding
+            else:
+                c_encoding = _cstr(self._default_encoding)
+
+            orig_options = pctxt.options  # saved so it can be restored after the read call
+            with nogil:
+                if self._for_html:
+                    result = htmlparser.htmlCtxtReadMemory(
+                        pctxt, c_text, c_len, c_filename,
+                        c_encoding, self._parse_options)
+                    if result is not NULL:
+                        if _fixHtmlDictNames(pctxt.dict, result) < 0:  # fix-up failed: discard the document
+                            tree.xmlFreeDoc(result)
+                            result = NULL
+                else:
+                    result = xmlparser.xmlCtxtReadMemory(
+                        pctxt, c_text, c_len, c_filename,
+                        c_encoding, self._parse_options)
+            pctxt.options = orig_options # work around libxml2 problem
+
+            return context._handleParseResultDoc(self, result, None)
+        finally:
+            context.cleanup()  # always runs, pairing with prepare() above
+
+    cdef xmlDoc* _parseDocFromFile(self, char* c_filename) except NULL:  # let libxml2 read and parse the named file
+        cdef _ParserContext context
+        cdef xmlDoc* result
+        cdef xmlparser.xmlParserCtxt* pctxt
+        cdef char* c_encoding
+        result = NULL
+
+        context = self._getParserContext()
+        context.prepare()
+        try:
+            pctxt = context._c_ctxt
+            __GLOBAL_PARSER_CONTEXT.initParserDict(pctxt)
+
+            if self._default_encoding is None:
+                c_encoding = NULL  # no override: libxml2 receives NULL as the encoding
+            else:
+                c_encoding = _cstr(self._default_encoding)
+
+            orig_options = pctxt.options  # saved so it can be restored after the read call
+            with nogil:
+                if self._for_html:
+                    result = htmlparser.htmlCtxtReadFile(
+                        pctxt, c_filename, c_encoding, self._parse_options)
+                    if result is not NULL:
+                        if _fixHtmlDictNames(pctxt.dict, result) < 0:  # fix-up failed: discard the document
+                            tree.xmlFreeDoc(result)
+                            result = NULL
+                else:
+                    result = xmlparser.xmlCtxtReadFile(
+                        pctxt, c_filename, c_encoding, self._parse_options)
+            pctxt.options = orig_options # work around libxml2 problem
+
+            return context._handleParseResultDoc(self, result, c_filename)
+        finally:
+            context.cleanup()  # always runs, pairing with prepare() above
+
+    cdef xmlDoc* _parseDocFromFilelike(self, filelike, filename,
+                                       encoding) except NULL:  # parse by reading from a Python file-like object
+        cdef _ParserContext context
+        cdef _FileReaderContext file_context
+        cdef xmlDoc* result
+        cdef xmlparser.xmlParserCtxt* pctxt
+        cdef char* c_filename  # NOTE(review): never referenced in this method
+        if not filename:
+            filename = None  # normalise any falsy name (e.g. an empty string) to None
+
+        context = self._getParserContext()
+        context.prepare()
+        try:
+            pctxt = context._c_ctxt
+            __GLOBAL_PARSER_CONTEXT.initParserDict(pctxt)
+            file_context = _FileReaderContext(
+                filelike, context, filename,
+                encoding or self._default_encoding)  # an explicit encoding wins over the parser default
+            result = file_context._readDoc(pctxt, self._parse_options)
+
+            return context._handleParseResultDoc(
+                self, result, filename)
+        finally:
+            context.cleanup()  # always runs, pairing with prepare() above
+
+############################################################
+## ET feed parser
+############################################################
+
+cdef class _FeedParser(_BaseParser):
+    cdef bint _feed_parser_running
+
+    property feed_error_log:
+        u"""The error log of the last (or current) run of the feed parser.
+
+        Note that this is local to the feed parser and thus is
+        different from what the ``error_log`` property returns.
+        """
+        def __get__(self):
+            return self._getPushParserContext()._error_log.copy()  # copy of the push context's log
+
+    cpdef feed(self, data):
+        u"""feed(self, data)
+
+        Feeds data to the parser.  The argument should be an 8-bit string
+        buffer containing encoded data, although Unicode is supported as long
+        as both string types are not mixed.
+
+        This is the main entry point to the consumer interface of a
+        parser.  The parser will parse as much of the XML stream as it
+        can on each call.  To finish parsing or to reset the parser,
+        call the ``close()`` method.  Both methods may raise
+        ParseError if errors occur in the input data.  If an error is
+        raised, there is no longer a need to call ``close()``.
+
+        The feed parser interface is independent of the normal parser
+        usage.  You can use the same parser as a feed parser and in
+        the ``parse()`` function concurrently.
+        """
+        cdef _ParserContext context
+        cdef xmlparser.xmlParserCtxt* pctxt
+        cdef Py_ssize_t py_buffer_len
+        cdef const_char* c_data
+        cdef const_char* c_encoding
+        cdef int buffer_len
+        cdef int error
+        cdef bint recover = self._parse_options & xmlparser.XML_PARSE_RECOVER  # in recover mode, errors do not stop feeding
+        if isinstance(data, bytes):
+            if self._default_encoding is None:
+                c_encoding = NULL  # no override configured; BOM sniffing below may still set one
+            else:
+                c_encoding = self._default_encoding
+            c_data = _cstr(data)
+            py_buffer_len = python.PyBytes_GET_SIZE(data)
+        elif isinstance(data, unicode):
+            if _UNICODE_ENCODING is NULL:
+                raise ParserError, \
+                    u"Unicode parsing is not supported on this platform"
+            c_encoding = _UNICODE_ENCODING
+            c_data = python.PyUnicode_AS_DATA(data)
+            py_buffer_len = python.PyUnicode_GET_DATA_SIZE(data)
+        else:
+            raise TypeError, u"Parsing requires string data"
+
+        context = self._getPushParserContext()
+        pctxt = context._c_ctxt
+        error = 0
+        if not self._feed_parser_running:  # first chunk of a run: reset the push context
+            context.prepare()
+            self._feed_parser_running = 1
+            c_filename = (_cstr(self._filename)
+                          if self._filename is not None else NULL)
+
+            if c_encoding is NULL and py_buffer_len >= 2:
+                # libxml2 can't handle BOMs here, so let's try ourselves
+                if c_data[0] in b'\xfe\xef\xff':
+                    # likely a BOM, let's take a closer look
+                    c_encoding = _findEncodingName(
+                        <const_xmlChar*>c_data,
+                        4 if py_buffer_len > 4 else <int>py_buffer_len)  # look at no more than 4 bytes
+                    if c_encoding is not NULL:
+                        # found it => skip over BOM (if there is one)
+                        if (c_data[0] == b'\xef' and
+                                c_data[1] == b'\xbb' and
+                                c_data[2] == b'\xbf'):
+                            c_data += 3  # UTF-8 BOM
+                            py_buffer_len -= 3
+                        elif (c_data[0] == b'\xfe' and c_data[1] == b'\xff' or
+                                c_data[0] == b'\xff' and c_data[1] == b'\xfe'):
+                            # UTF-16 BE/LE
+                            c_data += 2
+                            py_buffer_len -= 2
+
+            if self._for_html:
+                error = _htmlCtxtResetPush(
+                    pctxt, NULL, 0, c_filename, c_encoding,
+                    self._parse_options)  # no data is passed here; chunks are fed in the loop below
+            else:
+                xmlparser.xmlCtxtUseOptions(pctxt, self._parse_options)
+                error = xmlparser.xmlCtxtResetPush(
+                    pctxt, NULL, 0, c_filename, c_encoding)
+            if error:  # a failed reset is reported as MemoryError
+                raise MemoryError()
+            __GLOBAL_PARSER_CONTEXT.initParserDict(pctxt)
+
+        #print pctxt.charset, 'NONE' if c_encoding is NULL else c_encoding
+
+        fixup_error = 0
+        while py_buffer_len > 0 and (error == 0 or recover):  # stop at the first error unless recovering
+            with nogil:
+                if py_buffer_len > limits.INT_MAX:
+                    buffer_len = limits.INT_MAX  # chunk length is a C int, so feed at most INT_MAX bytes per call
+                else:
+                    buffer_len = <int>py_buffer_len
+                if self._for_html:
+                    c_node = pctxt.node  # last node where the parser stopped
+                    error = htmlparser.htmlParseChunk(pctxt, c_data, buffer_len, 0)
+                    # and now for the fun part: move node names to the dict
+                    if pctxt.myDoc:
+                        fixup_error = _fixHtmlDictSubtreeNames(
+                            pctxt.dict, pctxt.myDoc, c_node)
+                        if pctxt.myDoc.dict and pctxt.myDoc.dict is not pctxt.dict:  # make the document use the context's dict
+                            xmlparser.xmlDictFree(pctxt.myDoc.dict)
+                            pctxt.myDoc.dict = pctxt.dict
+                            xmlparser.xmlDictReference(pctxt.dict)
+                else:
+                    error = xmlparser.xmlParseChunk(pctxt, c_data, buffer_len, 0)
+                py_buffer_len -= buffer_len  # advance past the bytes just fed
+                c_data += buffer_len
+
+            if fixup_error and not context.has_raised():  # record it only if no exception is stored yet
+                context.store_exception(MemoryError())
+
+            if error and not pctxt.replaceEntities and not pctxt.validate:
+                # in this mode, we ignore errors about undefined entities
+                for entry in context._error_log.filter_from_errors():
+                    if entry.type != ErrorTypes.WAR_UNDECLARED_ENTITY and \
+                           entry.type != ErrorTypes.ERR_UNDECLARED_ENTITY:
+                        break
+                else:
+                    error = 0  # every logged error was about an undeclared entity
+
+        if fixup_error or not recover and (error or not pctxt.wellFormed):  # failure ends this feed run
+            self._feed_parser_running = 0
+            try:
+                context._handleParseResult(self, pctxt.myDoc, None)
+            finally:
+                context.cleanup()  # pairs with the prepare() done for the first chunk
+
+    cpdef close(self):
+        u"""close(self)
+
+        Terminates feeding data to this parser.  This tells the parser to
+        process any remaining data in the feed buffer, and then returns the
+        root Element of the tree that was parsed.
+
+        This method must be called after passing the last chunk of data into
+        the ``feed()`` method.  It should only be called when using the feed
+        parser interface, all other usage is undefined.
+        """
+        if not self._feed_parser_running:  # nothing was fed since the last close() or failure
+            raise XMLSyntaxError(u"no element found",
+                                 xmlerror.XML_ERR_INTERNAL_ERROR, 0, 0)
+
+        context = self._getPushParserContext()
+        pctxt = context._c_ctxt
+
+        self._feed_parser_running = 0  # the next feed() call starts a new run
+        if self._for_html:
+            htmlparser.htmlParseChunk(pctxt, NULL, 0, 1)  # empty chunk with the final argument set to 1
+        else:
+            xmlparser.xmlParseChunk(pctxt, NULL, 0, 1)  # empty chunk with the final argument set to 1
+
+        if (pctxt.recovery and not pctxt.disableSAX and
+                isinstance(context, _SaxParserContext)):
+            # apply any left-over 'end' events
+            (<_SaxParserContext>context).flushEvents()
+
+        try:
+            result = context._handleParseResult(self, pctxt.myDoc, None)
+        finally:
+            context.cleanup()  # NOTE(review): skipped if flushEvents() above raises - confirm whether it can
+
+        if isinstance(result, _Document):  # unwrap a document to its root element
+            return (<_Document>result).getroot()
+        else:
+            return result  # any other result is returned unchanged
+
+cdef int _htmlCtxtResetPush(xmlparser.xmlParserCtxt* c_ctxt,
+                             const_char* c_data, int buffer_len,
+                             const_char* c_filename, const_char* c_encoding,
+                             int parse_options) except -1:
+    cdef int error  # status code from libxml2, kept as a plain C int
+    # libxml2 lacks an HTML push parser setup function
+    error = xmlparser.xmlCtxtResetPush(
+        c_ctxt, NULL, 0, c_filename, c_encoding)  # reset without data; the chunk is parsed below
+    if error:
+        return error  # pass the non-zero status on to the caller
+
+    # fix libxml2 setup for HTML
+    c_ctxt.progressive = 1
+    c_ctxt.html = 1
+    htmlparser.htmlCtxtUseOptions(c_ctxt, parse_options)
+
+    if c_data is not NULL and buffer_len > 0:  # feed the first chunk only after the HTML setup above
+        return htmlparser.htmlParseChunk(c_ctxt, c_data, buffer_len, 0)
+    return 0
+
+############################################################
+## XML parser
+############################################################
+
+cdef int _XML_DEFAULT_PARSE_OPTIONS  # starting option set for XMLParser; keyword arguments adjust it
+_XML_DEFAULT_PARSE_OPTIONS = (
+    xmlparser.XML_PARSE_NOENT   |  # cleared by resolve_entities=False
+    xmlparser.XML_PARSE_NOCDATA |  # cleared by strip_cdata=False
+    xmlparser.XML_PARSE_NONET   |  # cleared by no_network=False
+    xmlparser.XML_PARSE_COMPACT |  # cleared by compact=False
+    xmlparser.XML_PARSE_BIG_LINES  # always on; no XMLParser keyword toggles it
+    )
+
+cdef class XMLParser(_FeedParser):
+    u"""XMLParser(self, encoding=None, attribute_defaults=False, dtd_validation=False, load_dtd=False, no_network=True, ns_clean=False, recover=False, XMLSchema schema=None, huge_tree=False, remove_blank_text=False, resolve_entities=True, remove_comments=False, remove_pis=False, strip_cdata=True, target=None, compact=True)
+
+    The XML parser.
+
+    Parsers can be supplied as additional argument to various parse
+    functions of the lxml API.  A default parser is always available
+    and can be replaced by a call to the global function
+    'set_default_parser'.  New parsers can be created at any time
+    without a major run-time overhead.
+
+    The keyword arguments in the constructor are mainly based on the
+    libxml2 parser configuration.  A DTD will also be loaded if DTD
+    validation or attribute default values are requested (unless you
+    additionally provide an XMLSchema from which the default
+    attributes can be read).
+
+    Available boolean keyword arguments:
+
+    - attribute_defaults - inject default attributes from DTD or XMLSchema
+    - dtd_validation     - validate against a DTD referenced by the document
+    - load_dtd           - use DTD for parsing
+    - no_network         - prevent network access for related files (default: True)
+    - ns_clean           - clean up redundant namespace declarations
+    - recover            - try hard to parse through broken XML
+    - remove_blank_text  - discard blank text nodes that appear ignorable
+    - remove_comments    - discard comments
+    - remove_pis         - discard processing instructions
+    - strip_cdata        - replace CDATA sections by normal text content (default: True)
+    - compact            - save memory for short text content (default: True)
+    - resolve_entities   - replace entities by their text value (default: True)
+    - huge_tree          - disable security restrictions and support very deep trees
+                           and very long text content (only affects libxml2 2.7+)
+
+    Other keyword arguments:
+
+    - encoding - override the document encoding
+    - target   - a parser target object that will receive the parse events
+    - schema   - an XMLSchema to validate against
+
+    Note that you should avoid sharing parsers between threads.  While this is
+    not harmful, it is more efficient to use separate parsers.  This does not
+    apply to the default parser.
+    """
+    def __init__(self, *, encoding=None, attribute_defaults=False,
+                 dtd_validation=False, load_dtd=False, no_network=True,
+                 ns_clean=False, recover=False, XMLSchema schema=None,
+                 huge_tree=False, remove_blank_text=False, resolve_entities=True,
+                 remove_comments=False, remove_pis=False, strip_cdata=True,
+                 target=None, compact=True):
+        cdef int parse_options
+        parse_options = _XML_DEFAULT_PARSE_OPTIONS  # start from the defaults, then adjust per keyword
+        if load_dtd:
+            parse_options = parse_options | xmlparser.XML_PARSE_DTDLOAD
+        if dtd_validation:
+            parse_options = parse_options | xmlparser.XML_PARSE_DTDVALID | \
+                            xmlparser.XML_PARSE_DTDLOAD
+        if attribute_defaults:
+            parse_options = parse_options | xmlparser.XML_PARSE_DTDATTR
+            if schema is None:  # without a schema, the defaults have to come from the DTD
+                parse_options = parse_options | xmlparser.XML_PARSE_DTDLOAD
+        if ns_clean:
+            parse_options = parse_options | xmlparser.XML_PARSE_NSCLEAN
+        if recover:
+            parse_options = parse_options | xmlparser.XML_PARSE_RECOVER
+        if remove_blank_text:
+            parse_options = parse_options | xmlparser.XML_PARSE_NOBLANKS
+        if huge_tree:
+            parse_options = parse_options | xmlparser.XML_PARSE_HUGE
+        if not no_network:
+            parse_options = parse_options ^ xmlparser.XML_PARSE_NONET  # set in the defaults, so XOR clears it
+        if not compact:
+            parse_options = parse_options ^ xmlparser.XML_PARSE_COMPACT  # set in the defaults, so XOR clears it
+        if not resolve_entities:
+            parse_options = parse_options ^ xmlparser.XML_PARSE_NOENT  # set in the defaults, so XOR clears it
+        if not strip_cdata:
+            parse_options = parse_options ^ xmlparser.XML_PARSE_NOCDATA  # set in the defaults, so XOR clears it
+
+        _BaseParser.__init__(self, parse_options, 0, schema,  # 0 is the for_html argument
+                             remove_comments, remove_pis, strip_cdata,
+                             target, encoding)
+
+
+cdef class XMLPullParser(XMLParser):
+    """XMLPullParser(self, events=None, *, tag=None, base_url=None, **kwargs)
+
+    XML parser that collects parse events in an iterator.
+
+    The collected events are the same as for iterparse(), but the
+    parser itself is non-blocking in the sense that it receives
+    data chunks incrementally through its .feed() method, instead
+    of reading them directly from a file(-like) object all by itself.
+
+    By default, it collects Element end events.  To change that,
+    pass any subset of the available events into the ``events``
+    argument: ``'start'``, ``'end'``, ``'start-ns'``,
+    ``'end-ns'``, ``'comment'``, ``'pi'``.
+
+    To support loading external dependencies relative to the input
+    source, you can pass the ``base_url``.
+    """
+    def __init__(self, events=None, *, tag=None, base_url=None, **kwargs):
+        XMLParser.__init__(self, **kwargs)  # remaining keywords are XMLParser options
+        if events is None:
+            events = ('end',)  # default documented above: element end events only
+        self._setBaseURL(base_url)
+        self._collectEvents(events, tag)
+
+    def read_events(self):  # returns the events_iterator of the push parser context
+        return (<_SaxParserContext?>self._getPushParserContext()).events_iterator  # '?' makes this a checked cast
+
+
+cdef class ETCompatXMLParser(XMLParser):
+    u"""ETCompatXMLParser(self, encoding=None, attribute_defaults=False, \
+                 dtd_validation=False, load_dtd=False, no_network=True, \
+                 ns_clean=False, recover=False, schema=None, \
+                 huge_tree=False, remove_blank_text=False, resolve_entities=True, \
+                 remove_comments=True, remove_pis=True, strip_cdata=True, \
+                 target=None, compact=True)
+
+    An XML parser with an ElementTree compatible default setup.
+
+    See the XMLParser class for details.
+
+    This parser has ``remove_comments`` and ``remove_pis`` enabled by default
+    and thus ignores comments and processing instructions.
+    """
+    def __init__(self, *, encoding=None, attribute_defaults=False,
+                 dtd_validation=False, load_dtd=False, no_network=True,
+                 ns_clean=False, recover=False, schema=None,
+                 huge_tree=False, remove_blank_text=False, resolve_entities=True,
+                 remove_comments=True, remove_pis=True, strip_cdata=True,
+                 target=None, compact=True):
+        XMLParser.__init__(self,  # every keyword is forwarded; only the two remove_* defaults differ
+                           attribute_defaults=attribute_defaults,
+                           dtd_validation=dtd_validation,
+                           load_dtd=load_dtd,
+                           no_network=no_network,
+                           ns_clean=ns_clean,
+                           recover=recover,
+                           remove_blank_text=remove_blank_text,
+                           huge_tree=huge_tree,
+                           compact=compact,
+                           resolve_entities=resolve_entities,
+                           remove_comments=remove_comments,
+                           remove_pis=remove_pis,
+                           strip_cdata=strip_cdata,
+                           target=target,
+                           encoding=encoding,
+                           schema=schema)
+
+# ET 1.2 compatible name
+XMLTreeBuilder = ETCompatXMLParser
+
+
+cdef XMLParser __DEFAULT_XML_PARSER  # the pre-installed default; set_default_parser() falls back to it
+__DEFAULT_XML_PARSER = XMLParser()  # built with the default keyword arguments
+
+__GLOBAL_PARSER_CONTEXT.setDefaultParser(__DEFAULT_XML_PARSER)  # register it as the initial default
+
+def set_default_parser(_BaseParser parser=None):
+    u"""set_default_parser(parser=None)
+
+    Set a default parser for the current thread.  This parser is used
+    globally whenever no parser is supplied to the various parse functions of
+    the lxml API.  If this function is called without a parser (or if it is
+    None), the default parser is reset to the original configuration.
+
+    Note that the pre-installed default parser is not thread-safe.  Avoid the
+    default parser in multi-threaded environments.  You can create a separate
+    parser for each thread explicitly or use a parser pool.
+    """
+    if parser is None:
+        parser = __DEFAULT_XML_PARSER  # fall back to the pre-installed XMLParser instance
+    __GLOBAL_PARSER_CONTEXT.setDefaultParser(parser)
+
+def get_default_parser():
+    u"get_default_parser()"
+    return __GLOBAL_PARSER_CONTEXT.getDefaultParser()  # whatever the global parser context currently holds as default
+
+############################################################
+## HTML parser
+############################################################
+
+cdef int _HTML_DEFAULT_PARSE_OPTIONS  # starting option set for HTMLParser; keyword arguments adjust it
+_HTML_DEFAULT_PARSE_OPTIONS = (
+    htmlparser.HTML_PARSE_RECOVER |  # cleared by recover=False
+    htmlparser.HTML_PARSE_NONET   |  # cleared by no_network=False
+    htmlparser.HTML_PARSE_COMPACT  # cleared by compact=False
+    )
+
+cdef class HTMLParser(_FeedParser):
+    u"""HTMLParser(self, encoding=None, remove_blank_text=False, \
+                   remove_comments=False, remove_pis=False, strip_cdata=True, \
+                   no_network=True, target=None, XMLSchema schema=None, \
+                   recover=True, compact=True)
+
+    The HTML parser.
+
+    This parser allows reading HTML into a normal XML tree.  By
+    default, it can read broken (non well-formed) HTML, depending on
+    the capabilities of libxml2.  Use the 'recover' option to switch
+    this off.
+
+    Available boolean keyword arguments:
+
+    - recover            - try hard to parse through broken HTML (default: True)
+    - no_network         - prevent network access for related files (default: True)
+    - remove_blank_text  - discard empty text nodes that are ignorable (i.e. not actual text content)
+    - remove_comments    - discard comments
+    - remove_pis         - discard processing instructions
+    - strip_cdata        - replace CDATA sections by normal text content (default: True)
+    - compact            - save memory for short text content (default: True)
+
+    Other keyword arguments:
+
+    - encoding - override the document encoding
+    - target   - a parser target object that will receive the parse events
+    - schema   - an XMLSchema to validate against
+
+    Note that you should avoid sharing parsers between threads for performance
+    reasons.
+    """
+    def __init__(self, *, encoding=None, remove_blank_text=False,
+                 remove_comments=False, remove_pis=False, strip_cdata=True,
+                 no_network=True, target=None, XMLSchema schema=None,
+                 recover=True, compact=True):
+        cdef int parse_options
+        parse_options = _HTML_DEFAULT_PARSE_OPTIONS  # start from the defaults, then adjust per keyword
+        if remove_blank_text:
+            parse_options = parse_options | htmlparser.HTML_PARSE_NOBLANKS
+        if not recover:
+            parse_options = parse_options ^ htmlparser.HTML_PARSE_RECOVER  # set in the defaults, so XOR clears it
+        if not no_network:
+            parse_options = parse_options ^ htmlparser.HTML_PARSE_NONET  # set in the defaults, so XOR clears it
+        if not compact:
+            parse_options = parse_options ^ htmlparser.HTML_PARSE_COMPACT  # set in the defaults, so XOR clears it
+
+        _BaseParser.__init__(self, parse_options, 1, schema,  # 1 is the for_html argument
+                             remove_comments, remove_pis, strip_cdata,
+                             target, encoding)
+
+
+cdef HTMLParser __DEFAULT_HTML_PARSER  # module-level HTML parser instance
+__DEFAULT_HTML_PARSER = HTMLParser()  # built with default options only
+
+
+cdef class HTMLPullParser(HTMLParser):
+    """HTMLPullParser(self, events=None, *, tag=None, base_url=None, **kwargs)
+
+    HTML parser that exposes its parse events through an iterator.
+
+    The events are the ones that iterparse() generates.  Unlike
+    iterparse(), this parser does not read from a file(-like) object
+    on its own: data chunks are pushed into it incrementally through
+    its .feed() method, which makes it non-blocking.
+
+    Only Element end events are collected by default.  Pass any subset
+    of ``'start'``, ``'end'``, ``'start-ns'``, ``'end-ns'``,
+    ``'comment'`` and ``'pi'`` as ``events`` to change that.
+
+    Pass ``base_url`` to allow loading external dependencies relative
+    to the input source.
+    """
+    def __init__(self, events=None, *, tag=None, base_url=None, **kwargs):
+        HTMLParser.__init__(self, **kwargs)
+        self._setBaseURL(base_url)
+        # without an explicit selection, only Element end events are collected
+        self._collectEvents(('end',) if events is None else events, tag)
+
+    def read_events(self):
+        cdef _SaxParserContext context
+        context = <_SaxParserContext?>self._getPushParserContext()
+        return context.events_iterator
+
+
+############################################################
+## helper functions for document creation
+############################################################
+
+cdef xmlDoc* _parseDoc(text, filename, _BaseParser parser) except NULL:  # parse an in-memory unicode or bytes string
+    cdef char* c_filename
+    cdef char* c_text
+    cdef Py_ssize_t c_len
+    cdef bint is_pep393_string
+    if parser is None:
+        parser = __GLOBAL_PARSER_CONTEXT.getDefaultParser()  # fall back to the default parser
+    if not filename:
+        c_filename = NULL
+    else:
+        filename_utf = _encodeFilenameUTF8(filename)  # local reference; presumably backs the C pointer below
+        c_filename = _cstr(filename_utf)
+    if isinstance(text, unicode):
+        is_pep393_string = (
+            python.PEP393_ENABLED and python.PyUnicode_IS_READY(text))
+        if is_pep393_string:
+            c_len = python.PyUnicode_GET_LENGTH(text)
+            c_len *= python.PyUnicode_KIND(text)  # length times character width
+        else:
+            c_len = python.PyUnicode_GET_DATA_SIZE(text)
+        if c_len > limits.INT_MAX:  # too large for an int-sized length: parse through a file-like wrapper
+            return (<_BaseParser>parser)._parseDocFromFilelike(
+                StringIO(text), filename, None)
+        if _UNICODE_ENCODING is NULL and not is_pep393_string:  # no native unicode encoding known: go through UTF-8 bytes
+            text = (<unicode>text).encode('utf8')
+            return (<_BaseParser>parser)._parseDocFromFilelike(
+                BytesIO(text), filename, "UTF-8")
+        return (<_BaseParser>parser)._parseUnicodeDoc(text, c_filename)
+    else:  # NOTE(review): text is assumed to be a bytes object here, it is not checked in this function
+        c_len = python.PyBytes_GET_SIZE(text)
+        if c_len > limits.INT_MAX:  # same size limit as for unicode input
+            return (<_BaseParser>parser)._parseDocFromFilelike(
+                BytesIO(text), filename, None)
+        c_text = _cstr(text)
+        return (<_BaseParser>parser)._parseDoc(c_text, c_len, c_filename)
+
+cdef xmlDoc* _parseDocFromFile(filename8, _BaseParser parser) except NULL:  # parse the file named by filename8
+    if parser is None:
+        parser = __GLOBAL_PARSER_CONTEXT.getDefaultParser()  # fall back to the default parser
+    return (<_BaseParser>parser)._parseDocFromFile(_cstr(filename8))
+
+cdef xmlDoc* _parseDocFromFilelike(source, filename,
+                                   _BaseParser parser) except NULL:  # parse from a file-like object
+    if parser is None:
+        parser = __GLOBAL_PARSER_CONTEXT.getDefaultParser()  # fall back to the default parser
+    return (<_BaseParser>parser)._parseDocFromFilelike(source, filename, None)  # None: no encoding override
+
+cdef xmlDoc* _newXMLDoc() except NULL:  # create an empty XML document, raises MemoryError on failure
+    cdef xmlDoc* result
+    result = tree.xmlNewDoc(NULL)
+    if result is NULL:
+        raise MemoryError()
+    if result.encoding is NULL:
+        result.encoding = tree.xmlStrdup(<unsigned char*>"UTF-8")  # default the encoding to UTF-8
+    __GLOBAL_PARSER_CONTEXT.initDocDict(result)  # set up the document's name dictionary via the global parser context
+    return result
+
+cdef xmlDoc* _newHTMLDoc() except NULL:  # create an empty HTML document, raises MemoryError on failure
+    cdef xmlDoc* result
+    result = tree.htmlNewDoc(NULL, NULL)
+    if result is NULL:
+        raise MemoryError()
+    __GLOBAL_PARSER_CONTEXT.initDocDict(result)  # set up the document's name dictionary via the global parser context
+    return result
+
+cdef xmlDoc* _copyDoc(xmlDoc* c_doc, int recursive) except NULL:  # copy c_doc, with its content iff recursive is non-zero
+    cdef xmlDoc* result
+    if recursive:
+        with nogil:  # the GIL is released only for the recursive copy
+            result = tree.xmlCopyDoc(c_doc, recursive)
+    else:
+        result = tree.xmlCopyDoc(c_doc, 0)
+    if result is NULL:
+        raise MemoryError()
+    __GLOBAL_PARSER_CONTEXT.initDocDict(result)  # set up the copy's name dictionary via the global parser context
+    return result
+
+cdef xmlDoc* _copyDocRoot(xmlDoc* c_doc, xmlNode* c_new_root) except NULL:
+    u"Recursively copy the document and make c_new_root the new root node."
+    cdef xmlNode* c_node
+    # _copyDoc() raises MemoryError on a NULL copy and initialises the doc dict
+    cdef xmlDoc* result = _copyDoc(c_doc, 0) # non recursive
+    with nogil:
+        c_node = tree.xmlDocCopyNode(c_new_root, result, 1) # recursive
+    if c_node is NULL:
+        tree.xmlFreeDoc(result) # do not leak the still empty document copy
+        raise MemoryError()
+    tree.xmlDocSetRootElement(result, c_node)
+    _copyTail(c_new_root.next, c_node)
+    return result
+
+cdef xmlNode* _copyNodeToDoc(xmlNode* c_node, xmlDoc* c_doc) except NULL:
+    u"Recursively copy the element into the document. c_doc is not modified."
+    cdef xmlNode* c_root
+    c_root = tree.xmlDocCopyNode(c_node, c_doc, 1) # recursive
+    if c_root is NULL:
+        raise MemoryError()
+    _copyTail(c_node.next, c_root)  # also carry over what follows c_node as its tail
+    return c_root  # the copy is returned without being linked into c_doc here
+
+
+############################################################
+## API level helper functions for _Document creation
+############################################################
+
+cdef _Document _parseDocument(source, _BaseParser parser, base_url):  # dispatch on the kind of source: path/URL string, StringIO-like, or file-like
+    cdef _Document doc
+    if _isString(source):
+        # parse the file directly from the filesystem
+        doc = _parseDocumentFromURL(_encodeFilename(source), parser)
+        # fix base URL if requested
+        if base_url is not None:
+            base_url = _encodeFilenameUTF8(base_url)
+            if doc._c_doc.URL is not NULL:
+                tree.xmlFree(<char*>doc._c_doc.URL)  # release the URL that the parser stored
+            doc._c_doc.URL = tree.xmlStrdup(_xcstr(base_url))
+        return doc
+
+    if base_url is not None:
+        url = base_url  # an explicit base URL wins over the file object's name
+    else:
+        url = _getFilenameForFile(source)
+
+    if hasattr(source, u'getvalue') and hasattr(source, u'tell'):
+        # StringIO - reading from start?
+        if source.tell() == 0:
+            return _parseMemoryDocument(source.getvalue(), url, parser)  # parse the complete buffer in one go
+
+    # Support for file-like objects (urlgrabber.urlopen, ...)
+    if hasattr(source, u'read'):
+        return _parseFilelikeDocument(source, url, parser)
+
+    raise TypeError, u"cannot parse from '%s'" % python._fqtypename(source).decode('UTF-8')
+
+cdef _Document _parseDocumentFromURL(url, _BaseParser parser):  # parse the file at url into a _Document
+    c_doc = _parseDocFromFile(url, parser)  # raises on failure (declared "except NULL")
+    return _documentFactory(c_doc, parser)
+
+cdef _Document _parseMemoryDocument(text, url, _BaseParser parser):
+    if not isinstance(text, unicode):
+        if not isinstance(text, bytes):
+            raise ValueError(u"can only parse strings")
+    elif _hasEncodingDeclaration(text):
+        # decoded input that still declares an encoding is rejected
+        raise ValueError(
+            u"Unicode strings with encoding declaration are not supported. "
+            u"Please use bytes input or XML fragments without declaration.")
+    return _documentFactory(_parseDoc(text, url, parser), parser)
+
+cdef _Document _parseFilelikeDocument(source, url, _BaseParser parser):  # parse a file-like object into a _Document
+    c_doc = _parseDocFromFilelike(source, url, parser)  # raises on failure (declared "except NULL")
+    return _documentFactory(c_doc, parser)
diff --git a/lib/lxml/parsertarget.pxi b/lib/lxml/parsertarget.pxi
new file mode 100644
index 00000000..28dc8c40
--- /dev/null
+++ b/lib/lxml/parsertarget.pxi
@@ -0,0 +1,168 @@
+# Parser target context (ET target interface)
+
+cdef object inspect_getargspec
+from inspect import getargspec as inspect_getargspec
+
+class _TargetParserResult(Exception):
+    # Admittedly, this is somewhat ugly, but it's the easiest way
+    # to push the Python level parser result through the parser
+    # machinery towards the API level functions
+    def __init__(self, result):
+        self.result = result  # the parse result object that is carried by this exception
+
+@cython.final
+@cython.internal
+cdef class _PythonSaxParserTarget(_SaxParserTarget):  # adapts a Python parser target object to the _SaxParserTarget interface
+    cdef object _target_start
+    cdef object _target_end
+    cdef object _target_data
+    cdef object _target_doctype
+    cdef object _target_pi
+    cdef object _target_comment
+    cdef bint _start_takes_nsmap  # true if start() is called with (tag, attrib, nsmap)
+
+    def __cinit__(self, target):
+        cdef int event_filter
+        event_filter = 0  # collects a SAX_EVENT_* bit for each callback that the target provides
+        self._start_takes_nsmap = 0
+        try:
+            self._target_start = target.start
+            if self._target_start is not None:
+                event_filter |= SAX_EVENT_START
+        except AttributeError:
+            pass
+        else:
+            try:
+                arguments = inspect_getargspec(self._target_start)
+                if len(arguments[0]) > 3 or arguments[1] is not None:  # more than three named arguments or *varargs
+                    self._start_takes_nsmap = 1
+            except TypeError:  # signature could not be inspected: keep the two-argument call
+                pass
+        try:
+            self._target_end = target.end
+            if self._target_end is not None:
+                event_filter |= SAX_EVENT_END
+        except AttributeError:
+            pass
+        try:
+            self._target_data = target.data
+            if self._target_data is not None:
+                event_filter |= SAX_EVENT_DATA
+        except AttributeError:
+            pass
+        try:
+            self._target_doctype = target.doctype
+            if self._target_doctype is not None:
+                event_filter |= SAX_EVENT_DOCTYPE
+        except AttributeError:
+            pass
+        try:
+            self._target_pi = target.pi
+            if self._target_pi is not None:
+                event_filter |= SAX_EVENT_PI
+        except AttributeError:
+            pass
+        try:
+            self._target_comment = target.comment
+            if self._target_comment is not None:
+                event_filter |= SAX_EVENT_COMMENT
+        except AttributeError:
+            pass
+        self._sax_event_filter = event_filter
+
+    cdef _handleSaxStart(self, tag, attrib, nsmap):
+        if self._start_takes_nsmap:
+            return self._target_start(tag, attrib, nsmap)
+        else:
+            return self._target_start(tag, attrib)
+
+    cdef _handleSaxEnd(self, tag):
+        return self._target_end(tag)
+
+    cdef int _handleSaxData(self, data) except -1:
+        self._target_data(data)  # return value of the target's data() is ignored
+
+    cdef int _handleSaxDoctype(self, root_tag, public_id, system_id) except -1:
+        self._target_doctype(root_tag, public_id, system_id)  # return value of the target's doctype() is ignored
+
+    cdef _handleSaxPi(self, target, data):
+        return self._target_pi(target, data)
+
+    cdef _handleSaxComment(self, comment):
+        return self._target_comment(comment)
+
+
+@cython.final
+@cython.internal
+cdef class _TargetParserContext(_SaxParserContext):
+    u"""This class maps SAX2 events to the ET parser target interface.
+    """
+    cdef object _python_target  # the target object as passed in by the user
+    cdef int _setTarget(self, target) except -1:
+        self._python_target = target
+        if not isinstance(target, _SaxParserTarget) or \
+                hasattr(target, u'__dict__'):
+            target = _PythonSaxParserTarget(target)  # wrap it to call its methods through Python attribute lookups
+        self._setSaxParserTarget(target)
+        return 0
+
+    cdef _ParserContext _copy(self):
+        cdef _TargetParserContext context
+        context = _ParserContext._copy(self)
+        context._setTarget(self._python_target)  # the copy feeds the same target object
+        return context
+
+    cdef void _cleanupTargetParserContext(self, xmlDoc* result):
+        if self._c_ctxt.myDoc is not NULL:
+            if self._c_ctxt.myDoc is not result and \
+                    self._c_ctxt.myDoc._private is NULL:
+                # no _Document proxy => orphan
+                tree.xmlFreeDoc(self._c_ctxt.myDoc)
+            self._c_ctxt.myDoc = NULL
+
+    cdef object _handleParseResult(self, _BaseParser parser, xmlDoc* result,
+                                   filename):
+        cdef bint recover
+        recover = parser._parse_options & xmlparser.XML_PARSE_RECOVER
+        try:
+            if self._has_raised():
+                self._cleanupTargetParserContext(result)
+                self._raise_if_stored()
+            if not self._c_ctxt.wellFormed and not recover:
+                _raiseParseError(self._c_ctxt, filename, self._error_log)
+        except:
+            if python.IS_PYTHON3:
+                self._python_target.close()  # close the target even on errors, then re-raise
+                raise
+            else:
+                exc = sys.exc_info()
+                # Python 2 can't chain exceptions
+                try: self._python_target.close()
+                except: pass
+                raise exc[0], exc[1], exc[2]
+        return self._python_target.close()  # the parse result is whatever the target's close() returns
+
+    cdef xmlDoc* _handleParseResultDoc(self, _BaseParser parser,
+                                       xmlDoc* result, filename) except NULL:
+        cdef bint recover
+        recover = parser._parse_options & xmlparser.XML_PARSE_RECOVER
+        if result is not NULL and result._private is NULL:
+            # no _Document proxy => orphan
+            tree.xmlFreeDoc(result)
+        try:
+            self._cleanupTargetParserContext(result)
+            self._raise_if_stored()
+            if not self._c_ctxt.wellFormed and not recover:
+                _raiseParseError(self._c_ctxt, filename, self._error_log)
+        except:
+            if python.IS_PYTHON3:
+                self._python_target.close()  # close the target even on errors, then re-raise
+                raise
+            else:
+                exc = sys.exc_info()
+                # Python 2 can't chain exceptions
+                try: self._python_target.close()
+                except: pass
+                raise exc[0], exc[1], exc[2]
+        parse_result = self._python_target.close()
+        raise _TargetParserResult(parse_result)  # always exits by raising: the result travels inside the exception
diff --git a/lib/lxml/proxy.pxi b/lib/lxml/proxy.pxi
new file mode 100644
index 00000000..52909f69
--- /dev/null
+++ b/lib/lxml/proxy.pxi
@@ -0,0 +1,503 @@
+# Proxy functions and low level node allocation stuff
+
+# Proxies represent elements, their reference is stored in the C
+# structure of the respective node to avoid multiple instantiation of
+# the Python class.
+#
+# In PyPy, we store weak references instead of borrowed back-pointer
+# references as borrowed references cannot be long-lived in its
+# compatibility layer cpyext. Since we can't know when the object dies
+# (and even the weak-ref callback won't tell us that), we double check
+# on access that the object really is still alive and delete the
+# weak-ref if it isn't.
+
+cdef inline _Element getProxy(xmlNode* c_node):
+    u"""Return the Python proxy registered for c_node, or None if the
+    node is NULL or has no proxy reference stored in ``_private``.
+    """
+    if c_node is NULL or c_node._private is NULL:
+        return None
+    if not python.IS_PYPY:
+        # outside of PyPy, _private is the back-pointer to the proxy itself
+        return <_Element>c_node._private
+    # PyPy: _private holds a weak reference that must be resolved first
+    return <_Element>python.PyWeakref_LockObject(<python.PyObject*>c_node._private)
+
+cdef inline bint hasProxy(xmlNode* c_node):
+    if c_node._private is not NULL:
+        # under PyPy, the stored weak reference may already be dead
+        return _isProxyAliveInPypy(c_node) if python.IS_PYPY else True
+    # no back-reference stored => no proxy
+    return False
+
+cdef bint _isProxyAliveInPypy(xmlNode* c_node):  # expects c_node._private to hold a weak reference (see hasProxy)
+    retval = True
+    if python.PyWeakref_LockObject(<python.PyObject*>c_node._private) is None:
+        # proxy has already died => remove weak reference
+        weakref_ptr = <python.PyObject*>c_node._private
+        c_node._private = NULL  # unlink before dropping the reference
+        python.Py_XDECREF(weakref_ptr)
+        retval = False
+    return retval
+
+cdef inline int _registerProxy(_Element proxy, _Document doc,
+                               xmlNode* c_node) except -1:
+    u"""Register a proxy and type for the node it's proxying for.
+    """
+    #print "registering for:", <int>proxy._c_node
+    assert not hasProxy(c_node), u"double registering proxy!"
+    proxy._doc = doc
+    proxy._c_node = c_node
+    if python.IS_PYPY:
+        c_node._private = <void*>python.PyWeakref_NewRef(proxy, NULL)  # PyPy: store a weak reference to the proxy
+    else:
+        c_node._private = <void*>proxy  # otherwise: store the proxy pointer itself
+    return 0
+
+cdef inline int _unregisterProxy(_Element proxy) except -1:
+    u"""Unregister a proxy for the node it's proxying for.
+    """
+    cdef xmlNode* c_node = proxy._c_node
+    if python.IS_PYPY:
+        weakref_ptr = <python.PyObject*>c_node._private
+        c_node._private = NULL  # unlink before dropping the weak reference
+        python.Py_XDECREF(weakref_ptr)
+    else:
+        assert c_node._private is <void*>proxy, u"Tried to unregister unknown proxy"
+        c_node._private = NULL
+    return 0
+
+################################################################################
+# temporarily make a node the root node of its document
+
+cdef xmlDoc* _fakeRootDoc(xmlDoc* c_base_doc, xmlNode* c_node) except NULL:  # shortcut for _plainFakeRootDoc()
+    return _plainFakeRootDoc(c_base_doc, c_node, 1)  # 1 => with_siblings
+
+cdef xmlDoc* _plainFakeRootDoc(xmlDoc* c_base_doc, xmlNode* c_node,
+                               bint with_siblings) except NULL:
+    # build a temporary document that has the given node as root node
+    # note that copy and original must not be modified during its lifetime!!
+    # always call _destroyFakeDoc() after use!
+    # raises MemoryError if the document or the root node cannot be copied
+    cdef xmlNode* c_child
+    cdef xmlNode* c_new_root
+    cdef xmlDoc*  c_doc
+    if with_siblings or (c_node.prev is NULL and c_node.next is NULL):
+        if tree.xmlDocGetRootElement(c_base_doc) is c_node:
+            # already the root node, no siblings
+            return c_base_doc
+
+    c_doc  = _copyDoc(c_base_doc, 0)                   # non recursive!
+    c_new_root = tree.xmlDocCopyNode(c_node, c_doc, 2) # non recursive!
+    if c_new_root is NULL:
+        tree.xmlFreeDoc(c_doc) # drop the empty copy instead of using a NULL root
+        raise MemoryError()
+    tree.xmlDocSetRootElement(c_doc, c_new_root)
+    _copyParentNamespaces(c_node, c_new_root)
+
+    c_new_root.children = c_node.children
+    c_new_root.last = c_node.last
+    c_new_root.next = c_new_root.prev = NULL
+
+    # store original node
+    c_doc._private = c_node
+    # divert parent pointers of children
+    c_child = c_new_root.children
+    while c_child is not NULL:
+        c_child.parent = c_new_root
+        c_child = c_child.next
+    c_doc.children = c_new_root
+    return c_doc
+
+cdef void _destroyFakeDoc(xmlDoc* c_base_doc, xmlDoc* c_doc):
+    # delete a temporary document
+    cdef xmlNode* c_child
+    cdef xmlNode* c_parent
+    cdef xmlNode* c_root
+    if c_doc is c_base_doc:  # no fake document was built, nothing to undo
+        return
+    c_root = tree.xmlDocGetRootElement(c_doc)
+
+    # restore parent pointers of children
+    c_parent = <xmlNode*>c_doc._private  # the original node, as stored by _plainFakeRootDoc()
+    c_child = c_root.children
+    while c_child is not NULL:
+        c_child.parent = c_parent
+        c_child = c_child.next
+
+    # prevent recursive removal of children
+    c_root.children = c_root.last = NULL
+    tree.xmlFreeDoc(c_doc)
+
+cdef _Element _fakeDocElementFactory(_Document doc, xmlNode* c_element):
+    u"""Special element factory for cases where we need to create a fake
+    root document, but still need to instantiate arbitrary nodes from
+    it.  If we instantiate the fake root node, things will turn bad
+    when it's destroyed.
+
+    Instead, if we are asked to instantiate the fake root node, we
+    instantiate the original node instead.
+    """
+    if c_element.doc is not doc._c_doc:  # node lives in a different (possibly fake) document
+        if c_element.doc._private is not NULL:  # fake documents store their original node here
+            if c_element is c_element.doc.children:  # it is the fake root node itself
+                c_element = <xmlNode*>c_element.doc._private
+                #assert c_element.type == tree.XML_ELEMENT_NODE
+    return _elementFactory(doc, c_element)
+
+################################################################################
+# support for freeing tree elements when proxy objects are destroyed
+
+cdef int attemptDeallocation(xmlNode* c_node):
+    u"""Free the subtree that contains c_node if it can be deallocated.
+
+    Returns 1 if a subtree (including its tail text) was freed, else 0.
+    """
+    cdef xmlNode* c_subtree_top
+    if c_node is NULL:
+        # the caller did not refer to a tree node at all
+        return 0
+    c_subtree_top = getDeallocationTop(c_node)
+    if c_subtree_top is NULL:
+        return 0
+    _removeText(c_subtree_top.next) # tail
+    tree.xmlFreeNode(c_subtree_top)
+    return 1
+
+cdef xmlNode* getDeallocationTop(xmlNode* c_node):
+    u"""Return the top of the tree that can be deallocated, or NULL.
+    """
+    #print "trying to do deallocating:", c_node.type
+    if hasProxy(c_node):
+        #print "Not freeing: proxies still exist"
+        return NULL
+    while c_node.parent is not NULL:
+        c_node = c_node.parent
+        #print "checking:", c_current.type
+        if c_node.type == tree.XML_DOCUMENT_NODE or \
+               c_node.type == tree.XML_HTML_DOCUMENT_NODE:
+            #print "not freeing: still in doc"
+            return NULL
+        # an ancestor that still has a proxy also prevents deallocation
+        if hasProxy(c_node):
+            #print "Not freeing: proxies still exist"
+            return NULL
+    # see whether we have children to deallocate
+    if canDeallocateChildNodes(c_node):
+        return c_node
+    else:
+        return NULL
+
+cdef int canDeallocateChildNodes(xmlNode* c_parent):  # returns 0 if a node visited by the macro loop below still has a proxy, else 1
+    cdef xmlNode* c_node
+    c_node = c_parent.children
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_parent, c_node, 1)  # loop macro: the lines up to END_... form the loop body
+    if hasProxy(c_node):
+        return 0
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+    return 1
+
+################################################################################
+# fix _Document references and namespaces when a node changes documents
+
+cdef void _copyParentNamespaces(xmlNode* c_from_node, xmlNode* c_to_node) nogil:
+    u"""Copy the namespaces of all ancestors of c_from_node to c_to_node.
+
+    Walks up the parent chain while it consists of element/XInclude nodes
+    or an XML document node and re-declares each nsDef entry on c_to_node.
+    """
+    cdef xmlNode* c_parent
+    cdef xmlNs* c_new_ns
+    c_parent = c_from_node.parent
+    while c_parent and (tree._isElementOrXInclude(c_parent) or
+                        c_parent.type == tree.XML_DOCUMENT_NODE):
+        c_new_ns = c_parent.nsDef
+        while c_new_ns:
+            # libxml2 will check if the prefix is already defined
+            tree.xmlNewNs(c_to_node, c_new_ns.href, c_new_ns.prefix)
+            c_new_ns = c_new_ns.next
+
+ctypedef struct _nscache:  # two parallel arrays mapping old xmlNs pointers to their replacements
+    xmlNs** new  # new[i] is the namespace to use in place of old[i]
+    xmlNs** old  # namespaces as found on the nodes that are being moved
+    size_t size  # allocated capacity of both arrays, in entries
+    size_t last  # number of entries in use (index of the next free slot)
+
+cdef int _growNsCache(_nscache* c_ns_cache) except -1:  # enlarge both cache arrays; frees them and raises MemoryError on failure
+    cdef xmlNs** c_ns_ptr
+    if c_ns_cache.size == 0:
+        c_ns_cache.size = 20  # initial capacity
+    else:
+        c_ns_cache.size *= 2  # double the capacity on each further call
+    c_ns_ptr = <xmlNs**> stdlib.realloc(
+        c_ns_cache.new, c_ns_cache.size * sizeof(xmlNs*))
+    if c_ns_ptr is not NULL:
+        c_ns_cache.new = c_ns_ptr
+        c_ns_ptr = <xmlNs**> stdlib.realloc(
+            c_ns_cache.old, c_ns_cache.size * sizeof(xmlNs*))
+    if c_ns_ptr is not NULL:  # only true if both reallocations succeeded
+        c_ns_cache.old = c_ns_ptr
+    else:
+        stdlib.free(c_ns_cache.new)  # NOTE(review): the struct keeps the freed pointers, callers must not reuse it
+        stdlib.free(c_ns_cache.old)
+        raise MemoryError()
+    return 0
+
+cdef inline int _appendToNsCache(_nscache* c_ns_cache,
+                                 xmlNs* c_old_ns, xmlNs* c_new_ns) except -1:  # record the mapping c_old_ns -> c_new_ns
+    if c_ns_cache.last >= c_ns_cache.size:
+        _growNsCache(c_ns_cache)  # may raise MemoryError
+    c_ns_cache.old[c_ns_cache.last] = c_old_ns
+    c_ns_cache.new[c_ns_cache.last] = c_new_ns
+    c_ns_cache.last += 1
+
+cdef int _stripRedundantNamespaceDeclarations(
+    xmlNode* c_element, _nscache* c_ns_cache, xmlNs** c_del_ns_list) except -1:
+    u"""Removes namespace declarations from an element that are already
+    defined in its parents.  Does not free the xmlNs's, just prepends
+    them to the c_del_ns_list.
+    """
+    cdef xmlNs* c_ns
+    cdef xmlNs* c_ns_next
+    cdef xmlNs** c_nsdef
+    # use a xmlNs** to handle assignments to "c_element.nsDef" correctly
+    c_nsdef = &c_element.nsDef
+    while c_nsdef[0] is not NULL:
+        c_ns = tree.xmlSearchNsByHref(
+            c_element.doc, c_element.parent, c_nsdef[0].href)  # look the href up starting at the parent
+        if c_ns is NULL:
+            # new namespace href => keep and cache the ns declaration
+            _appendToNsCache(c_ns_cache, c_nsdef[0], c_nsdef[0])
+            c_nsdef = &c_nsdef[0].next  # advance to the next declaration
+        else:
+            # known namespace href => cache mapping and strip old ns
+            _appendToNsCache(c_ns_cache, c_nsdef[0], c_ns)
+            # cut out the current declaration and prepend it to garbage chain
+            c_ns_next = c_nsdef[0].next
+            c_nsdef[0].next = c_del_ns_list[0]
+            c_del_ns_list[0] = c_nsdef[0]
+            c_nsdef[0] = c_ns_next  # the slot now holds the successor, so no advance is needed
+    return 0
+
+cdef int moveNodeToDocument(_Document doc, xmlDoc* c_source_doc,
+                            xmlNode* c_element) except -1:
+    u"""Fix the xmlNs pointers of a node and its subtree that were moved.
+
+    Originally copied from libxml2's xmlReconciliateNs().  Expects
+    libxml2 doc pointers of node to be correct already, but fixes
+    _Document references.
+
+    For each node in the subtree, we do this:
+
+    1) Remove redundant declarations of namespace that are already
+       defined in its parents.
+
+    2) Replace namespaces that are *not* defined on the node or its
+       parents by the equivalent namespace declarations that *are*
+       defined on the node or its parents (possibly using a different
+       prefix).  If a namespace is unknown, declare a new one on the
+       node.
+
+    3) Reassign the names of tags and attribute from the dict of the
+       target document *iff* it is different from the dict used in the
+       source subtree.
+
+    4) Set the Document reference to the new Document (if different).
+       This is done on backtracking to keep the original Document
+       alive as long as possible, until all its elements are updated.
+
+    Note that the namespace declarations are removed from the tree in
+    step 1), but freed only after the complete subtree was traversed
+    and all occurrences were replaced by tree-internal pointers.
+    """
+    cdef xmlNode* c_start_node
+    cdef xmlNode* c_node
+    cdef char* c_name  # NOTE(review): not used in this function
+    cdef _nscache c_ns_cache
+    cdef xmlNs* c_ns
+    cdef xmlNs* c_ns_next  # NOTE(review): not used in this function
+    cdef xmlNs* c_nsdef  # NOTE(review): not used in this function
+    cdef xmlNs* c_del_ns_list
+    cdef size_t i, proxy_count = 0
+
+    if not tree._isElementOrXInclude(c_element):
+        return 0
+
+    c_start_node = c_element  # remember the subtree root, c_element is advanced by the loop below
+    c_del_ns_list = NULL
+
+    c_ns_cache.new = NULL
+    c_ns_cache.old = NULL
+    c_ns_cache.size = 0
+    c_ns_cache.last = 0
+
+    # NOTE(review): an exception raised inside this loop skips the cleanup code after it
+    tree.BEGIN_FOR_EACH_FROM(c_element, c_element, 1)
+    if tree._isElementOrXInclude(c_element):
+        if hasProxy(c_element):
+            proxy_count += 1
+
+        # 1) cut out namespaces defined here that are already known by
+        #    the ancestors
+        if c_element.nsDef is not NULL:
+            _stripRedundantNamespaceDeclarations(
+                c_element, &c_ns_cache, &c_del_ns_list)
+
+        # 2) make sure the namespaces of an element and its attributes
+        #    are declared in this document (i.e. on the node or its parents)
+        c_node = c_element
+        while c_node is not NULL:
+            if c_node.ns is not NULL:
+                c_ns = NULL
+                for i in range(c_ns_cache.last):  # linear search for an already known replacement
+                    if c_node.ns is c_ns_cache.old[i]:
+                        if (c_node.type == tree.XML_ATTRIBUTE_NODE
+                                and c_node.ns.prefix
+                                and not c_ns_cache.new[i].prefix):
+                            # avoid dropping prefix from attributes
+                            continue
+                        c_ns = c_ns_cache.new[i]
+                        break
+
+                if not c_ns:
+                    # not in cache or not acceptable
+                    # => find a replacement from this document
+                    c_ns = doc._findOrBuildNodeNs(
+                        c_start_node, c_node.ns.href, c_node.ns.prefix,
+                        c_node.type == tree.XML_ATTRIBUTE_NODE)
+                    _appendToNsCache(&c_ns_cache, c_node.ns, c_ns)
+                c_node.ns = c_ns
+
+            if c_node is c_element:
+                # after the element, continue with its attributes
+                c_node = <xmlNode*>c_element.properties
+            else:
+                c_node = c_node.next
+    tree.END_FOR_EACH_FROM(c_element)
+
+    # free now unused namespace declarations
+    if c_del_ns_list is not NULL:
+        tree.xmlFreeNsList(c_del_ns_list)
+
+    # cleanup
+    if c_ns_cache.new is not NULL:
+        stdlib.free(c_ns_cache.new)
+    if c_ns_cache.old is not NULL:
+        stdlib.free(c_ns_cache.old)
+
+    # 3) fix the names in the tree if we moved it from a different thread
+    if doc._c_doc.dict is not c_source_doc.dict:
+        fixThreadDictNames(c_start_node, c_source_doc.dict, doc._c_doc.dict)
+
+    # 4) fix _Document references
+    #    (and potentially deallocate the source document)
+    if proxy_count > 0:
+        if proxy_count == 1 and c_start_node._private is not NULL:
+            proxy = getProxy(c_start_node)  # shortcut: the only proxy may be the one of the start node
+            if proxy is not None:
+                if proxy._doc is not doc:
+                    proxy._doc = doc
+            else:
+                fixElementDocument(c_start_node, doc, proxy_count)
+        else:
+            fixElementDocument(c_start_node, doc, proxy_count)
+
+    return 0
+
+
+cdef void fixElementDocument(xmlNode* c_element, _Document doc,
+                             size_t proxy_count):  # point the proxies found in the subtree of c_element to doc
+    cdef xmlNode* c_node = c_element
+    cdef _Element proxy = None # init-to-None required due to fake-loop below
+    tree.BEGIN_FOR_EACH_FROM(c_element, c_node, 1)
+    if c_node._private is not NULL:
+        proxy = getProxy(c_node)
+        if proxy is not None:
+            if proxy._doc is not doc:
+                proxy._doc = doc
+            proxy_count -= 1
+            if proxy_count == 0:  # all proxies that the caller counted were handled: stop early
+                return
+    tree.END_FOR_EACH_FROM(c_node)
+
+cdef void fixThreadDictNames(xmlNode* c_element,
+                             tree.xmlDict* c_src_dict,
+                             tree.xmlDict* c_dict) nogil:
+    # re-assign the names of tags and attributes
+    #
+    # this should only be called when the element is based on a
+    # different libxml2 tag name dictionary
+    if c_element.type == tree.XML_DOCUMENT_NODE or \
+            c_element.type == tree.XML_HTML_DOCUMENT_NODE:
+        # may define "xml" namespace
+        fixThreadDictNsForNode(c_element, c_src_dict, c_dict)
+        c_element = c_element.children
+        while c_element is not NULL:  # fix each top-level node of the document in turn
+            fixThreadDictNamesForNode(c_element, c_src_dict, c_dict)
+            c_element = c_element.next
+    elif tree._isElementOrXInclude(c_element):  # any other node type is left untouched
+        fixThreadDictNamesForNode(c_element, c_src_dict, c_dict)
+
+cdef void fixThreadDictNamesForNode(xmlNode* c_element,
+                                    tree.xmlDict* c_src_dict,
+                                    tree.xmlDict* c_dict) nogil:
+    # Traverse the tree starting at c_element and move all strings that
+    # are owned by c_src_dict over to c_dict: node names, attribute names
+    # and values, namespace declarations and dict-interned text content.
+    cdef xmlNode* c_node = c_element
+    tree.BEGIN_FOR_EACH_FROM(c_element, c_node, 1)
+    if c_node.name is not NULL:
+        fixThreadDictNameForNode(c_node, c_src_dict, c_dict)
+    if c_node.type in (tree.XML_ELEMENT_NODE, tree.XML_XINCLUDE_START):
+        # these node types are also checked for attributes and
+        # namespace declarations
+        fixThreadDictNamesForAttributes(
+            c_node.properties, c_src_dict, c_dict)
+        fixThreadDictNsForNode(c_node, c_src_dict, c_dict)
+    elif c_node.type == tree.XML_TEXT_NODE:
+        # libxml2's SAX2 parser interns some indentation space
+        fixThreadDictContentForNode(c_node, c_src_dict, c_dict)
+    tree.END_FOR_EACH_FROM(c_node)
+
+cdef inline void fixThreadDictNamesForAttributes(tree.xmlAttr* c_attr,
+                                                 tree.xmlDict* c_src_dict,
+                                                 tree.xmlDict* c_dict) nogil:
+    # Follow the sibling chain that starts at c_attr and re-home the name
+    # of every attribute as well as the content of its child nodes.
+    cdef xmlNode* c_value
+    cdef xmlNode* c_current = <xmlNode*>c_attr
+    while c_current is not NULL:
+        fixThreadDictNameForNode(c_current, c_src_dict, c_dict)
+        # libxml2 keeps some (!) attribute values in the dict
+        c_value = c_current.children
+        while c_value is not NULL:
+            fixThreadDictContentForNode(c_value, c_src_dict, c_dict)
+            c_value = c_value.next
+        c_current = c_current.next
+
+cdef inline void fixThreadDictNameForNode(xmlNode* c_node,
+                                          tree.xmlDict* c_src_dict,
+                                          tree.xmlDict* c_dict) nogil:
+    # Replace the name of c_node by the equal string from c_dict if the
+    # current name string is owned by c_src_dict.  Text and comment nodes
+    # are left alone.
+    cdef const_xmlChar* c_new_name
+    if c_node.name is NULL:
+        return
+    if c_node.type == tree.XML_TEXT_NODE or \
+            c_node.type == tree.XML_COMMENT_NODE:
+        return
+    if not tree.xmlDictOwns(c_src_dict, c_node.name):
+        return
+    # the lookup can return NULL on memory error; in that case the
+    # old name is kept as is
+    c_new_name = tree.xmlDictLookup(c_dict, c_node.name, -1)
+    if c_new_name is not NULL:
+        c_node.name = c_new_name
+
+cdef inline void fixThreadDictContentForNode(xmlNode* c_node,
+                                             tree.xmlDict* c_src_dict,
+                                             tree.xmlDict* c_dict) nogil:
+    # Replace the content string of c_node by the equal string from c_dict
+    # if the current string is owned by c_src_dict.
+    if c_node.content is NULL:
+        return
+    if c_node.content is <xmlChar*>&c_node.properties:
+        # content points into the node struct itself, nothing to re-home
+        return
+    if tree.xmlDictOwns(c_src_dict, c_node.content):
+        # result can be NULL on memory error, but we don't handle that here
+        c_node.content = <xmlChar*>tree.xmlDictLookup(c_dict, c_node.content, -1)
+
+cdef inline void fixThreadDictNsForNode(xmlNode* c_node,
+                                        tree.xmlDict* c_src_dict,
+                                        tree.xmlDict* c_dict) nogil:
+    # Run over the namespace declarations of c_node (its nsDef list) and
+    # re-home every href and prefix string that c_src_dict owns.
+    cdef xmlNs* c_decl = c_node.nsDef
+    while c_decl is not NULL:
+        if c_decl.href is not NULL and \
+                tree.xmlDictOwns(c_src_dict, c_decl.href):
+            c_decl.href = tree.xmlDictLookup(c_dict, c_decl.href, -1)
+        if c_decl.prefix is not NULL and \
+                tree.xmlDictOwns(c_src_dict, c_decl.prefix):
+            c_decl.prefix = tree.xmlDictLookup(c_dict, c_decl.prefix, -1)
+        c_decl = c_decl.next
diff --git a/lib/lxml/public-api.pxi b/lib/lxml/public-api.pxi
new file mode 100644
index 00000000..128e25d3
--- /dev/null
+++ b/lib/lxml/public-api.pxi
@@ -0,0 +1,172 @@
+# Public C API for lxml.etree
+
+cdef public api _Element deepcopyNodeToDocument(_Document doc, xmlNode* c_root):
+    u"Recursively copy the element into the document. doc is not modified."
+    # The copy is created by _copyNodeToDoc() for doc._c_doc and then
+    # wrapped in an element proxy that belongs to 'doc'.
+    cdef xmlNode* c_node
+    c_node = _copyNodeToDoc(c_root, doc._c_doc)
+    return _elementFactory(doc, c_node)
+
+cdef public api _ElementTree elementTreeFactory(_Element context_node):
+    # Create a plain _ElementTree for the given context node.
+    #
+    # All argument validation is left to newElementTree(), which first
+    # rejects NULL/None (TypeError) and only then asserts that the node is
+    # valid.  Asserting here as well would dereference context_node before
+    # it has been checked against None.
+    return newElementTree(context_node, _ElementTree)
+
+cdef public api _ElementTree newElementTree(_Element context_node,
+                                            object subclass):
+    # Create an element tree object of type 'subclass' for the context node
+    # and its document.  Raises TypeError if context_node is NULL or None.
+    if <void*>context_node is NULL or context_node is None:
+        raise TypeError
+    _assertValidNode(context_node)
+    return _newElementTree(context_node._doc, context_node, subclass)
+
+cdef public api _Element elementFactory(_Document doc, xmlNode* c_node):
+    # Public wrapper around _elementFactory().
+    # Raises TypeError if c_node is NULL or doc is None.
+    if c_node is NULL or doc is None:
+        raise TypeError
+    return _elementFactory(doc, c_node)
+
+cdef public api _Element makeElement(tag, _Document doc, parser,
+                                     text, tail, attrib, nsmap):
+    # Public wrapper around _makeElement(); passes NULL and None for the
+    # two arguments of _makeElement() that are not exposed here.
+    return _makeElement(tag, NULL, doc, parser, text, tail, attrib, nsmap, None)
+
+cdef public api _Element makeSubElement(_Element parent, tag, text, tail,
+                                        attrib, nsmap):
+    # Public wrapper around _makeSubElement(); asserts that 'parent' is a
+    # valid node first and passes None for the last internal argument.
+    _assertValidNode(parent)
+    return _makeSubElement(parent, tag, text, tail, attrib, nsmap, None)
+
+cdef public api void setElementClassLookupFunction(
+    _element_class_lookup_function function, state):
+    # Public wrapper around _setElementClassLookupFunction().
+    _setElementClassLookupFunction(function, state)
+
+cdef public api object lookupDefaultElementClass(state, doc, xmlNode* c_node):
+    # Public wrapper around _lookupDefaultElementClass().
+    return _lookupDefaultElementClass(state, doc, c_node)
+
+cdef public api object lookupNamespaceElementClass(state, doc, xmlNode* c_node):
+    # Public wrapper around _find_nselement_class().
+    return _find_nselement_class(state, doc, c_node)
+
+cdef public api object callLookupFallback(FallbackElementClassLookup lookup,
+                                          _Document doc, xmlNode* c_node):
+    # Public wrapper around _callLookupFallback().
+    return _callLookupFallback(lookup, doc, c_node)
+
+cdef public api int tagMatches(xmlNode* c_node, const_xmlChar* c_href, const_xmlChar* c_name):
+    # Public wrapper around _tagMatches().
+    # Returns -1 without calling it if c_node is NULL.
+    if c_node is NULL:
+        return -1
+    return _tagMatches(c_node, c_href, c_name)
+
+cdef public api _Document documentOrRaise(object input):
+    # Public wrapper around _documentOrRaise().
+    return _documentOrRaise(input)
+
+cdef public api _Element rootNodeOrRaise(object input):
+    # Public wrapper around _rootNodeOrRaise().
+    return _rootNodeOrRaise(input)
+
+cdef public api bint hasText(xmlNode* c_node):
+    # Public wrapper around _hasText(); c_node is passed on unchecked.
+    return _hasText(c_node)
+
+cdef public api bint hasTail(xmlNode* c_node):
+    # Public wrapper around _hasTail(); c_node is passed on unchecked.
+    return _hasTail(c_node)
+
+cdef public api object textOf(xmlNode* c_node):
+    # Collect the text that starts at the first child of c_node.
+    # Returns None if c_node is NULL.
+    if c_node is NULL:
+        return None
+    return _collectText(c_node.children)
+
+cdef public api object tailOf(xmlNode* c_node):
+    # Collect the text that starts at the next sibling of c_node.
+    # Returns None if c_node is NULL.
+    if c_node is NULL:
+        return None
+    return _collectText(c_node.next)
+
+cdef public api int setNodeText(xmlNode* c_node, text) except -1:
+    # Public wrapper around _setNodeText().
+    # Raises ValueError if c_node is NULL.
+    if c_node is NULL:
+        raise ValueError
+    return _setNodeText(c_node, text)
+
+cdef public api int setTailText(xmlNode* c_node, text) except -1:
+    # Public wrapper around _setTailText().
+    # Raises ValueError if c_node is NULL.
+    if c_node is NULL:
+        raise ValueError
+    return _setTailText(c_node, text)
+
+cdef public api object attributeValue(xmlNode* c_element, xmlAttr* c_attrib_node):
+    # Public wrapper around _attributeValue().
+    return _attributeValue(c_element, c_attrib_node)
+
+cdef public api object attributeValueFromNsName(xmlNode* c_element,
+                                                const_xmlChar* ns, const_xmlChar* name):
+    # Public wrapper around _attributeValueFromNsName().
+    return _attributeValueFromNsName(c_element, ns, name)
+
+cdef public api object getAttributeValue(_Element element, key, default):
+    # Public wrapper around _getAttributeValue(); asserts that 'element'
+    # is a valid node first.
+    _assertValidNode(element)
+    return _getAttributeValue(element, key, default)
+
+cdef public api object iterattributes(_Element element, int keysvalues):
+    # Public wrapper around _attributeIteratorFactory(); asserts that
+    # 'element' is a valid node first.
+    _assertValidNode(element)
+    return _attributeIteratorFactory(element, keysvalues)
+
+cdef public api list collectAttributes(xmlNode* c_element, int keysvalues):
+    # Public wrapper around _collectAttributes().
+    return _collectAttributes(c_element, keysvalues)
+
+cdef public api int setAttributeValue(_Element element, key, value) except -1:
+    # Public wrapper around _setAttributeValue(); asserts that 'element'
+    # is a valid node first.
+    _assertValidNode(element)
+    return _setAttributeValue(element, key, value)
+
+cdef public api int delAttribute(_Element element, key) except -1:
+    # Public wrapper around _delAttribute(); asserts that 'element' is a
+    # valid node first.
+    _assertValidNode(element)
+    return _delAttribute(element, key)
+
+cdef public api int delAttributeFromNsName(tree.xmlNode* c_element,
+                                           const_xmlChar* c_href, const_xmlChar* c_name):
+    # Public wrapper around _delAttributeFromNsName().
+    return _delAttributeFromNsName(c_element, c_href, c_name)
+
+cdef public api bint hasChild(xmlNode* c_node):
+    # Public wrapper around _hasChild().
+    return _hasChild(c_node)
+
+cdef public api xmlNode* findChild(xmlNode* c_node, Py_ssize_t index):
+    # Public wrapper around _findChild().
+    return _findChild(c_node, index)
+
+cdef public api xmlNode* findChildForwards(xmlNode* c_node, Py_ssize_t index):
+    # Public wrapper around _findChildForwards().
+    return _findChildForwards(c_node, index)
+
+cdef public api xmlNode* findChildBackwards(xmlNode* c_node, Py_ssize_t index):
+    # Public wrapper around _findChildBackwards().
+    return _findChildBackwards(c_node, index)
+
+cdef public api xmlNode* nextElement(xmlNode* c_node):
+    # Public wrapper around _nextElement().
+    return _nextElement(c_node)
+
+cdef public api xmlNode* previousElement(xmlNode* c_node):
+    # Public wrapper around _previousElement().
+    return _previousElement(c_node)
+
+cdef public api void appendChild(_Element parent, _Element child):
+    # deprecated, use appendChildToElement() instead!
+    # NOTE: the result of _appendChild() is dropped here because this
+    # function is declared 'void'; appendChildToElement() returns it.
+    _appendChild(parent, child)
+
+cdef public api int appendChildToElement(_Element parent, _Element child) except -1:
+    # Public wrapper around _appendChild() that returns its result
+    # (declared 'except -1').
+    return _appendChild(parent, child)
+
+cdef public api object pyunicode(const_xmlChar* s):
+    # Public wrapper around funicode().
+    # Raises TypeError if s is NULL.
+    if s is NULL:
+        raise TypeError
+    return funicode(s)
+
+cdef public api bytes utf8(object s):
+    # Public wrapper around _utf8(); the result is a bytes object.
+    return _utf8(s)
+
+cdef public api tuple getNsTag(object tag):
+    # Public wrapper around _getNsTag(); the result is a tuple.
+    return _getNsTag(tag)
+
+cdef public api tuple getNsTagWithEmptyNs(object tag):
+    # Public wrapper around _getNsTagWithEmptyNs(); the result is a tuple.
+    return _getNsTagWithEmptyNs(tag)
+
+cdef public api object namespacedName(xmlNode* c_node):
+    # Public wrapper around _namespacedName().
+    return _namespacedName(c_node)
+
+cdef public api object namespacedNameFromNsName(const_xmlChar* href, const_xmlChar* name):
+    # Public wrapper around _namespacedNameFromNsName().
+    return _namespacedNameFromNsName(href, name)
+
+cdef public api void iteratorStoreNext(_ElementIterator iterator, _Element node):
+    # deprecated!
+    # Forwards to the iterator's own _storeNext() method.
+    iterator._storeNext(node)
+
+cdef public api void initTagMatch(_ElementTagMatcher matcher, tag):
+    # deprecated!
+    # Forwards to the matcher's own _initTagMatch() method.
+    matcher._initTagMatch(tag)
+
+cdef public api tree.xmlNs* findOrBuildNodeNsPrefix(
+        _Document doc, xmlNode* c_node, const_xmlChar* href, const_xmlChar* prefix) except NULL:
+    # Public wrapper around doc._findOrBuildNodeNs(), called with 0 as its
+    # last argument.  Raises TypeError if doc is None.
+    if doc is None:
+        raise TypeError
+    return doc._findOrBuildNodeNs(c_node, href, prefix, 0)
diff --git a/lib/lxml/pyclasslookup.py b/lib/lxml/pyclasslookup.py
new file mode 100644
index 00000000..32c010cf
--- /dev/null
+++ b/lib/lxml/pyclasslookup.py
@@ -0,0 +1,3 @@
+# dummy module for backwards compatibility
+
+from etree import PythonElementClassLookup
diff --git a/lib/lxml/python.pxd b/lib/lxml/python.pxd
new file mode 100644
index 00000000..1d070860
--- /dev/null
+++ b/lib/lxml/python.pxd
@@ -0,0 +1,135 @@
+from libc cimport stdio
+from libc.string cimport const_char
+cimport cython
+
+cdef extern from *:
+    cdef bint PEP393_ENABLED "CYTHON_PEP393_ENABLED"
+
+cdef extern from "Python.h":
+    ctypedef struct PyObject
+    ctypedef struct PyThreadState
+    cdef int PY_SSIZE_T_MAX
+    cdef int PY_VERSION_HEX
+
+    cdef void Py_INCREF(object o)
+    cdef void Py_DECREF(object o)
+    cdef void Py_XDECREF(PyObject* o)
+
+    cdef stdio.FILE* PyFile_AsFile(object p)
+
+    # PEP 393
+    cdef bint PyUnicode_IS_READY(object u)
+    cdef Py_ssize_t PyUnicode_GET_LENGTH(object u)
+    cdef int PyUnicode_KIND(object u)
+    cdef void* PyUnicode_DATA(object u)
+
+    cdef bytes PyUnicode_AsEncodedString(object u, char* encoding,
+                                         char* errors)
+    cdef cython.unicode PyUnicode_FromFormat(char* format, ...) # Python 3
+    cdef cython.unicode PyUnicode_Decode(char* s, Py_ssize_t size,
+                                         char* encoding, char* errors)
+    cdef cython.unicode PyUnicode_DecodeUTF8(char* s, Py_ssize_t size, char* errors)
+    cdef cython.unicode PyUnicode_DecodeLatin1(char* s, Py_ssize_t size, char* errors)
+    cdef object PyUnicode_RichCompare(object o1, object o2, int op)  # not in Py2.4
+    cdef bytes PyUnicode_AsUTF8String(object ustring)
+    cdef bytes PyUnicode_AsASCIIString(object ustring)
+    cdef char* PyUnicode_AS_DATA(object ustring)
+    cdef Py_ssize_t PyUnicode_GET_DATA_SIZE(object ustring)
+    cdef Py_ssize_t PyUnicode_GET_SIZE(object ustring)
+    cdef bytes PyBytes_FromStringAndSize(char* s, Py_ssize_t size)
+    cdef bytes PyBytes_FromFormat(char* format, ...)
+    cdef Py_ssize_t PyBytes_GET_SIZE(object s)
+
+    cdef object PyNumber_Int(object value)
+    cdef Py_ssize_t PyInt_AsSsize_t(object value)
+
+    cdef Py_ssize_t PyTuple_GET_SIZE(object t)
+    cdef object PyTuple_GET_ITEM(object o, Py_ssize_t pos)
+
+    cdef object PyList_New(Py_ssize_t index)
+    cdef Py_ssize_t PyList_GET_SIZE(object l)
+    cdef object PyList_GET_ITEM(object l, Py_ssize_t index)
+    cdef void PyList_SET_ITEM(object l, Py_ssize_t index, object value)
+    cdef int PyList_Insert(object l, Py_ssize_t index, object o) except -1
+    cdef object PyList_AsTuple(object l)
+    cdef void PyList_Clear(object l)
+
+#    cdef int PyDict_SetItemString(object d, char* key, object value) except -1
+#    cdef int PyDict_SetItem(object d, object key, object value) except -1
+    cdef PyObject* PyDict_GetItemString(object d, char* key)
+    cdef PyObject* PyDict_GetItem(object d, object key)
+#    cdef int PyDict_DelItem(object d, object key) except -1
+    cdef void PyDict_Clear(object d)
+#    cdef object PyDict_Copy(object d)
+    cdef object PyDictProxy_New(object d)
+    # cdef int PyDict_Contains(object d, object key) except -1 # Python 2.4+
+    cdef Py_ssize_t PyDict_Size(object d)
+    cdef object PySequence_List(object o)
+    cdef object PySequence_Tuple(object o)
+
+    cdef bint PyNumber_Check(object instance)
+    cdef bint PySequence_Check(object instance)
+    cdef bint PyType_Check(object instance)
+    cdef bint PyTuple_CheckExact(object instance)
+
+    cdef int _PyEval_SliceIndex(object value, Py_ssize_t* index) except 0
+    cdef int PySlice_GetIndicesEx "_lx_PySlice_GetIndicesEx" (
+            object slice, Py_ssize_t length,
+            Py_ssize_t *start, Py_ssize_t *stop, Py_ssize_t *step,
+            Py_ssize_t *slicelength) except -1
+
+    cdef object PyObject_RichCompare(object o1, object o2, int op)
+    cdef int PyObject_RichCompareBool(object o1, object o2, int op)
+
+    PyObject* PyWeakref_NewRef(object ob, PyObject* callback) except NULL  # used for PyPy only
+    object PyWeakref_LockObject(PyObject* ob) # PyPy only
+
+    cdef void* PyMem_Malloc(size_t size)
+    cdef void* PyMem_Realloc(void* p, size_t size)
+    cdef void PyMem_Free(void* p)
+
+    # always returns NULL to pass on the exception
+    cdef object PyErr_SetFromErrno(object type)
+
+    cdef PyThreadState* PyEval_SaveThread()
+    cdef void PyEval_RestoreThread(PyThreadState* state)
+    cdef PyObject* PyThreadState_GetDict()
+
+    # some handy functions
+    cdef char* _cstr "PyBytes_AS_STRING" (object s)
+    cdef char* __cstr "PyBytes_AS_STRING" (PyObject* s)
+
+    # Py_buffer related flags
+    cdef int PyBUF_SIMPLE
+    cdef int PyBUF_WRITABLE
+    cdef int PyBUF_LOCK
+    cdef int PyBUF_FORMAT
+    cdef int PyBUF_ND
+    cdef int PyBUF_STRIDES
+    cdef int PyBUF_C_CONTIGUOUS
+    cdef int PyBUF_F_CONTIGUOUS
+    cdef int PyBUF_ANY_CONTIGUOUS
+    cdef int PyBUF_INDIRECT
+
+cdef extern from "pythread.h":
+    ctypedef void* PyThread_type_lock
+    cdef PyThread_type_lock PyThread_allocate_lock()
+    cdef void PyThread_free_lock(PyThread_type_lock lock)
+    cdef int  PyThread_acquire_lock(PyThread_type_lock lock, int mode) nogil
+    cdef void PyThread_release_lock(PyThread_type_lock lock)
+    cdef long PyThread_get_thread_ident()
+
+    ctypedef enum __WaitLock:
+        WAIT_LOCK
+        NOWAIT_LOCK
+
+cdef extern from "etree_defs.h": # redefines some functions as macros
+    cdef bint _isString(object obj)
+    cdef const_char* _fqtypename(object t)
+    cdef object PY_NEW(object t)
+    cdef bint LXML_UNICODE_STRINGS
+    cdef bint IS_PYTHON3
+    cdef bint IS_PYPY
+
+cdef extern from "lxml_endian.h":
+    cdef bint PY_BIG_ENDIAN  # defined in later Py3.x versions
diff --git a/lib/lxml/readonlytree.pxi b/lib/lxml/readonlytree.pxi
new file mode 100644
index 00000000..0f42be70
--- /dev/null
+++ b/lib/lxml/readonlytree.pxi
@@ -0,0 +1,554 @@
+# read-only tree implementation
+
+@cython.internal
+cdef class _ReadOnlyProxy:
+    u"A read-only proxy class suitable for PIs/Comments (for internal use only!)."
+    # should the xmlNode* be freed when the proxies get released?
+    cdef bint _free_after_use
+    # the wrapped libxml2 node, NULL once the proxy was invalidated
+    cdef xmlNode* _c_node
+    # the proxy that owns the list of dependent proxies (may be self)
+    cdef _ReadOnlyProxy _source_proxy
+    # all proxies that were created from the source proxy
+    cdef list _dependent_proxies
+    def __cinit__(self):
+        self._c_node = NULL
+        self._free_after_use = 0
+
+    cdef int _assertNode(self) except -1:
+        u"""This is our way of saying: this proxy is invalid!
+        """
+        if not self._c_node:
+            raise ReferenceError("Proxy invalidated!")
+        return 0
+
+    cdef int _raise_unsupported_type(self) except -1:
+        raise TypeError("Unsupported node type: %d" % self._c_node.type)
+
+    cdef void free_after_use(self):
+        u"""Should the xmlNode* be freed when releasing the proxy?
+        """
+        self._free_after_use = 1
+
+    property tag:
+        u"""Element tag
+        """
+        def __get__(self):
+            self._assertNode()
+            if self._c_node.type == tree.XML_ELEMENT_NODE:
+                return _namespacedName(self._c_node)
+            elif self._c_node.type == tree.XML_PI_NODE:
+                return ProcessingInstruction
+            elif self._c_node.type == tree.XML_COMMENT_NODE:
+                return Comment
+            elif self._c_node.type == tree.XML_ENTITY_REF_NODE:
+                return Entity
+            else:
+                self._raise_unsupported_type()
+
+    property text:
+        u"""Text before the first subelement. This is either a string or 
+        the value None, if there was no text.
+        """
+        def __get__(self):
+            self._assertNode()
+            if self._c_node.type == tree.XML_ELEMENT_NODE:
+                return _collectText(self._c_node.children)
+            elif self._c_node.type in (tree.XML_PI_NODE,
+                                       tree.XML_COMMENT_NODE):
+                if self._c_node.content is NULL:
+                    return ''
+                else:
+                    return funicode(self._c_node.content)
+            elif self._c_node.type == tree.XML_ENTITY_REF_NODE:
+                return u'&%s;' % funicode(self._c_node.name)
+            else:
+                self._raise_unsupported_type()
+
+    property tail:
+        u"""Text after this element's end tag, but before the next sibling
+        element's start tag. This is either a string or the value None, if
+        there was no text.
+        """
+        def __get__(self):
+            self._assertNode()
+            return _collectText(self._c_node.next)
+
+    property sourceline:
+        u"""Original line number as found by the parser or None if unknown.
+        """
+        def __get__(self):
+            cdef long line
+            self._assertNode()
+            line = tree.xmlGetLineNo(self._c_node)
+            if line > 0:
+                return line
+            else:
+                return None
+
+    def __repr__(self):
+        self._assertNode()
+        if self._c_node.type == tree.XML_ELEMENT_NODE:
+            return u"<Element %s at 0x%x>" % (self.tag, id(self))
+        elif self._c_node.type == tree.XML_COMMENT_NODE:
+            return u"<!--%s-->" % self.text
+        elif self._c_node.type in (tree.XML_ENTITY_REF_NODE,
+                                   tree.XML_ENTITY_NODE):
+            # proxies are created for entity *references* (see the 'tag'
+            # and 'text' properties); XML_ENTITY_NODE is kept as well for
+            # backwards compatibility
+            return u"&%s;" % funicode(self._c_node.name)
+        elif self._c_node.type == tree.XML_PI_NODE:
+            text = self.text
+            if text:
+                return u"<?%s %s?>" % (self.target, text)
+            else:
+                return u"<?%s?>" % self.target
+        else:
+            self._raise_unsupported_type()
+
+    def __getitem__(self, x):
+        u"""Returns the subelement at the given position or the requested
+        slice.
+
+        Subelements are always returned as read-only proxies that depend on
+        the same source proxy as this one.  Raises IndexError if an integer
+        index does not refer to an existing child.
+        """
+        cdef xmlNode* c_node = NULL
+        cdef Py_ssize_t step = 0, slicelength = 0
+        cdef Py_ssize_t c, i
+        cdef _node_to_node_function next_element
+        cdef list result
+        self._assertNode()
+        if isinstance(x, slice):
+            # slicing
+            if _isFullSlice(<slice>x):
+                # a full slice must yield the same kind of objects as any
+                # other slice, i.e. read-only proxies
+                return self.getchildren()
+            _findChildSlice(<slice>x, self._c_node, &c_node, &step, &slicelength)
+            if c_node is NULL:
+                return []
+            if step > 0:
+                next_element = _nextElement
+            else:
+                step = -step
+                next_element = _previousElement
+            result = []
+            c = 0
+            while c_node is not NULL and c < slicelength:
+                # exactly one proxy per selected node; this class has no
+                # '_doc' attribute, so no regular elements can be built here
+                result.append(_newReadOnlyProxy(self._source_proxy, c_node))
+                c = c + 1
+                for i from 0 <= i < step:
+                    c_node = next_element(c_node)
+            return result
+        else:
+            # indexing
+            c_node = _findChild(self._c_node, x)
+            if c_node is NULL:
+                raise IndexError, u"list index out of range"
+            return _newReadOnlyProxy(self._source_proxy, c_node)
+
+    def __len__(self):
+        u"""Returns the number of subelements.
+        """
+        cdef Py_ssize_t c
+        cdef xmlNode* c_node
+        self._assertNode()
+        c = 0
+        c_node = self._c_node.children
+        while c_node is not NULL:
+            if tree._isElement(c_node):
+                c = c + 1
+            c_node = c_node.next
+        return c
+
+    def __nonzero__(self):
+        cdef xmlNode* c_node
+        self._assertNode()
+        c_node = _findChildBackwards(self._c_node, 0)
+        return c_node != NULL
+
+    def __deepcopy__(self, memo):
+        u"__deepcopy__(self, memo)"
+        return self.__copy__()
+
+    cpdef __copy__(self):
+        u"__copy__(self)"
+        cdef xmlDoc* c_doc
+        cdef xmlNode* c_node
+        cdef _Document new_doc
+        if self._c_node is NULL:
+            # invalidated proxy, nothing left to copy
+            return self
+        c_doc = _copyDocRoot(self._c_node.doc, self._c_node) # recursive
+        new_doc = _documentFactory(c_doc, None)
+        root = new_doc.getroot()
+        if root is not None:
+            return root
+        # Comment/PI
+        c_node = c_doc.children
+        while c_node is not NULL and c_node.type != self._c_node.type:
+            c_node = c_node.next
+        if c_node is NULL:
+            return None
+        return _elementFactory(new_doc, c_node)
+
+    def __iter__(self):
+        return iter(self.getchildren())
+
+    def iterchildren(self, tag=None, *, reversed=False):
+        u"""iterchildren(self, tag=None, reversed=False)
+
+        Iterate over the children of this element.
+        """
+        children = self.getchildren()
+        if tag is not None and tag != '*':
+            children = [ el for el in children if el.tag == tag ]
+        if reversed:
+            children = children[::-1]
+        return iter(children)
+
+    cpdef getchildren(self):
+        u"""Returns all subelements. The elements are returned in document
+        order.
+        """
+        cdef xmlNode* c_node
+        cdef list result
+        self._assertNode()
+        result = []
+        c_node = self._c_node.children
+        while c_node is not NULL:
+            if tree._isElement(c_node):
+                result.append(_newReadOnlyProxy(self._source_proxy, c_node))
+            c_node = c_node.next
+        return result
+
+    def getparent(self):
+        u"""Returns the parent of this element or None for the root element.
+        """
+        cdef xmlNode* c_parent
+        self._assertNode()
+        c_parent = self._c_node.parent
+        if c_parent is NULL or not tree._isElement(c_parent):
+            return None
+        else:
+            return _newReadOnlyProxy(self._source_proxy, c_parent)
+
+    def getnext(self):
+        u"""Returns the following sibling of this element or None.
+        """
+        cdef xmlNode* c_node
+        self._assertNode()
+        c_node = _nextElement(self._c_node)
+        if c_node is not NULL:
+            return _newReadOnlyProxy(self._source_proxy, c_node)
+        return None
+
+    def getprevious(self):
+        u"""Returns the preceding sibling of this element or None.
+        """
+        cdef xmlNode* c_node
+        self._assertNode()
+        c_node = _previousElement(self._c_node)
+        if c_node is not NULL:
+            return _newReadOnlyProxy(self._source_proxy, c_node)
+        return None
+
+
+@cython.final
+@cython.internal
+cdef class _ReadOnlyPIProxy(_ReadOnlyProxy):
+    u"A read-only proxy for processing instructions (for internal use only!)"
+    property target:
+        # the name of the underlying node, decoded by funicode()
+        def __get__(self):
+            self._assertNode()
+            return funicode(self._c_node.name)
+
+@cython.final
+@cython.internal
+cdef class _ReadOnlyEntityProxy(_ReadOnlyProxy):
+    u"A read-only proxy for entity references (for internal use only!)"
+    property name:
+        # The entity name, i.e. the name of the underlying node.
+        #
+        # Every accessor validates the proxy first so that an invalidated
+        # proxy raises ReferenceError instead of dereferencing NULL.
+        def __get__(self):
+            self._assertNode()
+            return funicode(self._c_node.name)
+
+        def __set__(self, value):
+            self._assertNode()
+            value_utf = _utf8(value)
+            # check the encoded bytes: works for both text and byte string
+            # input, '&' and ';' are single ASCII bytes in UTF-8
+            if b'&' in value_utf or b';' in value_utf:
+                raise ValueError(u"Invalid entity name '%s'" % value)
+            tree.xmlNodeSetName(self._c_node, _xcstr(value_utf))
+
+    property text:
+        # the entity reference in its serialised form: '&name;'
+        def __get__(self):
+            self._assertNode()
+            return u'&%s;' % funicode(self._c_node.name)
+
+
+@cython.internal
+cdef class _ReadOnlyElementProxy(_ReadOnlyProxy):
+    u"The main read-only Element proxy class (for internal use only!)."
+
+    property attrib:
+        # A new dict built from the collected attributes on each access,
+        # so changing it does not touch the underlying node.
+        def __get__(self):
+            self._assertNode()
+            return dict(_collectAttributes(self._c_node, 3))
+
+    property prefix:
+        u"""Namespace prefix or None.
+        """
+        def __get__(self):
+            self._assertNode()
+            if self._c_node.ns is not NULL:
+                if self._c_node.ns.prefix is not NULL:
+                    return funicode(self._c_node.ns.prefix)
+            return None
+
+    def get(self, key, default=None):
+        u"""Gets an element attribute.
+
+        The 'default' value is passed on to the attribute lookup.
+        """
+        self._assertNode()
+        return _getNodeAttributeValue(self._c_node, key, default)
+
+    def keys(self):
+        u"""Gets a list of attribute names. The names are returned in an
+        arbitrary order (just like for an ordinary Python dictionary).
+        """
+        self._assertNode()
+        return _collectAttributes(self._c_node, 1)
+
+    def values(self):
+        u"""Gets element attribute values, as a sequence. The values are
+        returned in an arbitrary order.
+        """
+        self._assertNode()
+        return _collectAttributes(self._c_node, 2)
+
+    def items(self):
+        u"""Gets element attributes as a sequence of items, in the form that
+        the 'attrib' property feeds into dict(). The attributes are returned
+        in an arbitrary order.
+        """
+        self._assertNode()
+        return _collectAttributes(self._c_node, 3)
+
+cdef _ReadOnlyProxy _newReadOnlyProxy(
+    _ReadOnlyProxy source_proxy, xmlNode* c_node):
+    # Create a read-only proxy for c_node and register it with source_proxy.
+    #
+    # The proxy class depends on the node type: elements and PIs get their
+    # own subclass, comments and entity references get the plain base class.
+    # Raises TypeError for any other node type.
+    cdef _ReadOnlyProxy el
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        el = _ReadOnlyElementProxy.__new__(_ReadOnlyElementProxy)
+    elif c_node.type == tree.XML_PI_NODE:
+        el = _ReadOnlyPIProxy.__new__(_ReadOnlyPIProxy)
+    elif c_node.type in (tree.XML_COMMENT_NODE,
+                         tree.XML_ENTITY_REF_NODE):
+        el = _ReadOnlyProxy.__new__(_ReadOnlyProxy)
+    else:
+        raise TypeError("Unsupported element type: %d" % c_node.type)
+    el._c_node = c_node
+    _initReadOnlyProxy(el, source_proxy)
+    return el
+
+cdef inline _initReadOnlyProxy(_ReadOnlyProxy el,
+                               _ReadOnlyProxy source_proxy):
+    # Link the new proxy 'el' to its source proxy.
+    #
+    # Without a source proxy, 'el' becomes its own source and starts a new
+    # list of dependent proxies that contains itself.  Otherwise, it is
+    # appended to the list of the given source proxy.
+    if source_proxy is None:
+        el._source_proxy = el
+        el._dependent_proxies = [el]
+    else:
+        el._source_proxy = source_proxy
+        source_proxy._dependent_proxies.append(el)
+
+cdef _freeReadOnlyProxies(_ReadOnlyProxy sourceProxy):
+    # Invalidate all proxies that depend on sourceProxy by resetting their
+    # node pointer to NULL.  Nodes of proxies that are marked as
+    # 'free after use' are freed on the way.  The list of dependent proxies
+    # is emptied at the end.
+    cdef xmlNode* c_released
+    cdef _ReadOnlyProxy proxy
+    if sourceProxy is None or sourceProxy._dependent_proxies is None:
+        return
+    for proxy in sourceProxy._dependent_proxies:
+        # detach the node before freeing it
+        c_released = proxy._c_node
+        proxy._c_node = NULL
+        if proxy._free_after_use:
+            tree.xmlFreeNode(c_released)
+    del sourceProxy._dependent_proxies[:]
+
+# opaque wrapper around non-element nodes, e.g. the document node
+#
+# This class does not imply any restrictions on modifiability or
+# read-only status of the node, so use with caution.
+
+@cython.internal
+cdef class _OpaqueNodeWrapper:
+    # the wrapped libxml2 node; assigned by the factory function that
+    # creates instances via __new__()
+    cdef tree.xmlNode* _c_node
+    def __init__(self):
+        # instantiation from Python code is rejected
+        raise TypeError, u"This type cannot be instantiated from Python"
+
+@cython.final
+@cython.internal
+cdef class _OpaqueDocumentWrapper(_OpaqueNodeWrapper):
+    # Wrapper for document nodes that only supports adding top-level nodes.
+    cdef int _assertNode(self) except -1:
+        u"""This is our way of saying: this proxy is invalid!
+        """
+        # NOTE: uses an assertion here, whereas _ReadOnlyProxy._assertNode()
+        # raises ReferenceError
+        assert self._c_node is not NULL, u"Proxy invalidated!"
+        return 0
+
+    cpdef append(self, other_element):
+        u"""Append a copy of an Element to the list of children.
+
+        Raises ValueError when an element is appended to a document that
+        already has a root element, and TypeError for nodes that are neither
+        elements, processing instructions nor comments.
+        """
+        cdef xmlNode* c_next
+        cdef xmlNode* c_node
+        self._assertNode()
+        c_node = _roNodeOf(other_element)
+        if c_node.type == tree.XML_ELEMENT_NODE:
+            if tree.xmlDocGetRootElement(<tree.xmlDoc*>self._c_node) is not NULL:
+                raise ValueError, u"cannot append, document already has a root element"
+        elif c_node.type not in (tree.XML_PI_NODE, tree.XML_COMMENT_NODE):
+            raise TypeError, u"unsupported element type for top-level node: %d" % c_node.type
+        # from here on, c_node refers to the copy, not to the original node
+        c_node = _copyNodeToDoc(c_node, <tree.xmlDoc*>self._c_node)
+        c_next = c_node.next
+        tree.xmlAddChild(self._c_node, c_node)
+        _moveTail(c_next, c_node)
+
+    def extend(self, elements):
+        u"""Append a copy of all Elements from a sequence to the list of
+        children.
+        """
+        self._assertNode()
+        for element in elements:
+            self.append(element)
+
+cdef _OpaqueNodeWrapper _newOpaqueAppendOnlyNodeWrapper(xmlNode* c_node):
+    # Wrap c_node in an opaque wrapper object.  Document nodes (XML or
+    # HTML) get the wrapper class that supports append()/extend(), all
+    # other nodes get the plain base class.
+    cdef _OpaqueNodeWrapper node
+    if c_node.type in (tree.XML_DOCUMENT_NODE, tree.XML_HTML_DOCUMENT_NODE):
+        node = _OpaqueDocumentWrapper.__new__(_OpaqueDocumentWrapper)
+    else:
+        node = _OpaqueNodeWrapper.__new__(_OpaqueNodeWrapper)
+    node._c_node = c_node
+    return node
+
+# element proxies that allow restricted modification
+
+@cython.internal
+cdef class _ModifyContentOnlyProxy(_ReadOnlyProxy):
+    u"""A read-only proxy that allows changing the text content.
+    """
+    property text:
+        # Reads and replaces the content of the underlying node.
+        # Reading returns '' if the node has no content; setting None
+        # passes a NULL content on to libxml2.
+        def __get__(self):
+            self._assertNode()
+            if self._c_node.content is NULL:
+                return ''
+            else:
+                return funicode(self._c_node.content)
+
+        def __set__(self, value):
+            cdef const_xmlChar* c_text
+            self._assertNode()
+            if value is None:
+                c_text = <const_xmlChar*>NULL
+            else:
+                # keep the encoded bytes object referenced by 'value'
+                # while its buffer is in use
+                value = _utf8(value)
+                c_text = _xcstr(value)
+            tree.xmlNodeSetContent(self._c_node, c_text)
+
+@cython.final
+@cython.internal
+cdef class _ModifyContentOnlyPIProxy(_ModifyContentOnlyProxy):
+    u"""Read-only proxy for a processing instruction whose text content
+    and target may be changed.
+    """
+    property target:
+        u"""The name of the wrapped node, i.e. the PI target."""
+        def __get__(self):
+            self._assertNode()
+            return funicode(self._c_node.name)
+
+        def __set__(self, value):
+            self._assertNode()
+            # 'value' keeps the _utf8() result referenced while its C
+            # string is passed to libxml2
+            value = _utf8(value)
+            tree.xmlNodeSetName(self._c_node, _xcstr(value))
+
+@cython.final
+@cython.internal
+cdef class _ModifyContentOnlyEntityProxy(_ModifyContentOnlyProxy):
+    u"A read-only proxy for entity references (for internal use only!)"
+    property name:
+        u"""The name of the wrapped entity reference node.
+
+        The assigned name must not contain '&' or ';'.
+        """
+        def __get__(self):
+            self._assertNode()
+            return funicode(self._c_node.name)
+
+        def __set__(self, value):
+            self._assertNode()
+            # Keep the original value for the error message and run the
+            # check on the _utf8() result with byte literals: mixing a
+            # unicode literal with the byte string fails on Python 3.
+            value_utf = _utf8(value)
+            assert b'&' not in value_utf and b';' not in value_utf, \
+                u"Invalid entity name '%s'" % value
+            c_text = _xcstr(value_utf)
+            tree.xmlNodeSetName(self._c_node, c_text)
+
+
+@cython.final
+@cython.internal
+cdef class _AppendOnlyElementProxy(_ReadOnlyElementProxy):
+    u"""A read-only element that allows adding children and changing the
+    text content (i.e. everything that adds to the subtree).
+    """
+    cpdef append(self, other_element):
+        u"""Append a copy of an Element to the list of children.
+
+        ``other_element`` may be anything that ``_roNodeOf()`` accepts.
+        """
+        cdef xmlNode* c_next
+        cdef xmlNode* c_node
+        self._assertNode()
+        c_node = _roNodeOf(other_element)
+        # from here on, c_node is the node returned by _copyNodeToDoc()
+        # for this proxy's document, not the argument's own node
+        c_node = _copyNodeToDoc(c_node, self._c_node.doc)
+        # read the sibling pointer before xmlAddChild() relinks the node
+        c_next = c_node.next
+        tree.xmlAddChild(self._c_node, c_node)
+        # NOTE(review): presumably moves the tail text nodes that followed
+        # the copy behind its new position - confirm in _moveTail()
+        _moveTail(c_next, c_node)
+            
+    def extend(self, elements):
+        u"""Append a copy of all Elements from a sequence to the list of
+        children.
+        """
+        self._assertNode()
+        for element in elements:
+            self.append(element)
+
+    property text:
+        u"""Text before the first subelement. This is either a string or the
+        value None, if there was no text.
+        """
+        def __get__(self):
+            self._assertNode()
+            return _collectText(self._c_node.children)
+
+        def __set__(self, value):
+            self._assertNode()
+            # QName values are resolved to their text form first
+            if isinstance(value, QName):
+                value = _resolveQNameText(self, value).decode('utf8')
+            _setNodeText(self._c_node, value)
+
+
+cdef _ReadOnlyProxy _newAppendOnlyProxy(
+    _ReadOnlyProxy source_proxy, xmlNode* c_node):
+    # Create the proxy class that matches the type of c_node (element, PI
+    # or comment) and register it through _initReadOnlyProxy().
+    # Any other node type raises TypeError.
+    cdef _ReadOnlyProxy proxy
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        proxy = _AppendOnlyElementProxy.__new__(_AppendOnlyElementProxy)
+    elif c_node.type == tree.XML_PI_NODE:
+        proxy = _ModifyContentOnlyPIProxy.__new__(_ModifyContentOnlyPIProxy)
+    elif c_node.type == tree.XML_COMMENT_NODE:
+        proxy = _ModifyContentOnlyProxy.__new__(_ModifyContentOnlyProxy)
+    else:
+        raise TypeError("Unsupported element type: %d" % c_node.type)
+    proxy._c_node = c_node
+    _initReadOnlyProxy(proxy, source_proxy)
+    return proxy
+
+cdef xmlNode* _roNodeOf(element) except NULL:
+    # Return the C node behind an _Element, a _ReadOnlyProxy or an
+    # _OpaqueNodeWrapper.  Raises TypeError for any other argument type
+    # and for objects whose node pointer is NULL.
+    cdef xmlNode* c_result
+    if isinstance(element, _Element):
+        c_result = (<_Element>element)._c_node
+    elif isinstance(element, _ReadOnlyProxy):
+        c_result = (<_ReadOnlyProxy>element)._c_node
+    elif isinstance(element, _OpaqueNodeWrapper):
+        c_result = (<_OpaqueNodeWrapper>element)._c_node
+    else:
+        raise TypeError(u"invalid argument type %s" % type(element))
+
+    if c_result is NULL:
+        raise TypeError(u"invalid element")
+    return c_result
+
+cdef xmlNode* _nonRoNodeOf(element) except NULL:
+    # Return the C node behind an _Element, an _AppendOnlyElementProxy or
+    # an _OpaqueNodeWrapper.  Raises TypeError for any other argument type
+    # and for objects whose node pointer is NULL.
+    cdef xmlNode* c_result
+    if isinstance(element, _Element):
+        c_result = (<_Element>element)._c_node
+    elif isinstance(element, _AppendOnlyElementProxy):
+        c_result = (<_AppendOnlyElementProxy>element)._c_node
+    elif isinstance(element, _OpaqueNodeWrapper):
+        c_result = (<_OpaqueNodeWrapper>element)._c_node
+    else:
+        raise TypeError(u"invalid argument type %s" % type(element))
+
+    if c_result is NULL:
+        raise TypeError(u"invalid element")
+    return c_result
diff --git a/lib/lxml/relaxng.pxi b/lib/lxml/relaxng.pxi
new file mode 100644
index 00000000..de486e1b
--- /dev/null
+++ b/lib/lxml/relaxng.pxi
@@ -0,0 +1,123 @@
+# support for RelaxNG validation
+from lxml.includes cimport relaxng
+
+class RelaxNGError(LxmlError):
+    u"""Common base class of all RelaxNG related errors."""
+
+class RelaxNGParseError(RelaxNGError):
+    u"""Raised when a document cannot be parsed as a RelaxNG schema."""
+
+class RelaxNGValidateError(RelaxNGError):
+    u"""Raised on errors while validating a document with a RelaxNG
+    schema."""
+
+################################################################################
+# RelaxNG
+
+cdef class RelaxNG(_Validator):
+    u"""RelaxNG(self, etree=None, file=None)
+    Turn a document into a Relax NG validator.
+
+    Either pass a schema as Element or ElementTree, or pass a file or
+    filename through the ``file`` keyword argument.
+    """
+    cdef relaxng.xmlRelaxNG* _c_schema
+    def __cinit__(self):
+        self._c_schema = NULL
+
+    def __init__(self, etree=None, *, file=None):
+        u"""Parse the schema from ``etree`` or, if that is None, ``file``.
+
+        Raises RelaxNGParseError if neither argument is given, if no
+        parser context could be created, or if parsing the schema fails.
+        """
+        cdef _Document doc
+        cdef _Element root_node
+        cdef xmlDoc* fake_c_doc
+        cdef relaxng.xmlRelaxNGParserCtxt* parser_ctxt
+        _Validator.__init__(self)
+        # only set on the 'etree' path; must be destroyed on every exit
+        fake_c_doc = NULL
+        if etree is not None:
+            doc = _documentOrRaise(etree)
+            root_node = _rootNodeOrRaise(etree)
+            fake_c_doc = _fakeRootDoc(doc._c_doc, root_node._c_node)
+            parser_ctxt = relaxng.xmlRelaxNGNewDocParserCtxt(fake_c_doc)
+        elif file is not None:
+            if _isString(file):
+                # file name: libxml2 reads the schema file itself
+                doc = None
+                filename = _encodeFilename(file)
+                with self._error_log:
+                    parser_ctxt = relaxng.xmlRelaxNGNewParserCtxt(_cstr(filename))
+            else:
+                # anything else goes through _parseDocument() first
+                doc = _parseDocument(file, None, None)
+                parser_ctxt = relaxng.xmlRelaxNGNewDocParserCtxt(doc._c_doc)
+        else:
+            raise RelaxNGParseError, u"No tree or file given"
+
+        if parser_ctxt is NULL:
+            if fake_c_doc is not NULL:
+                _destroyFakeDoc(doc._c_doc, fake_c_doc)
+            raise RelaxNGParseError(
+                self._error_log._buildExceptionMessage(
+                    u"Document is not parsable as Relax NG"),
+                self._error_log)
+
+        relaxng.xmlRelaxNGSetParserStructuredErrors(
+            parser_ctxt, _receiveError, <void*>self._error_log)
+        self._c_schema = relaxng.xmlRelaxNGParse(parser_ctxt)
+
+        # the parser context is no longer needed, whatever the result
+        relaxng.xmlRelaxNGFreeParserCtxt(parser_ctxt)
+        if self._c_schema is NULL:
+            if fake_c_doc is not NULL:
+                _destroyFakeDoc(doc._c_doc, fake_c_doc)
+            raise RelaxNGParseError(
+                self._error_log._buildExceptionMessage(
+                    u"Document is not valid Relax NG"),
+                self._error_log)
+        if fake_c_doc is not NULL:
+            _destroyFakeDoc(doc._c_doc, fake_c_doc)
+
+    def __dealloc__(self):
+        relaxng.xmlRelaxNGFree(self._c_schema)
+
+    def __call__(self, etree):
+        u"""__call__(self, etree)
+
+        Validate doc using Relax NG.
+
+        Returns true if document is valid, false if not.
+        Raises RelaxNGValidateError if libxml2 reports an internal error
+        (return value -1)."""
+        cdef _Document doc
+        cdef _Element root_node
+        cdef xmlDoc* c_doc
+        cdef relaxng.xmlRelaxNGValidCtxt* valid_ctxt
+        cdef int ret
+
+        assert self._c_schema is not NULL, "RelaxNG instance not initialised"
+        doc = _documentOrRaise(etree)
+        root_node = _rootNodeOrRaise(etree)
+
+        valid_ctxt = relaxng.xmlRelaxNGNewValidCtxt(self._c_schema)
+        if valid_ctxt is NULL:
+            raise MemoryError()
+
+        try:
+            self._error_log.clear()
+            relaxng.xmlRelaxNGSetValidStructuredErrors(
+                valid_ctxt, _receiveError, <void*>self._error_log)
+            c_doc = _fakeRootDoc(doc._c_doc, root_node._c_node)
+            # the validation itself runs without holding the GIL
+            with nogil:
+                ret = relaxng.xmlRelaxNGValidateDoc(valid_ctxt, c_doc)
+            _destroyFakeDoc(doc._c_doc, c_doc)
+        finally:
+            relaxng.xmlRelaxNGFreeValidCtxt(valid_ctxt)
+
+        if ret == -1:
+            raise RelaxNGValidateError(
+                u"Internal error in Relax NG validation",
+                self._error_log)
+        # 0 means valid, any other value means invalid
+        return ret == 0
diff --git a/lib/lxml/sax.py b/lib/lxml/sax.py
new file mode 100644
index 00000000..dc1354d9
--- /dev/null
+++ b/lib/lxml/sax.py
@@ -0,0 +1,247 @@
+"""
+SAX-based adapter to copy trees from/to the Python standard library.
+
+Use the `ElementTreeContentHandler` class to build an ElementTree from
+SAX events.
+
+Use the `ElementTreeProducer` class or the `saxify()` function to fire
+the SAX events of an ElementTree against a SAX ContentHandler.
+
+See http://codespeak.net/lxml/sax.html
+"""
+
+from xml.sax.handler import ContentHandler
+from lxml import etree
+from lxml.etree import ElementTree, SubElement
+from lxml.etree import Comment, ProcessingInstruction
+
+class SaxError(etree.LxmlError):
+    """General SAX error.
+    """
+    pass
+
+def _getNsTag(tag):
+    if tag[0] == '{':
+        return tuple(tag[1:].split('}', 1))
+    else:
+        return (None, tag)
+
+
+class ElementTreeContentHandler(ContentHandler):
+    """Build an lxml ElementTree from SAX events.
+    """
+    def __init__(self, makeelement=None):
+        self._root = None
+        self._root_siblings = []
+        self._element_stack = []
+        self._default_ns = None
+        self._ns_mapping = { None : [None] }
+        self._new_mappings = {}
+        if makeelement is None:
+            makeelement = etree.Element
+        self._makeelement = makeelement
+
+    def _get_etree(self):
+        "Contains the generated ElementTree after parsing is finished."
+        return ElementTree(self._root)
+
+    etree = property(_get_etree, doc=_get_etree.__doc__)
+
+    def setDocumentLocator(self, locator):
+        pass
+
+    def startDocument(self):
+        pass
+
+    def endDocument(self):
+        pass
+
+    def startPrefixMapping(self, prefix, uri):
+        self._new_mappings[prefix] = uri
+        try:
+            self._ns_mapping[prefix].append(uri)
+        except KeyError:
+            self._ns_mapping[prefix] = [uri]
+        if prefix is None:
+            self._default_ns = uri
+
+    def endPrefixMapping(self, prefix):
+        ns_uri_list = self._ns_mapping[prefix]
+        ns_uri_list.pop()
+        if prefix is None:
+            self._default_ns = ns_uri_list[-1]
+
+    def _buildTag(self, ns_name_tuple):
+        ns_uri, local_name = ns_name_tuple
+        if ns_uri:
+            el_tag = "{%s}%s" % ns_name_tuple
+        elif self._default_ns:
+            el_tag = "{%s}%s" % (self._default_ns, local_name)
+        else:
+            el_tag = local_name
+        return el_tag
+
+    def startElementNS(self, ns_name, qname, attributes=None):
+        el_name = self._buildTag(ns_name)
+        if attributes:
+            attrs = {}
+            try:
+                iter_attributes = attributes.iteritems()
+            except AttributeError:
+                iter_attributes = attributes.items()
+
+            for name_tuple, value in iter_attributes:
+                if name_tuple[0]:
+                    attr_name = "{%s}%s" % name_tuple
+                else:
+                    attr_name = name_tuple[1]
+                attrs[attr_name] = value
+        else:
+            attrs = None
+
+        element_stack = self._element_stack
+        if self._root is None:
+            element = self._root = \
+                      self._makeelement(el_name, attrs, self._new_mappings)
+            if self._root_siblings and hasattr(element, 'addprevious'):
+                for sibling in self._root_siblings:
+                    element.addprevious(sibling)
+            del self._root_siblings[:]
+        else:
+            element = SubElement(element_stack[-1], el_name,
+                                 attrs, self._new_mappings)
+        element_stack.append(element)
+
+        self._new_mappings.clear()
+
+    def processingInstruction(self, target, data):
+        pi = ProcessingInstruction(target, data)
+        if self._root is None:
+            self._root_siblings.append(pi)
+        else:
+            self._element_stack[-1].append(pi)
+
+    def endElementNS(self, ns_name, qname):
+        element = self._element_stack.pop()
+        el_tag = self._buildTag(ns_name)
+        if el_tag != element.tag:
+            raise SaxError("Unexpected element closed: " + el_tag)
+
+    def startElement(self, name, attributes=None):
+        if attributes:
+            attributes = dict(
+                    [((None, k), v) for k, v in attributes.items()]
+                )
+        self.startElementNS((None, name), name, attributes)
+
+    def endElement(self, name):
+        self.endElementNS((None, name), name)
+
+    def characters(self, data):
+        last_element = self._element_stack[-1]
+        try:
+            # if there already is a child element, we must append to its tail
+            last_element = last_element[-1]
+            last_element.tail = (last_element.tail or '') + data
+        except IndexError:
+            # otherwise: append to the text
+            last_element.text = (last_element.text or '') + data
+
+    ignorableWhitespace = characters
+
+
+class ElementTreeProducer(object):
+    """Produces SAX events for an element and children.
+    """
+    def __init__(self, element_or_tree, content_handler):
+        try:
+            element = element_or_tree.getroot()
+        except AttributeError:
+            element = element_or_tree
+        self._element = element
+        self._content_handler = content_handler
+        from xml.sax.xmlreader import AttributesNSImpl as attr_class
+        self._attr_class = attr_class
+        self._empty_attributes = attr_class({}, {})
+
+    def saxify(self):
+        self._content_handler.startDocument()
+
+        element = self._element
+        if hasattr(element, 'getprevious'):
+            siblings = []
+            sibling = element.getprevious()
+            while getattr(sibling, 'tag', None) is ProcessingInstruction:
+                siblings.append(sibling)
+                sibling = sibling.getprevious()
+            for sibling in siblings[::-1]:
+                self._recursive_saxify(sibling, {})
+
+        self._recursive_saxify(element, {})
+
+        if hasattr(element, 'getnext'):
+            sibling = element.getnext()
+            while getattr(sibling, 'tag', None) is ProcessingInstruction:
+                self._recursive_saxify(sibling, {})
+                sibling = sibling.getnext()
+
+        self._content_handler.endDocument()
+
+    def _recursive_saxify(self, element, prefixes):
+        content_handler = self._content_handler
+        tag = element.tag
+        if tag is Comment or tag is ProcessingInstruction:
+            if tag is ProcessingInstruction:
+                content_handler.processingInstruction(
+                    element.target, element.text)
+            if element.tail:
+                content_handler.characters(element.tail)
+            return
+
+        new_prefixes = []
+        build_qname = self._build_qname
+        attribs = element.items()
+        if attribs:
+            attr_values = {}
+            attr_qnames = {}
+            for attr_ns_name, value in attribs:
+                attr_ns_tuple = _getNsTag(attr_ns_name)
+                attr_values[attr_ns_tuple] = value
+                attr_qnames[attr_ns_tuple] = build_qname(
+                    attr_ns_tuple[0], attr_ns_tuple[1], prefixes, new_prefixes)
+            sax_attributes = self._attr_class(attr_values, attr_qnames)
+        else:
+            sax_attributes = self._empty_attributes
+
+        ns_uri, local_name = _getNsTag(tag)
+        qname = build_qname(ns_uri, local_name, prefixes, new_prefixes)
+
+        for prefix, uri in new_prefixes:
+            content_handler.startPrefixMapping(prefix, uri)
+        content_handler.startElementNS((ns_uri, local_name),
+                                       qname, sax_attributes)
+        if element.text:
+            content_handler.characters(element.text)
+        for child in element:
+            self._recursive_saxify(child, prefixes)
+        content_handler.endElementNS((ns_uri, local_name), qname)
+        for prefix, uri in new_prefixes:
+            content_handler.endPrefixMapping(prefix)
+        if element.tail:
+            content_handler.characters(element.tail)
+
+    def _build_qname(self, ns_uri, local_name, prefixes, new_prefixes):
+        if ns_uri is None:
+            return local_name
+        try:
+            prefix = prefixes[ns_uri]
+        except KeyError:
+            prefix = prefixes[ns_uri] = 'ns%02d' % len(prefixes)
+            new_prefixes.append( (prefix, ns_uri) )
+        return prefix + ':' + local_name
+
+def saxify(element_or_tree, content_handler):
+    """One-shot helper to generate SAX events from an XML tree and fire
+    them against a SAX ContentHandler.
+    """
+    return ElementTreeProducer(element_or_tree, content_handler).saxify()
diff --git a/lib/lxml/saxparser.pxi b/lib/lxml/saxparser.pxi
new file mode 100644
index 00000000..7f6e0de3
--- /dev/null
+++ b/lib/lxml/saxparser.pxi
@@ -0,0 +1,763 @@
+# SAX-like interfaces
+
+# Bit flags for the SAX events of a parser target.  They are tested
+# against _SaxParserTarget._sax_event_filter when the callbacks are
+# connected.
+ctypedef enum _SaxParserEvents:
+    SAX_EVENT_START   =  1
+    SAX_EVENT_END     =  2
+    SAX_EVENT_DATA    =  4
+    SAX_EVENT_DOCTYPE =  8
+    SAX_EVENT_PI      = 16
+    SAX_EVENT_COMMENT = 32
+
+# Bit flags for the parse events to collect.  _buildParseEventFilter()
+# combines them into the filter value from the event names 'start',
+# 'end', 'start-ns', 'end-ns', 'comment' and 'pi'.
+ctypedef enum _ParseEventFilter:
+    PARSE_EVENT_FILTER_START     =  1
+    PARSE_EVENT_FILTER_END       =  2
+    PARSE_EVENT_FILTER_START_NS  =  4
+    PARSE_EVENT_FILTER_END_NS    =  8
+    PARSE_EVENT_FILTER_COMMENT   = 16
+    PARSE_EVENT_FILTER_PI        = 32
+
+
+cdef int _buildParseEventFilter(events) except -1:
+    # Translate an iterable of event names into the combined
+    # PARSE_EVENT_FILTER_* bit mask.  An unknown name raises ValueError.
+    cdef int mask = 0
+    for name in events:
+        if name == 'start':
+            mask |= PARSE_EVENT_FILTER_START
+        elif name == 'end':
+            mask |= PARSE_EVENT_FILTER_END
+        elif name == 'start-ns':
+            mask |= PARSE_EVENT_FILTER_START_NS
+        elif name == 'end-ns':
+            mask |= PARSE_EVENT_FILTER_END_NS
+        elif name == 'comment':
+            mask |= PARSE_EVENT_FILTER_COMMENT
+        elif name == 'pi':
+            mask |= PARSE_EVENT_FILTER_PI
+        else:
+            raise ValueError(u"invalid event name '%s'" % name)
+    return mask
+
+
+cdef class _SaxParserTarget:
+    # Base class of the parser targets that _SaxParserContext calls into.
+    # All handlers defined here are stubs that do nothing.
+    # NOTE(review): subclasses presumably override the handlers they need
+    # and set the matching SAX_EVENT_* bits in _sax_event_filter - confirm.
+    cdef int _sax_event_filter
+    def __cinit__(self):
+        # no events requested by default
+        self._sax_event_filter = 0
+
+    cdef _handleSaxStart(self, tag, attrib, nsmap):
+        return None
+    cdef _handleSaxEnd(self, tag):
+        return None
+    cdef int _handleSaxData(self, data) except -1:
+        return 0
+    cdef int _handleSaxDoctype(self, root_tag, public_id, system_id) except -1:
+        return 0
+    cdef _handleSaxPi(self, target, data):
+        return None
+    cdef _handleSaxComment(self, comment):
+        return None
+
+
+#@cython.final
+@cython.internal
+cdef class _SaxParserContext(_ParserContext):
+    u"""This class maps SAX2 events to parser target events.
+    """
+    cdef _SaxParserTarget _target
+    cdef _BaseParser _parser
+    # the SAX callbacks that were installed before ours replaced them
+    cdef xmlparser.startElementNsSAX2Func _origSaxStart
+    cdef xmlparser.endElementNsSAX2Func   _origSaxEnd
+    cdef xmlparser.startElementSAXFunc    _origSaxStartNoNs
+    cdef xmlparser.endElementSAXFunc      _origSaxEndNoNs
+    cdef xmlparser.charactersSAXFunc      _origSaxData
+    cdef xmlparser.cdataBlockSAXFunc      _origSaxCData
+    cdef xmlparser.internalSubsetSAXFunc  _origSaxDoctype
+    cdef xmlparser.commentSAXFunc         _origSaxComment
+    cdef xmlparser.processingInstructionSAXFunc _origSaxPI
+    cdef xmlparser.startDocumentSAXFunc   _origSaxStartDocument
+
+    # for event collecting
+    cdef int _event_filter
+    cdef list _ns_stack
+    cdef list _node_stack
+    cdef _ParseEventsIterator events_iterator
+
+    # for iterparse
+    cdef _Element  _root
+    cdef _MultiTagMatcher _matcher
+
+    def __cinit__(self, _BaseParser parser):
+        self._ns_stack = []
+        self._node_stack = []
+        self._parser = parser
+        self.events_iterator = _ParseEventsIterator()
+
+    cdef void _setSaxParserTarget(self, _SaxParserTarget target):
+        self._target = target
+
+    cdef void _initParserContext(self, xmlparser.xmlParserCtxt* c_ctxt):
+        # A parser target takes precedence over plain event collection;
+        # without target and event filter, the callbacks stay untouched.
+        _ParserContext._initParserContext(self, c_ctxt)
+        if self._target is not None:
+            self._connectTarget(c_ctxt)
+        elif self._event_filter:
+            self._connectEvents(c_ctxt)
+
+    cdef void _connectTarget(self, xmlparser.xmlParserCtxt* c_ctxt):
+        """wrap original SAX2 callbacks to call into parser target"""
+        sax = c_ctxt.sax
+        # Each chained assignment below sets both the saved "original"
+        # and the active callback to NULL; the active callback is then
+        # replaced only if the target asked for that event.
+        self._origSaxStart = sax.startElementNs = NULL
+        self._origSaxStartNoNs = sax.startElement = NULL
+        if self._target._sax_event_filter & SAX_EVENT_START:
+            # intercept => overwrite orig callback
+            # FIXME: also intercept when collecting END events
+            if sax.initialized == xmlparser.XML_SAX2_MAGIC:
+                sax.startElementNs = _handleSaxTargetStart
+            sax.startElement = _handleSaxTargetStartNoNs
+
+        self._origSaxEnd = sax.endElementNs = NULL
+        self._origSaxEndNoNs = sax.endElement = NULL
+        if self._target._sax_event_filter & SAX_EVENT_END:
+            if sax.initialized == xmlparser.XML_SAX2_MAGIC:
+                sax.endElementNs = _handleSaxEnd
+            sax.endElement = _handleSaxEndNoNs
+
+        # character data and CDATA sections share one handler
+        self._origSaxData = sax.characters = sax.cdataBlock = NULL
+        if self._target._sax_event_filter & SAX_EVENT_DATA:
+            sax.characters = sax.cdataBlock = _handleSaxData
+
+        # doctype propagation is always required for entity replacement
+        # (so the original callback is kept here, not set to NULL)
+        self._origSaxDoctype = sax.internalSubset
+        if self._target._sax_event_filter & SAX_EVENT_DOCTYPE:
+            sax.internalSubset = _handleSaxTargetDoctype
+
+        self._origSaxPI = sax.processingInstruction = NULL
+        if self._target._sax_event_filter & SAX_EVENT_PI:
+            sax.processingInstruction = _handleSaxPI
+
+        self._origSaxComment = sax.comment = NULL
+        if self._target._sax_event_filter & SAX_EVENT_COMMENT:
+            sax.comment = _handleSaxTargetComment
+
+        # enforce entity replacement
+        sax.reference = NULL
+        c_ctxt.replaceEntities = 1
+
+    cdef void _connectEvents(self, xmlparser.xmlParserCtxt* c_ctxt):
+        """wrap original SAX2 callbacks to collect parse events"""
+        sax = c_ctxt.sax
+        # Unlike in _connectTarget(), the original callbacks are saved
+        # here and stay installed unless a wrapper replaces them.
+        self._origSaxStartDocument = sax.startDocument
+        sax.startDocument = _handleSaxStartDocument
+        self._origSaxStart = sax.startElementNs
+        self._origSaxStartNoNs = sax.startElement
+        # only override start event handler if needed
+        if self._event_filter == 0 or \
+               self._event_filter & (PARSE_EVENT_FILTER_START |
+                                     PARSE_EVENT_FILTER_END |
+                                     PARSE_EVENT_FILTER_START_NS |
+                                     PARSE_EVENT_FILTER_END_NS):
+            sax.startElementNs = <xmlparser.startElementNsSAX2Func>_handleSaxStart
+            sax.startElement = <xmlparser.startElementSAXFunc>_handleSaxStartNoNs
+
+        self._origSaxEnd = sax.endElementNs
+        self._origSaxEndNoNs = sax.endElement
+        # only override end event handler if needed
+        if self._event_filter == 0 or \
+               self._event_filter & (PARSE_EVENT_FILTER_END |
+                                     PARSE_EVENT_FILTER_END_NS):
+            sax.endElementNs = <xmlparser.endElementNsSAX2Func>_handleSaxEnd
+            sax.endElement = <xmlparser.endElementSAXFunc>_handleSaxEndNoNs
+
+        self._origSaxComment = sax.comment
+        if self._event_filter & PARSE_EVENT_FILTER_COMMENT:
+            sax.comment = <xmlparser.commentSAXFunc>_handleSaxComment
+
+        self._origSaxPI = sax.processingInstruction
+        if self._event_filter & PARSE_EVENT_FILTER_PI:
+            sax.processingInstruction = <xmlparser.processingInstructionSAXFunc>_handleSaxPIEvent
+
+    cdef _setEventFilter(self, events, tag):
+        # Build the event bit mask from the event names.  A tag matcher
+        # is only created if events are collected and 'tag' is neither
+        # None nor the '*' wildcard.
+        self._event_filter = _buildParseEventFilter(events)
+        if not self._event_filter or tag is None or tag == '*':
+            self._matcher = None
+        else:
+            self._matcher = _MultiTagMatcher(tag)
+
+    cdef int startDocument(self, xmlDoc* c_doc) except -1:
+        # Create the document proxy for c_doc; the parser reference is
+        # dropped even if that fails.
+        try:
+            self._doc = _documentFactory(c_doc, self._parser)
+        finally:
+            self._parser = None  # clear circular reference ASAP
+        if self._matcher is not None:
+            self._matcher.cacheTags(self._doc, True) # force entry in libxml2 dict
+        return 0
+
+    cdef int pushEvent(self, event, xmlNode* c_node) except -1:
+        # Append an (event, element) tuple for c_node to the event list.
+        cdef _Element root
+        if self._root is None:
+            # remember the root once the document has a root element
+            root = self._doc.getroot()
+            if root is not None and root._c_node.type == tree.XML_ELEMENT_NODE:
+                self._root = root
+        node = _elementFactory(self._doc, c_node)
+        self.events_iterator._events.append( (event, node) )
+        return 0
+
+    cdef int flushEvents(self) except -1:
+        # Emit 'end' events for all nodes that are still on the node
+        # stack, then let _pushSaxNsEndEvents() work off the remaining
+        # entries of the namespace stack.
+        events = self.events_iterator._events
+        while self._node_stack:
+            events.append( ('end', self._node_stack.pop()) )
+            _pushSaxNsEndEvents(self)
+        while self._ns_stack:
+            _pushSaxNsEndEvents(self)
+
+    cdef void _handleSaxException(self, xmlparser.xmlParserCtxt* c_ctxt):
+        # Called from the 'except' branch of the SAX callbacks: mark the
+        # parser context as failed and store the raised exception.
+        if c_ctxt.errNo == xmlerror.XML_ERR_OK:
+            c_ctxt.errNo = xmlerror.XML_ERR_INTERNAL_ERROR
+        # stop parsing immediately
+        c_ctxt.wellFormed = 0
+        c_ctxt.disableSAX = 1
+        self._store_raised()
+
+
+@cython.final
+@cython.internal
+cdef class _ParseEventsIterator:
+    """Iterator over a growing list of parse events.
+
+    It can be used again after it was exhausted, once new events were
+    appended to the list.
+    """
+    cdef list _events
+    cdef int _event_index
+
+    def __cinit__(self):
+        self._events = []
+        self._event_index = 0
+
+    def __iter__(self):
+        return self
+
+    def __next__(self):
+        pending = self._events
+        pos = self._event_index
+        if pos * 2 >= len(pending):
+            # at least half of the list has been handed out already
+            if pos:
+                # drop the consumed head and restart at the front
+                del pending[:pos]
+                self._event_index = pos = 0
+            if pos >= len(pending):
+                raise StopIteration
+        next_event = pending[pos]
+        self._event_index = pos + 1
+        return next_event
+
+
+cdef int _appendNsEvents(_SaxParserContext context, int c_nb_namespaces,
+                         const_xmlChar** c_namespaces) except -1:
+    # Append one ("start-ns", (prefix, uri)) event per namespace.  The
+    # array holds c_nb_namespaces pairs, read as prefix, then URI.
+    cdef int i
+    for i in xrange(c_nb_namespaces):
+        prefix = funicodeOrEmpty(c_namespaces[2 * i])
+        uri = funicode(c_namespaces[2 * i + 1])
+        context.events_iterator._events.append( ("start-ns", (prefix, uri)) )
+    return 0
+
+
+cdef void _handleSaxStart(
+        void* ctxt, const_xmlChar* c_localname, const_xmlChar* c_prefix,
+        const_xmlChar* c_namespace, int c_nb_namespaces,
+        const_xmlChar** c_namespaces,
+        int c_nb_attributes, int c_nb_defaulted,
+        const_xmlChar** c_attributes) with gil:
+    # SAX2 start-element callback for event collection: records the
+    # namespace events, calls the original callback and then pushes the
+    # start event.  Exceptions are stored on the context, never raised.
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        if (c_nb_namespaces and
+                context._event_filter & PARSE_EVENT_FILTER_START_NS):
+            _appendNsEvents(context, c_nb_namespaces, c_namespaces)
+        # call the callback that was installed before this wrapper
+        context._origSaxStart(c_ctxt, c_localname, c_prefix, c_namespace,
+                              c_nb_namespaces, c_namespaces, c_nb_attributes,
+                              c_nb_defaulted, c_attributes)
+        if c_ctxt.html:
+            _fixHtmlDictNodeNames(c_ctxt.dict, c_ctxt.node)
+
+        if context._event_filter & PARSE_EVENT_FILTER_END_NS:
+            # remember the namespace count of this element
+            context._ns_stack.append(c_nb_namespaces)
+        if context._event_filter & (PARSE_EVENT_FILTER_END |
+                                    PARSE_EVENT_FILTER_START):
+            _pushSaxStartEvent(context, c_ctxt, c_namespace,
+                               c_localname, None)
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+cdef void _handleSaxTargetStart(
+        void* ctxt, const_xmlChar* c_localname, const_xmlChar* c_prefix,
+        const_xmlChar* c_namespace, int c_nb_namespaces,
+        const_xmlChar** c_namespaces,
+        int c_nb_attributes, int c_nb_defaulted,
+        const_xmlChar** c_attributes) with gil:
+    # SAX2 start-element callback for parser targets: builds the attrib
+    # and nsmap mappings from the C arrays and passes them to the target
+    # instead of calling an original callback.  Exceptions are stored on
+    # the context, never raised.
+    cdef int i
+    cdef size_t c_len
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        if (c_nb_namespaces and
+                context._event_filter & PARSE_EVENT_FILTER_START_NS):
+            _appendNsEvents(context, c_nb_namespaces, c_namespaces)
+        if c_nb_defaulted > 0:
+            # only add default attributes if we asked for them
+            if c_ctxt.loadsubset & xmlparser.XML_COMPLETE_ATTRS == 0:
+                c_nb_attributes -= c_nb_defaulted
+        if c_nb_attributes == 0:
+            attrib = IMMUTABLE_EMPTY_MAPPING
+        else:
+            attrib = {}
+            # Each attribute takes five array entries.  Entries 2 and 0
+            # form the name, entries 3 and 4 are the start and end
+            # pointers of the value.
+            # NOTE(review): presumably the libxml2 SAX2 layout (localname,
+            # prefix, URI, value, end) - confirm
+            for i in xrange(c_nb_attributes):
+                name = _namespacedNameFromNsName(
+                    c_attributes[2], c_attributes[0])
+                if c_attributes[3] is NULL:
+                    value = ''
+                else:
+                    c_len = c_attributes[4] - c_attributes[3]
+                    value = c_attributes[3][:c_len].decode('utf8')
+                attrib[name] = value
+                c_attributes += 5
+        if c_nb_namespaces == 0:
+            nsmap = IMMUTABLE_EMPTY_MAPPING
+        else:
+            nsmap = {}
+            # namespaces come as (prefix, URI) pairs
+            for i in xrange(c_nb_namespaces):
+                prefix = funicodeOrNone(c_namespaces[0])
+                nsmap[prefix] = funicode(c_namespaces[1])
+                c_namespaces += 2
+        element = _callTargetSaxStart(
+            context, c_ctxt,
+            _namespacedNameFromNsName(c_namespace, c_localname),
+            attrib, nsmap)
+
+        if context._event_filter & PARSE_EVENT_FILTER_END_NS:
+            context._ns_stack.append(c_nb_namespaces)
+        if context._event_filter & (PARSE_EVENT_FILTER_END |
+                                    PARSE_EVENT_FILTER_START):
+            _pushSaxStartEvent(context, c_ctxt, c_namespace,
+                               c_localname, element)
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+cdef void _handleSaxStartNoNs(void* ctxt, const_xmlChar* c_name,
+                              const_xmlChar** c_attributes) with gil:
+    # Start-element callback without namespace support, for event
+    # collection: calls the original callback, then pushes the start
+    # event.  Exceptions are stored on the context, never raised.
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        context._origSaxStartNoNs(c_ctxt, c_name, c_attributes)
+        if c_ctxt.html:
+            _fixHtmlDictNodeNames(c_ctxt.dict, c_ctxt.node)
+        if context._event_filter & (PARSE_EVENT_FILTER_END |
+                                    PARSE_EVENT_FILTER_START):
+            _pushSaxStartEvent(context, c_ctxt, NULL, c_name, None)
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+# SAX start-element callback for the non-namespace parser interface when
+# events are forwarded to a parser target.  Converts the C attribute array
+# into a Python dict, passes tag and attributes to the target via
+# _callTargetSaxStart() and registers the returned element with
+# _pushSaxStartEvent() if 'start' or 'end' events were requested.
+# Exceptions are handed to the context's _handleSaxException().
+cdef void _handleSaxTargetStartNoNs(void* ctxt, const_xmlChar* c_name,
+                                    const_xmlChar** c_attributes) with gil:
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # no context object attached to this parser context => nothing to do
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        if c_attributes is NULL:
+            # share one immutable mapping instead of creating empty dicts
+            attrib = IMMUTABLE_EMPTY_MAPPING
+        else:
+            attrib = {}
+            # the array holds (name, value) pointer pairs and is
+            # terminated by a NULL name
+            while c_attributes[0] is not NULL:
+                name = funicode(c_attributes[0])
+                attrib[name] = funicodeOrEmpty(c_attributes[1])
+                c_attributes += 2
+        # this interface carries no namespace declarations => empty nsmap
+        element = _callTargetSaxStart(
+            context, c_ctxt, funicode(c_name),
+            attrib, IMMUTABLE_EMPTY_MAPPING)
+        if context._event_filter & (PARSE_EVENT_FILTER_END |
+                                    PARSE_EVENT_FILTER_START):
+            _pushSaxStartEvent(context, c_ctxt, NULL, c_name, element)
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+cdef _callTargetSaxStart(_SaxParserContext context,
+                         xmlparser.xmlParserCtxt* c_ctxt,
+                         tag, attrib, nsmap):
+    # Forward a start event to the parser target and return whatever the
+    # target produced.  If that result is an _Element and the parser has
+    # a current input, the input's line number is stored on the element's
+    # C node, capped at 65535.
+    result = context._target._handleSaxStart(tag, attrib, nsmap)
+    if (result is not None and c_ctxt.input is not NULL
+            and isinstance(result, _Element)):
+        if c_ctxt.input.line < 65535:
+            (<_Element>result)._c_node.line = <unsigned short>c_ctxt.input.line
+        else:
+            (<_Element>result)._c_node.line = 65535
+    return result
+
+
+cdef int _pushSaxStartEvent(_SaxParserContext context,
+                            xmlparser.xmlParserCtxt* c_ctxt,
+                            const_xmlChar* c_href,
+                            const_xmlChar* c_name, node) except -1:
+    # Register a started element: append a ('start', node) event if start
+    # events are requested and, when no parser target is used, remember
+    # the node on the node stack so the end event can pick it up again.
+    # Elements rejected by the tag matcher are ignored.
+    cdef bint without_target
+    if (context._matcher is not None and
+            not context._matcher.matchesNsTag(c_href, c_name)):
+        return 0
+    without_target = context._target is None
+    if node is None and without_target:
+        assert context._doc is not None
+        node = _elementFactory(context._doc, c_ctxt.node)
+    if context._event_filter & PARSE_EVENT_FILTER_START:
+        context.events_iterator._events.append(('start', node))
+    if without_target and context._event_filter & PARSE_EVENT_FILTER_END:
+        context._node_stack.append(node)
+    return 0
+
+
+# SAX end-element callback for the namespace-aware parser interface.
+# With a parser target, the target's _handleSaxEnd() receives the
+# namespace-qualified tag name and its result becomes the event node;
+# otherwise the saved original handler is called.  Afterwards the 'end'
+# event and any pending 'end-ns' events are pushed.  Exceptions are handed
+# to the context's _handleSaxException().
+cdef void _handleSaxEnd(void* ctxt, const_xmlChar* c_localname,
+                        const_xmlChar* c_prefix,
+                        const_xmlChar* c_namespace) with gil:
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # no context object attached to this parser context => nothing to do
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        if context._target is not None:
+            node = context._target._handleSaxEnd(
+                _namespacedNameFromNsName(c_namespace, c_localname))
+        else:
+            context._origSaxEnd(c_ctxt, c_localname, c_prefix, c_namespace)
+            # without a target, _pushSaxEndEvent() takes the node from
+            # the context's node stack instead
+            node = None
+        _pushSaxEndEvent(context, c_namespace, c_localname, node)
+        _pushSaxNsEndEvents(context)
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+# SAX end-element callback for the non-namespace parser interface.
+# With a parser target, the target's _handleSaxEnd() receives the tag name
+# and its result becomes the event node; otherwise the saved original
+# handler is called.  Afterwards the 'end' event is pushed.  Exceptions
+# are handed to the context's _handleSaxException().
+cdef void _handleSaxEndNoNs(void* ctxt, const_xmlChar* c_name) with gil:
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # no context object attached to this parser context => nothing to do
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        if context._target is not None:
+            node = context._target._handleSaxEnd(funicode(c_name))
+        else:
+            context._origSaxEndNoNs(c_ctxt, c_name)
+            # without a target, _pushSaxEndEvent() takes the node from
+            # the context's node stack instead
+            node = None
+        _pushSaxEndEvent(context, NULL, c_name, node)
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+# shared, pre-built event tuple appended once per closed namespace
+# declaration by _pushSaxNsEndEvents()
+cdef tuple NS_END_EVENT = ('end-ns', None)
+
+
+cdef int _pushSaxNsEndEvents(_SaxParserContext context) except -1:
+    # If 'end-ns' events are requested, pop the namespace count recorded
+    # for the element being closed and append that many 'end-ns' events.
+    cdef int remaining
+    if not (context._event_filter & PARSE_EVENT_FILTER_END_NS):
+        return 0
+    remaining = context._ns_stack.pop()
+    while remaining > 0:
+        context.events_iterator._events.append(NS_END_EVENT)
+        remaining -= 1
+    return 0
+
+
+cdef int _pushSaxEndEvent(_SaxParserContext context,
+                          const_xmlChar* c_href,
+                          const_xmlChar* c_name, node) except -1:
+    # Append an ('end', node) event if end events are requested and the
+    # tag passes the matcher.  Without a parser target, the node is the
+    # one popped from the context's node stack rather than the argument.
+    if not (context._event_filter & PARSE_EVENT_FILTER_END):
+        return 0
+    if (context._matcher is not None and
+            not context._matcher.matchesNsTag(c_href, c_name)):
+        return 0
+    if context._target is None:
+        node = context._node_stack.pop()
+    context.events_iterator._events.append(('end', node))
+    return 0
+
+
+# SAX character-data callback: decodes data_len bytes of c_data as UTF-8
+# and passes the resulting string to the parser target's _handleSaxData().
+# Exceptions are handed to the context's _handleSaxException().
+cdef void _handleSaxData(void* ctxt, const_xmlChar* c_data, int data_len) with gil:
+    # can only be called if parsing with a target
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # skip if no context object is attached or SAX processing is disabled
+    if c_ctxt._private is NULL or c_ctxt.disableSAX:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        # slice by length: the data is not read as a NUL-terminated string
+        context._target._handleSaxData(
+            c_data[:data_len].decode('utf8'))
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+# SAX doctype callback: passes the doctype name, public ID and system ID
+# (each converted to a string, or None when the pointer is NULL) to the
+# parser target's _handleSaxDoctype().  Exceptions are handed to the
+# context's _handleSaxException().
+cdef void _handleSaxTargetDoctype(void* ctxt, const_xmlChar* c_name,
+                                  const_xmlChar* c_public,
+                                  const_xmlChar* c_system) with gil:
+    # can only be called if parsing with a target
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # same guard as the other target callbacks: without an attached
+    # context object the cast below would produce an invalid reference
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        context._target._handleSaxDoctype(
+            funicodeOrNone(c_name),
+            funicodeOrNone(c_public),
+            funicodeOrNone(c_system))
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+# SAX start-document callback: runs the saved original handler, makes the
+# new document share the parser's name dictionary and then notifies the
+# context through startDocument().  Exceptions raised by startDocument()
+# are handed to the context's _handleSaxException().
+cdef void _handleSaxStartDocument(void* ctxt) with gil:
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # same guard as the element callbacks: without an attached context
+    # object the cast below would produce an invalid reference
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    context._origSaxStartDocument(ctxt)
+    c_doc = c_ctxt.myDoc
+    if c_doc and c_ctxt.dict and not c_doc.dict:
+        # I have no idea why libxml2 disables this - we need it
+        c_ctxt.dictNames = 1
+        c_doc.dict = c_ctxt.dict
+        # the document now holds its own reference to the dictionary
+        xmlparser.xmlDictReference(c_ctxt.dict)
+    try:
+        context.startDocument(c_doc)
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+# SAX processing-instruction callback for parser targets: passes the PI
+# target (None if NULL) and data (empty string if NULL) to the target's
+# _handleSaxPi() and appends a ('pi', result) event if PI events were
+# requested.  Exceptions are handed to the context's
+# _handleSaxException().
+cdef void _handleSaxPI(void* ctxt, const_xmlChar* c_target,
+                       const_xmlChar* c_data) with gil:
+    # can only be called if parsing with a target
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # no context object attached to this parser context => nothing to do
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        pi = context._target._handleSaxPi(
+            funicodeOrNone(c_target),
+            funicodeOrEmpty(c_data))
+        if context._event_filter & PARSE_EVENT_FILTER_PI:
+            context.events_iterator._events.append(('pi', pi))
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+# SAX processing-instruction callback used without a parser target: runs
+# the saved original handler, looks up the node it created with
+# _findLastEventNode() and pushes a 'pi' event for it.  Exceptions raised
+# while pushing the event are handed to the context's
+# _handleSaxException().
+cdef void _handleSaxPIEvent(void* ctxt, const_xmlChar* target,
+                            const_xmlChar* data) with gil:
+    # can only be called when collecting pi events
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # same guard as the element callbacks: without an attached context
+    # object the cast below would produce an invalid reference
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    context._origSaxPI(ctxt, target, data)
+    c_node = _findLastEventNode(c_ctxt)
+    # no node found => nothing to report
+    if c_node is NULL:
+        return
+    try:
+        context.pushEvent('pi', c_node)
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+# SAX comment callback for parser targets: passes the comment text (empty
+# string if NULL) to the target's _handleSaxComment() and appends a
+# ('comment', result) event if comment events were requested.  Exceptions
+# are handed to the context's _handleSaxException().
+cdef void _handleSaxTargetComment(void* ctxt, const_xmlChar* c_data) with gil:
+    # can only be called if parsing with a target
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # no context object attached to this parser context => nothing to do
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    try:
+        comment = context._target._handleSaxComment(funicodeOrEmpty(c_data))
+        if context._event_filter & PARSE_EVENT_FILTER_COMMENT:
+            context.events_iterator._events.append(('comment', comment))
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+# SAX comment callback used without a parser target: runs the saved
+# original handler, looks up the node it created with
+# _findLastEventNode() and pushes a 'comment' event for it.  Exceptions
+# raised while pushing the event are handed to the context's
+# _handleSaxException().
+cdef void _handleSaxComment(void* ctxt, const_xmlChar* text) with gil:
+    # can only be called when collecting comment events
+    c_ctxt = <xmlparser.xmlParserCtxt*>ctxt
+    # same guard as the element callbacks: without an attached context
+    # object the cast below would produce an invalid reference
+    if c_ctxt._private is NULL:
+        return
+    context = <_SaxParserContext>c_ctxt._private
+    context._origSaxComment(ctxt, text)
+    c_node = _findLastEventNode(c_ctxt)
+    # no node found => nothing to report
+    if c_node is NULL:
+        return
+    try:
+        context.pushEvent('comment', c_node)
+    except:
+        context._handleSaxException(c_ctxt)
+    finally:
+        return  # swallow any further exceptions
+
+
+cdef inline xmlNode* _findLastEventNode(xmlparser.xmlParserCtxt* c_ctxt):
+    # Return the node most recently added for a comment/PI, following the
+    # places where libxml2 puts such nodes: the internal or external DTD
+    # subset, the document itself, or the current node's children/siblings.
+    cdef xmlNode* c_current = c_ctxt.node
+    if c_ctxt.inSubset == 1:
+        return c_ctxt.myDoc.intSubset.last
+    if c_ctxt.inSubset == 2:
+        return c_ctxt.myDoc.extSubset.last
+    if c_current is NULL:
+        return c_ctxt.myDoc.last
+    if c_current.type == tree.XML_ELEMENT_NODE:
+        return c_current.last
+    return c_current.next
+
+
+############################################################
+## ET compatible XML tree builder
+############################################################
+
+cdef class TreeBuilder(_SaxParserTarget):
+    u"""TreeBuilder(self, element_factory=None, parser=None)
+    Parser target that builds a tree.
+
+    The final tree is returned by the ``close()`` method.
+    """
+    # parser passed to _makeElement() when the root element is created
+    cdef _BaseParser _parser
+    # optional callable(tag, attrib) used to create elements
+    cdef object _factory
+    # text chunks collected since the last flush
+    cdef list _data
+    # currently open elements, innermost last
+    cdef list _element_stack
+    # cached bound method self._element_stack.pop
+    cdef object _element_stack_pop
+    cdef _Element _last # may be None
+    # true => pending text is the tail of _last, false => its text
+    cdef bint _in_tail
+
+    def __init__(self, *, element_factory=None, parser=None):
+        # events that this target wants to receive from the parser
+        self._sax_event_filter = \
+            SAX_EVENT_START | SAX_EVENT_END | SAX_EVENT_DATA | \
+            SAX_EVENT_PI | SAX_EVENT_COMMENT
+        self._data = [] # data collector
+        self._element_stack = [] # element stack
+        self._element_stack_pop = self._element_stack.pop
+        self._last = None # last element
+        self._in_tail = 0 # true if we're after an end tag
+        self._factory = element_factory
+        self._parser = parser
+
+    # Join the collected text chunks and store them as .text or .tail of
+    # the last node (depending on _in_tail), then empty the collector.
+    # Collected text is dropped if there is no last node yet.
+    @cython.final
+    cdef int _flush(self) except -1:
+        if self._data:
+            if self._last is not None:
+                text = u"".join(self._data)
+                if self._in_tail:
+                    assert self._last.tail is None, u"internal error (tail)"
+                    self._last.tail = text
+                else:
+                    assert self._last.text is None, u"internal error (text)"
+                    self._last.text = text
+            # clear in place: the list object itself is kept
+            del self._data[:]
+        return 0
+
+    # internal SAX event handlers
+
+    # Open a new element: created by the factory if one was given,
+    # otherwise as a subelement of the innermost open element or, for the
+    # first element, as a new root.  Returns the new element.
+    @cython.final
+    cdef _handleSaxStart(self, tag, attrib, nsmap):
+        self._flush()
+        if self._factory is not None:
+            # note: the factory is called without the nsmap
+            self._last = self._factory(tag, attrib)
+            if self._element_stack:
+                _appendChild(self._element_stack[-1], self._last)
+        elif self._element_stack:
+            self._last = _makeSubElement(
+                self._element_stack[-1], tag, None, None, attrib, nsmap, None)
+        else:
+            self._last = _makeElement(
+                tag, NULL, None, self._parser, None, None, attrib, nsmap, None)
+        self._element_stack.append(self._last)
+        # text that follows belongs to the new element's .text
+        self._in_tail = 0
+        return self._last
+
+    # Close the innermost open element and return it.  The tag argument
+    # is not checked here.
+    @cython.final
+    cdef _handleSaxEnd(self, tag):
+        self._flush()
+        self._last = self._element_stack_pop()
+        # text that follows belongs to the closed element's .tail
+        self._in_tail = 1
+        return self._last
+
+    # Collect a chunk of text; it is attached to a node on the next flush.
+    @cython.final
+    cdef int _handleSaxData(self, data) except -1:
+        self._data.append(data)
+
+    # Create a processing instruction, append it to the innermost open
+    # element (if any) and return it.
+    @cython.final
+    cdef _handleSaxPi(self, target, data):
+        self._flush()
+        self._last = ProcessingInstruction(target, data)
+        if self._element_stack:
+            _appendChild(self._element_stack[-1], self._last)
+        self._in_tail = 1
+        return self._last
+
+    # Create a comment, append it to the innermost open element (if any)
+    # and return it.
+    @cython.final
+    cdef _handleSaxComment(self, comment):
+        self._flush()
+        self._last = Comment(comment)
+        if self._element_stack:
+            _appendChild(self._element_stack[-1], self._last)
+        self._in_tail = 1
+        return self._last
+
+    # Python level event handlers
+
+    def close(self):
+        u"""close(self)
+
+        Flushes the builder buffers, and returns the toplevel document
+        element.
+        """
+        assert not self._element_stack, u"missing end tags"
+        assert self._last is not None, u"missing toplevel element"
+        return self._last
+
+    def data(self, data):
+        u"""data(self, data)
+
+        Adds text to the current element.  The value should be either an
+        8-bit string containing ASCII text, or a Unicode string.
+        """
+        self._handleSaxData(data)
+
+    def start(self, tag, attrs, nsmap=None):
+        u"""start(self, tag, attrs, nsmap=None)
+
+        Opens a new element.
+        """
+        if nsmap is None:
+            nsmap = IMMUTABLE_EMPTY_MAPPING
+        return self._handleSaxStart(tag, attrs, nsmap)
+
+    def end(self, tag):
+        u"""end(self, tag)
+
+        Closes the current element.
+        """
+        element = self._handleSaxEnd(tag)
+        # checked after the pop: self._last is the element just closed
+        assert self._last.tag == tag,\
+               u"end tag mismatch (expected %s, got %s)" % (
+                   self._last.tag, tag)
+        return element
+
+    def pi(self, target, data):
+        u"""pi(self, target, data)
+        """
+        return self._handleSaxPi(target, data)
+
+    def comment(self, comment):
+        u"""comment(self, comment)
+        """
+        return self._handleSaxComment(comment)
diff --git a/lib/lxml/schematron.pxi b/lib/lxml/schematron.pxi
new file mode 100644
index 00000000..f5e97d8c
--- /dev/null
+++ b/lib/lxml/schematron.pxi
@@ -0,0 +1,164 @@
+# support for Schematron validation
+from lxml.includes cimport schematron
+
+class SchematronError(LxmlError):
+    u"""Common base class for every Schematron related error.
+    """
+
+class SchematronParseError(SchematronError):
+    u"""Raised when an XML document cannot be parsed as a Schematron schema.
+    """
+
+class SchematronValidateError(SchematronError):
+    u"""Raised when validating an XML document against a Schematron schema
+    fails with an error.
+    """
+
+################################################################################
+# Schematron
+
+cdef class Schematron(_Validator):
+    u"""Schematron(self, etree=None, file=None)
+    A Schematron validator.
+
+    Pass a root Element or an ElementTree to turn it into a validator.
+    Alternatively, pass a filename as keyword argument 'file' to parse from
+    the file system.
+
+    Schematron is a less well known, but very powerful schema language.  The main
+    idea is to use the capabilities of XPath to put restrictions on the structure
+    and the content of XML documents.  Here is a simple example::
+
+      >>> schematron = Schematron(XML('''
+      ... <schema xmlns="http://www.ascc.net/xml/schematron" >
+      ...   <pattern name="id is the only permitted attribute name">
+      ...     <rule context="*">
+      ...       <report test="@*[not(name()='id')]">Attribute
+      ...         <name path="@*[not(name()='id')]"/> is forbidden<name/>
+      ...       </report>
+      ...     </rule>
+      ...   </pattern>
+      ... </schema>
+      ... '''))
+
+      >>> xml = XML('''
+      ... <AAA name="aaa">
+      ...   <BBB id="bbb"/>
+      ...   <CCC color="ccc"/>
+      ... </AAA>
+      ... ''')
+
+      >>> schematron.validate(xml)
+      0
+
+      >>> xml = XML('''
+      ... <AAA id="aaa">
+      ...   <BBB id="bbb"/>
+      ...   <CCC/>
+      ... </AAA>
+      ... ''')
+
+      >>> schematron.validate(xml)
+      1
+
+    Schematron was added to libxml2 in version 2.6.21.  Before version 2.6.32,
+    however, Schematron lacked support for error reporting other than to stderr.
+    This version is therefore required to retrieve validation warnings and
+    errors in lxml.
+    """
+    # compiled schema, NULL until __init__ has parsed it successfully
+    cdef schematron.xmlSchematron* _c_schema
+    # private copy of the schema document when built from a tree, else NULL
+    cdef xmlDoc* _c_schema_doc
+    def __cinit__(self):
+        # start from NULL pointers so that __dealloc__ is safe even if
+        # __init__ fails or never runs
+        self._c_schema = NULL
+        self._c_schema_doc = NULL
+
+    def __init__(self, etree=None, *, file=None):
+        # Build the validator from either a tree or a file.  Raises
+        # SchematronError if Schematron support is not compiled in,
+        # SchematronParseError if neither argument is given or the schema
+        # cannot be parsed, and MemoryError if no parser context could be
+        # created.
+        cdef _Document doc
+        cdef _Element root_node
+        cdef schematron.xmlSchematronParserCtxt* parser_ctxt
+        _Validator.__init__(self)
+        if not config.ENABLE_SCHEMATRON:
+            raise SchematronError(
+                u"lxml.etree was compiled without Schematron support.")
+        if etree is not None:
+            doc = _documentOrRaise(etree)
+            root_node = _rootNodeOrRaise(etree)
+            # work on a copy that is owned (and later freed) by this object
+            self._c_schema_doc = _copyDocRoot(doc._c_doc, root_node._c_node)
+            parser_ctxt = schematron.xmlSchematronNewDocParserCtxt(self._c_schema_doc)
+        elif file is not None:
+            filename = _getFilenameForFile(file)
+            if filename is None:
+                # XXX assume a string object
+                filename = file
+            filename = _encodeFilename(filename)
+            with self._error_log:
+                parser_ctxt = schematron.xmlSchematronNewParserCtxt(_cstr(filename))
+        else:
+            raise SchematronParseError(u"No tree or file given")
+
+        if parser_ctxt is NULL:
+            # release the document copy right away and reset the pointer
+            # so that __dealloc__ does not free it a second time
+            if self._c_schema_doc is not NULL:
+                tree.xmlFreeDoc(self._c_schema_doc)
+                self._c_schema_doc = NULL
+            raise MemoryError()
+
+        try:
+            with self._error_log:
+                self._c_schema = schematron.xmlSchematronParse(parser_ctxt)
+        finally:
+            # the parser context is only needed while parsing
+            schematron.xmlSchematronFreeParserCtxt(parser_ctxt)
+
+        if self._c_schema is NULL:
+            raise SchematronParseError(
+                u"Document is not a valid Schematron schema",
+                self._error_log)
+
+    def __dealloc__(self):
+        # free the compiled schema and the private document copy, if any
+        schematron.xmlSchematronFree(self._c_schema)
+        if self._c_schema_doc is not NULL:
+            tree.xmlFreeDoc(self._c_schema_doc)
+
+    def __call__(self, etree):
+        u"""__call__(self, etree)
+
+        Validate doc using Schematron.
+
+        Returns true if document is valid, false if not."""
+        cdef _Document doc
+        cdef _Element root_node
+        cdef xmlDoc* c_doc
+        cdef schematron.xmlSchematronValidCtxt* valid_ctxt
+        cdef int ret
+
+        assert self._c_schema is not NULL, "Schematron instance not initialised"
+        doc = _documentOrRaise(etree)
+        root_node = _rootNodeOrRaise(etree)
+
+        valid_ctxt = schematron.xmlSchematronNewValidCtxt(
+            self._c_schema, schematron.XML_SCHEMATRON_OUT_ERROR)
+        if valid_ctxt is NULL:
+            raise MemoryError()
+
+        try:
+            self._error_log.clear()
+            # route validation messages into this validator's error log
+            schematron.xmlSchematronSetValidStructuredErrors(
+                valid_ctxt, _receiveError, <void*>self._error_log)
+            # validate a document that has root_node as its root
+            c_doc = _fakeRootDoc(doc._c_doc, root_node._c_node)
+            with nogil:
+                ret = schematron.xmlSchematronValidateDoc(valid_ctxt, c_doc)
+            _destroyFakeDoc(doc._c_doc, c_doc)
+        finally:
+            schematron.xmlSchematronFreeValidCtxt(valid_ctxt)
+
+        if ret == -1:
+            raise SchematronValidateError(
+                u"Internal error in Schematron validation",
+                self._error_log)
+        # a result of 0 means that the document is valid
+        return ret == 0
diff --git a/lib/lxml/serializer.pxi b/lib/lxml/serializer.pxi
new file mode 100644
index 00000000..b8b81048
--- /dev/null
+++ b/lib/lxml/serializer.pxi
@@ -0,0 +1,903 @@
+# XML serialization and output functions
+
+cdef object GzipFile
+from gzip import GzipFile
+
+class SerialisationError(LxmlError):
+    u"""A libxml2 error that occurred during serialisation.
+
+    Raised by the serialisation helpers in this file when libxml2 reports
+    a failure other than running out of memory.
+    """
+
+# Serialisation methods known to the serializer.  _findOutputMethod()
+# maps the method names "xml", "html" and "text" to these values.
+cdef enum _OutputMethods:
+    OUTPUT_METHOD_XML
+    OUTPUT_METHOD_HTML
+    OUTPUT_METHOD_TEXT
+
+cdef int _findOutputMethod(method) except -1:
+    # Map a method name (case-insensitive "xml", "html" or "text") to its
+    # _OutputMethods value.  None selects XML; any other name raises
+    # ValueError.
+    cdef int c_method
+    if method is None:
+        return OUTPUT_METHOD_XML
+    lowered = method.lower()
+    if lowered == "xml":
+        c_method = OUTPUT_METHOD_XML
+    elif lowered == "html":
+        c_method = OUTPUT_METHOD_HTML
+    elif lowered == "text":
+        c_method = OUTPUT_METHOD_TEXT
+    else:
+        raise ValueError(u"unknown output method %r" % lowered)
+    return c_method
+
+# Collect the text content of c_node (and, if with_tail is set, the text
+# nodes that follow it) and return it as a string.
+#   encoding  - None, the _unicode marker, or the name of an encoding
+#   with_tail - also append the tail text of c_node
+# The result is a unicode string if encoding is _unicode, otherwise a byte
+# string (the UTF-8 buffer content as is, or re-encoded where needed).
+# Raises MemoryError if the buffer cannot be allocated and
+# SerialisationError if libxml2 fails to provide the content.
+cdef _textToString(xmlNode* c_node, encoding, bint with_tail):
+    cdef bint needs_conversion
+    cdef const_xmlChar* c_text
+    cdef xmlNode* c_text_node
+    cdef tree.xmlBuffer* c_buffer
+    cdef int error_result
+
+    c_buffer = tree.xmlBufferCreate()
+    if c_buffer is NULL:
+        raise MemoryError()
+
+    with nogil:
+        error_result = tree.xmlNodeBufGetContent(c_buffer, c_node)
+        if with_tail:
+            # append the text nodes that follow the node
+            c_text_node = _textNodeOrSkip(c_node.next)
+            while c_text_node is not NULL:
+                tree.xmlBufferWriteChar(c_buffer, <const_char*>c_text_node.content)
+                c_text_node = _textNodeOrSkip(c_text_node.next)
+        c_text = tree.xmlBufferContent(c_buffer)
+
+    if error_result < 0 or c_text is NULL:
+        tree.xmlBufferFree(c_buffer)
+        raise SerialisationError, u"Error during serialisation (out of memory?)"
+
+    try:
+        # the buffer holds UTF-8: conversion is only needed for unicode
+        # output or for a target encoding other than UTF-8
+        needs_conversion = 0
+        if encoding is _unicode:
+            needs_conversion = 1
+        elif encoding is not None:
+            # Python prefers lower case encoding names
+            encoding = encoding.lower()
+            if encoding not in (u'utf8', u'utf-8'):
+                if encoding == u'ascii':
+                    # for ASCII, convert only if isutf8() reports true
+                    if isutf8(c_text):
+                        # will raise a decode error below
+                        needs_conversion = 1
+                else:
+                    needs_conversion = 1
+
+        if needs_conversion:
+            text = python.PyUnicode_DecodeUTF8(
+                <const_char*>c_text, tree.xmlBufferLength(c_buffer), 'strict')
+            if encoding is not _unicode:
+                encoding = _utf8(encoding)
+                text = python.PyUnicode_AsEncodedString(
+                    text, encoding, 'strict')
+        else:
+            # copy the buffer content unchanged into a byte string
+            text = (<unsigned char*>c_text)[:tree.xmlBufferLength(c_buffer)]
+    finally:
+        # the buffer is released on success and on conversion errors
+        tree.xmlBufferFree(c_buffer)
+    return text
+
+
+# Serialise an element into a string.
+#   encoding - None, the _unicode marker, or the name of an encoding
+#   doctype  - optional doctype string written in front of the element
+#   method   - output method name as accepted by _findOutputMethod()
+# The remaining flags are passed on to _writeNodeToBuffer().
+# Returns None if element is None, a unicode string if encoding is
+# _unicode, and a byte string otherwise.  Raises LookupError for an
+# unknown encoding, MemoryError if no output buffer can be allocated and
+# whatever _raiseSerialisationError() raises if libxml2 reports an error.
+cdef _tostring(_Element element, encoding, doctype, method,
+               bint write_xml_declaration, bint write_complete_document,
+               bint pretty_print, bint with_tail, int standalone):
+    u"""Serialize an element to an encoded string representation of its XML
+    tree.
+    """
+    cdef tree.xmlOutputBuffer* c_buffer
+    cdef tree.xmlBuf* c_result_buffer
+    cdef tree.xmlCharEncodingHandler* enchandler
+    cdef const_char* c_enc
+    cdef const_xmlChar* c_version
+    cdef const_xmlChar* c_doctype
+    cdef int c_method
+    cdef int error_result
+    if element is None:
+        return None
+    _assertValidNode(element)
+    c_method = _findOutputMethod(method)
+    if c_method == OUTPUT_METHOD_TEXT:
+        # plain text output takes a separate code path
+        return _textToString(element._c_node, encoding, with_tail)
+    if encoding is None or encoding is _unicode:
+        c_enc = NULL
+    else:
+        encoding = _utf8(encoding)
+        c_enc = _cstr(encoding)
+    if doctype is None:
+        c_doctype = NULL
+    else:
+        doctype = _utf8(doctype)
+        c_doctype = _xcstr(doctype)
+    # it is necessary to *both* find the encoding handler *and* use the
+    # encoding during output
+    enchandler = tree.xmlFindCharEncodingHandler(c_enc)
+    if enchandler is NULL and c_enc is not NULL:
+        if encoding is not None:
+            # encoding was converted to bytes above; decode for the message
+            encoding = encoding.decode('UTF-8')
+        raise LookupError, u"unknown encoding: '%s'" % encoding
+    c_buffer = tree.xmlAllocOutputBuffer(enchandler)
+    if c_buffer is NULL:
+        tree.xmlCharEncCloseFunc(enchandler)
+        raise MemoryError()
+
+    with nogil:
+        _writeNodeToBuffer(c_buffer, element._c_node, c_enc, c_doctype, c_method,
+                           write_xml_declaration, write_complete_document,
+                           pretty_print, with_tail, standalone)
+        tree.xmlOutputBufferFlush(c_buffer)
+        # read the result from the conversion buffer if there is one
+        if c_buffer.conv is not NULL:
+            c_result_buffer = c_buffer.conv
+        else:
+            c_result_buffer = c_buffer.buffer
+
+    error_result = c_buffer.error
+    if error_result != xmlerror.XML_ERR_OK:
+        tree.xmlOutputBufferClose(c_buffer)
+        _raiseSerialisationError(error_result)
+
+    try:
+        if encoding is _unicode:
+            result = (<unsigned char*>tree.xmlBufContent(
+                c_result_buffer))[:tree.xmlBufUse(c_result_buffer)].decode('UTF-8')
+        else:
+            result = <bytes>(<unsigned char*>tree.xmlBufContent(
+                c_result_buffer))[:tree.xmlBufUse(c_result_buffer)]
+    finally:
+        # always close the output buffer, even if building the result failed
+        error_result = tree.xmlOutputBufferClose(c_buffer)
+    if error_result < 0:
+        _raiseSerialisationError(error_result)
+    return result
+
+# Serialise an element or a tree in canonical (C14N) form and return the
+# result as a byte string.
+#   exclusive             - passed to libxml2 as its exclusive flag
+#   with_comments         - passed to libxml2 as its with_comments flag
+#   inclusive_ns_prefixes - optional prefixes, converted with
+#                           _convert_ns_prefixes(); falsy means none
+# Raises C14NError if libxml2 reports a failure.
+cdef bytes _tostringC14N(element_or_tree, bint exclusive, bint with_comments, inclusive_ns_prefixes):
+    cdef xmlDoc* c_doc
+    cdef xmlChar* c_buffer = NULL
+    cdef int byte_count = -1
+    cdef bytes result
+    cdef _Document doc
+    cdef xmlChar **c_inclusive_ns_prefixes = NULL
+
+    if isinstance(element_or_tree, _Element):
+        _assertValidNode(<_Element>element_or_tree)
+        doc = (<_Element>element_or_tree)._doc
+        # serialise a document that has the element as its root
+        c_doc = _plainFakeRootDoc(doc._c_doc, (<_Element>element_or_tree)._c_node, 0)
+    else:
+        doc = _documentOrRaise(element_or_tree)
+        _assertValidDoc(doc)
+        c_doc = doc._c_doc
+
+    try:
+        # convert the prefixes inside the try block so that the document
+        # set up above is also cleaned up if the conversion raises
+        if inclusive_ns_prefixes:
+            c_inclusive_ns_prefixes = _convert_ns_prefixes(
+                c_doc.dict, inclusive_ns_prefixes)
+        with nogil:
+            byte_count = c14n.xmlC14NDocDumpMemory(
+                c_doc, NULL, exclusive, c_inclusive_ns_prefixes, with_comments, &c_buffer)
+    finally:
+        _destroyFakeDoc(doc._c_doc, c_doc)
+        if c_inclusive_ns_prefixes is not NULL:
+            python.PyMem_Free(c_inclusive_ns_prefixes)
+
+    if byte_count < 0 or c_buffer is NULL:
+        if c_buffer is not NULL:
+            tree.xmlFree(c_buffer)
+        raise C14NError, u"C14N failed"
+    try:
+        result = c_buffer[:byte_count]
+    finally:
+        # the buffer was allocated by libxml2 and must be freed here
+        tree.xmlFree(c_buffer)
+    return result
+
+cdef _raiseSerialisationError(int error_result):
+    # Turn a libxml2 error code into an exception: MemoryError for the
+    # out-of-memory code, otherwise SerialisationError carrying the name
+    # of the error code (or a generic text if the code has no name).
+    if error_result == xmlerror.XML_ERR_NO_MEMORY:
+        raise MemoryError()
+    error_name = ErrorTypes._getName(error_result)
+    if error_name is not None:
+        raise SerialisationError, error_name
+    raise SerialisationError, u"unknown error %d" % error_result
+
+############################################################
+# low-level serialisation functions
+
+cdef void _writeDoctype(tree.xmlOutputBuffer* c_buffer,
+                        const_xmlChar* c_doctype) nogil:
+    # Write the given doctype string to the buffer, followed by a newline.
+    cdef int c_length = tree.xmlStrlen(c_doctype)
+    tree.xmlOutputBufferWrite(c_buffer, c_length, <const_char*>c_doctype)
+    tree.xmlOutputBufferWriteString(c_buffer, "\n")
+
+# Write a node, plus the requested surrounding parts, to an output buffer.
+# In output order: the XML declaration (XML method only), the doctype
+# string or the internal DTD subset, preceding siblings, the node itself,
+# its tail text, following siblings and a final newline when pretty
+# printing.  Errors are reported through c_buffer.error; once it is set,
+# the remaining parts are skipped.
+cdef void _writeNodeToBuffer(tree.xmlOutputBuffer* c_buffer,
+                             xmlNode* c_node, const_char* encoding, const_xmlChar* c_doctype,
+                             int c_method, bint write_xml_declaration,
+                             bint write_complete_document,
+                             bint pretty_print, bint with_tail,
+                             int standalone) nogil:
+    cdef xmlNode* c_nsdecl_node
+    cdef xmlDoc* c_doc = c_node.doc
+    if write_xml_declaration and c_method == OUTPUT_METHOD_XML:
+        _writeDeclarationToBuffer(c_buffer, c_doc.version, encoding, standalone)
+    if c_doctype:
+        _writeDoctype(c_buffer, c_doctype)
+    # write internal DTD subset, preceding PIs/comments, etc.
+    if write_complete_document and not c_buffer.error:
+        # an explicitly given doctype replaces the document's own DTD
+        if c_doctype is NULL:
+            _writeDtdToBuffer(c_buffer, c_doc, c_node.name, encoding)
+        _writePrevSiblings(c_buffer, c_node, encoding, pretty_print)
+
+    c_nsdecl_node = c_node
+    if not c_node.parent or c_node.parent.type != tree.XML_DOCUMENT_NODE:
+        # copy the node and add namespaces from parents
+        # this is required to make libxml write them
+        c_nsdecl_node = tree.xmlCopyNode(c_node, 2)
+        if not c_nsdecl_node:
+            c_buffer.error = xmlerror.XML_ERR_NO_MEMORY
+            return
+        _copyParentNamespaces(c_node, c_nsdecl_node)
+
+        # let the copy borrow the parent and children of the original
+        c_nsdecl_node.parent = c_node.parent
+        c_nsdecl_node.children = c_node.children
+        c_nsdecl_node.last = c_node.last
+
+    # write node
+    if c_method == OUTPUT_METHOD_HTML:
+        tree.htmlNodeDumpFormatOutput(
+            c_buffer, c_doc, c_nsdecl_node, encoding, pretty_print)
+    else:
+        tree.xmlNodeDumpOutput(
+            c_buffer, c_doc, c_nsdecl_node, 0, pretty_print, encoding)
+
+    if c_nsdecl_node is not c_node:
+        # clean up
+        # detach the borrowed children first so that freeing the copy
+        # leaves them in place on the original node
+        c_nsdecl_node.children = c_nsdecl_node.last = NULL
+        tree.xmlFreeNode(c_nsdecl_node)
+
+    if c_buffer.error:
+        return
+
+    # write tail, trailing comments, etc.
+    if with_tail:
+        _writeTail(c_buffer, c_node, encoding, c_method, pretty_print)
+    if write_complete_document:
+        _writeNextSiblings(c_buffer, c_node, encoding, pretty_print)
+    if pretty_print:
+        tree.xmlOutputBufferWrite(c_buffer, 1, "\n")
+
+# Write an XML declaration of the form
+#   <?xml version='...' encoding='...'?>
+# followed by a newline.  A standalone value of 0 adds standalone='no',
+# 1 adds standalone='yes', any other value leaves the attribute out.
+# The integer passed to each xmlOutputBufferWrite() call is the byte
+# length of the literal that follows it.
+cdef void _writeDeclarationToBuffer(tree.xmlOutputBuffer* c_buffer,
+                                    const_xmlChar* version, const_char* encoding,
+                                    int standalone) nogil:
+    if version is NULL:
+        # fall back to XML 1.0 if no version is given
+        version = <unsigned char*>"1.0"
+    tree.xmlOutputBufferWrite(c_buffer, 15, "<?xml version='")
+    tree.xmlOutputBufferWriteString(c_buffer, <const_char*>version)
+    tree.xmlOutputBufferWrite(c_buffer, 12, "' encoding='")
+    tree.xmlOutputBufferWriteString(c_buffer, encoding)
+    if standalone == 0:
+        tree.xmlOutputBufferWrite(c_buffer, 20, "' standalone='no'?>\n")
+    elif standalone == 1:
+        tree.xmlOutputBufferWrite(c_buffer, 21, "' standalone='yes'?>\n")
+    else:
+        tree.xmlOutputBufferWrite(c_buffer, 4, "'?>\n")
+
+# Write the DOCTYPE declaration for the internal DTD subset of c_doc.
+# Nothing is written if the document has no named internal subset or if
+# the DTD name differs from c_root_name.  The external identifiers are
+# written as PUBLIC "pubid" "sysid", PUBLIC "pubid" or SYSTEM "sysid",
+# depending on which of them are set and non-empty.  If the DTD has
+# content, it is written inside [ ... ].  An allocation failure is
+# reported through c_buffer.error.
+cdef void _writeDtdToBuffer(tree.xmlOutputBuffer* c_buffer,
+                            xmlDoc* c_doc, const_xmlChar* c_root_name,
+                            const_char* encoding) nogil:
+    cdef tree.xmlDtd* c_dtd
+    cdef xmlNode* c_node
+    cdef tree.xmlBuffer* c_buf
+    cdef const_xmlChar* c_public_id
+    cdef const_xmlChar* c_system_id
+    c_dtd = c_doc.intSubset
+    if not c_dtd or not c_dtd.name:
+        return
+    if tree.xmlStrcmp(c_root_name, c_dtd.name) != 0:
+        return
+    tree.xmlOutputBufferWrite(c_buffer, 10, "<!DOCTYPE ")
+    tree.xmlOutputBufferWriteString(c_buffer, <const_char*>c_dtd.name)
+
+    # treat empty identifiers like missing ones
+    c_public_id = c_dtd.ExternalID
+    if c_public_id is not NULL and c_public_id[0] == c'\0':
+        c_public_id = NULL
+    c_system_id = c_dtd.SystemID
+    if c_system_id is not NULL and c_system_id[0] == c'\0':
+        c_system_id = NULL
+
+    if c_public_id is not NULL:
+        # a public ID is written even if there is no system ID, so that
+        # it does not get lost on output
+        tree.xmlOutputBufferWrite(c_buffer, 9, ' PUBLIC "')
+        tree.xmlOutputBufferWriteString(c_buffer, <const_char*>c_public_id)
+        tree.xmlOutputBufferWrite(c_buffer, 1, '"')
+        if c_system_id is not NULL:
+            tree.xmlOutputBufferWrite(c_buffer, 2, ' "')
+            tree.xmlOutputBufferWriteString(c_buffer, <const_char*>c_system_id)
+            tree.xmlOutputBufferWrite(c_buffer, 1, '"')
+    elif c_system_id is not NULL:
+        tree.xmlOutputBufferWrite(c_buffer, 9, ' SYSTEM "')
+        tree.xmlOutputBufferWriteString(c_buffer, <const_char*>c_system_id)
+        tree.xmlOutputBufferWrite(c_buffer, 1, '"')
+
+    if not c_dtd.entities and not c_dtd.elements and \
+           not c_dtd.attributes and not c_dtd.notations and \
+           not c_dtd.pentities:
+        # no DTD content => close the declaration without a subset
+        tree.xmlOutputBufferWrite(c_buffer, 2, '>\n')
+        return
+    tree.xmlOutputBufferWrite(c_buffer, 3, ' [\n')
+    if c_dtd.notations and not c_buffer.error:
+        # notations are dumped into a temporary buffer first and then
+        # copied into the output buffer
+        c_buf = tree.xmlBufferCreate()
+        if not c_buf:
+            c_buffer.error = xmlerror.XML_ERR_NO_MEMORY
+            return
+        tree.xmlDumpNotationTable(c_buf, <tree.xmlNotationTable*>c_dtd.notations)
+        tree.xmlOutputBufferWrite(
+            c_buffer, tree.xmlBufferLength(c_buf),
+            <const_char*>tree.xmlBufferContent(c_buf))
+        tree.xmlBufferFree(c_buf)
+    c_node = c_dtd.children
+    while c_node and not c_buffer.error:
+        tree.xmlNodeDumpOutput(c_buffer, c_node.doc, c_node, 0, 0, encoding)
+        c_node = c_node.next
+    tree.xmlOutputBufferWrite(c_buffer, 3, "]>\n")
+
+cdef void _writeTail(tree.xmlOutputBuffer* c_buffer, xmlNode* c_node,
+                     const_char* encoding, int c_method, bint pretty_print) nogil:
+    u"Write the element tail."
+    # The tail consists of the consecutive text nodes that directly follow
+    # c_node; the loop stops at the first non-text sibling or on a buffer
+    # error.  The HTML dumper is used for OUTPUT_METHOD_HTML, the XML dumper
+    # for every other method.
+    c_node = c_node.next
+    while c_node and c_node.type == tree.XML_TEXT_NODE and not c_buffer.error:
+        if c_method == OUTPUT_METHOD_HTML:
+            tree.htmlNodeDumpFormatOutput(
+                c_buffer, c_node.doc, c_node, encoding, pretty_print)
+        else:
+            tree.xmlNodeDumpOutput(
+                c_buffer, c_node.doc, c_node, 0, pretty_print, encoding)
+        c_node = c_node.next
+
+cdef void _writePrevSiblings(tree.xmlOutputBuffer* c_buffer, xmlNode* c_node,
+                             const_char* encoding, bint pretty_print) nogil:
+    # Write the processing instructions and comments that directly precede
+    # c_node, in document order.  Does nothing when the parent of c_node is
+    # an element, i.e. when c_node is not a root node.
+    cdef xmlNode* c_sibling
+    if c_node.parent and _isElement(c_node.parent):
+        return
+    # we are at a root node, so add PI and comment siblings
+    c_sibling = c_node
+    # walk backwards to the first PI/comment of the uninterrupted run ...
+    while c_sibling.prev and \
+            (c_sibling.prev.type == tree.XML_PI_NODE or
+             c_sibling.prev.type == tree.XML_COMMENT_NODE):
+        c_sibling = c_sibling.prev
+    # ... then serialise forwards until c_node itself is reached
+    while c_sibling is not c_node and not c_buffer.error:
+        tree.xmlNodeDumpOutput(c_buffer, c_node.doc, c_sibling, 0,
+                               pretty_print, encoding)
+        if pretty_print:
+            tree.xmlOutputBufferWriteString(c_buffer, "\n")
+        c_sibling = c_sibling.next
+
+cdef void _writeNextSiblings(tree.xmlOutputBuffer* c_buffer, xmlNode* c_node,
+                             const_char* encoding, bint pretty_print) nogil:
+    # Write the processing instructions and comments that directly follow
+    # c_node.  Does nothing when the parent of c_node is an element, i.e.
+    # when c_node is not a root node.  With pretty_print, a newline is
+    # written *before* each sibling.
+    cdef xmlNode* c_sibling
+    if c_node.parent and _isElement(c_node.parent):
+        return
+    # we are at a root node, so add PI and comment siblings
+    c_sibling = c_node.next
+    # stop at the first sibling that is neither PI nor comment, or on error
+    while not c_buffer.error and c_sibling and \
+            (c_sibling.type == tree.XML_PI_NODE or
+             c_sibling.type == tree.XML_COMMENT_NODE):
+        if pretty_print:
+            tree.xmlOutputBufferWriteString(c_buffer, "\n")
+        tree.xmlNodeDumpOutput(c_buffer, c_node.doc, c_sibling, 0,
+                               pretty_print, encoding)
+        c_sibling = c_sibling.next
+
+############################################################
+# output to file-like objects
+
+@cython.final
+@cython.internal
+cdef class _FilelikeWriter:
+    # Adapter that lets a libxml2 output buffer write into a Python
+    # file-like object (anything with a .write() method).
+    #
+    # _filelike:       object whose .write() receives the data; set to None
+    #                  once close() has run
+    # _close_filelike: bound close() of the GzipFile wrapper; only set when
+    #                  compression is enabled
+    # _exc_context:    stores exceptions raised inside the C callbacks so
+    #                  that callers can re-raise them later
+    # error_log:       error log, used as a context manager by callers
+    cdef object _filelike
+    cdef object _close_filelike
+    cdef _ExceptionContext _exc_context
+    cdef _ErrorLog error_log
+    def __cinit__(self, filelike, exc_context=None, compression=None):
+        # a positive compression level wraps the target in a GzipFile that
+        # this writer owns and therefore closes itself
+        if compression is not None and compression > 0:
+            filelike = GzipFile(
+                fileobj=filelike, mode='wb', compresslevel=compression)
+            self._close_filelike = filelike.close
+        self._filelike = filelike
+        if exc_context is None:
+            self._exc_context = _ExceptionContext()
+        else:
+            self._exc_context = exc_context
+        self.error_log = _ErrorLog()
+
+    cdef tree.xmlOutputBuffer* _createOutputBuffer(
+        self, tree.xmlCharEncodingHandler* enchandler) except NULL:
+        # Create a libxml2 output buffer whose write/close callbacks are
+        # routed to this object.  Raises IOError if libxml2 returns NULL.
+        cdef tree.xmlOutputBuffer* c_buffer
+        c_buffer = tree.xmlOutputBufferCreateIO(
+            <tree.xmlOutputWriteCallback>_writeFilelikeWriter, _closeFilelikeWriter,
+            <python.PyObject*>self, enchandler)
+        if c_buffer is NULL:
+            raise IOError, u"Could not create I/O writer context."
+        return c_buffer
+
+    cdef int write(self, char* c_buffer, int size):
+        # Write callback: pass 'size' bytes from c_buffer to the file-like
+        # object.  Returns 'size' on success and -1 on failure; the
+        # exception is stored in _exc_context instead of propagating.
+        try:
+            if self._filelike is None:
+                raise IOError, u"File is already closed"
+            py_buffer = <bytes>c_buffer[:size]
+            self._filelike.write(py_buffer)
+        except:
+            size = -1
+            self._exc_context._store_raised()
+        finally:
+            return size  # and swallow any further exceptions
+
+    cdef int close(self):
+        # Close callback: closes the GzipFile wrapper (if any) and drops the
+        # reference to the target.  Returns 0 on success and -1 on failure;
+        # the exception is stored in _exc_context instead of propagating.
+        retval = 0
+        try:
+            if self._close_filelike is not None:
+                self._close_filelike()
+            # we should not close the file here as we didn't open it
+            self._filelike = None
+        except:
+            retval = -1
+            self._exc_context._store_raised()
+        finally:
+            return retval  # and swallow any further exceptions
+
+cdef int _writeFilelikeWriter(void* ctxt, char* c_buffer, int length):
+    # C-level write callback: ctxt is the _FilelikeWriter that was passed as
+    # I/O context; the call is forwarded to its write() method.
+    return (<_FilelikeWriter>ctxt).write(c_buffer, length)
+
+cdef int _closeFilelikeWriter(void* ctxt):
+    # C-level close callback: ctxt is the _FilelikeWriter that was passed as
+    # I/O context; the call is forwarded to its close() method.
+    return (<_FilelikeWriter>ctxt).close()
+
+cdef _tofilelike(f, _Element element, encoding, doctype, method,
+                 bint write_xml_declaration, bint write_doctype,
+                 bint pretty_print, bint with_tail, int standalone,
+                 int compression):
+    # Serialise 'element' into 'f', which is either a filename (string) or
+    # an object with a .write() method.
+    #
+    # The text output method is handled entirely in Python; every other
+    # method goes through a libxml2 output buffer.  Exceptions stored by a
+    # file-like writer are re-raised, other serialisation failures are
+    # reported through _raiseSerialisationError().
+    cdef python.PyThreadState* state = NULL
+    cdef _FilelikeWriter writer = None
+    cdef tree.xmlOutputBuffer* c_buffer
+    cdef tree.xmlCharEncodingHandler* enchandler
+    cdef const_char* c_enc
+    cdef const_xmlChar* c_doctype
+    cdef int error_result
+
+    c_method = _findOutputMethod(method)
+    if c_method == OUTPUT_METHOD_TEXT:
+        data = _textToString(element._c_node, encoding, with_tail)
+        if compression:
+            # gzip the complete text in memory before writing it out
+            bytes_out = BytesIO()
+            gzip_file = GzipFile(
+                fileobj=bytes_out, mode='wb', compresslevel=compression)
+            try:
+                gzip_file.write(data)
+            finally:
+                gzip_file.close()
+            data = bytes_out.getvalue()
+        if _isString(f):
+            # a filename: open, write and close the file ourselves
+            filename8 = _encodeFilename(f)
+            f = open(filename8, 'wb')
+            try:
+                f.write(data)
+            finally:
+                f.close()
+        else:
+            f.write(data)
+        return
+
+    if encoding is None:
+        c_enc = NULL
+    else:
+        encoding = _utf8(encoding)
+        c_enc = _cstr(encoding)
+    if doctype is None:
+        c_doctype = NULL
+    else:
+        doctype = _utf8(doctype)
+        c_doctype = _xcstr(doctype)
+
+    writer = _create_output_buffer(f, c_enc, compression, &c_buffer)
+    if writer is None:
+        # no Python-level writer is involved, so the thread state is saved
+        # here and restored after the buffer has been closed
+        state = python.PyEval_SaveThread()
+
+    _writeNodeToBuffer(c_buffer, element._c_node, c_enc, c_doctype, c_method,
+                       write_xml_declaration, write_doctype,
+                       pretty_print, with_tail, standalone)
+    error_result = c_buffer.error
+    if error_result == xmlerror.XML_ERR_OK:
+        # a positive result of the close call is treated as success
+        error_result = tree.xmlOutputBufferClose(c_buffer)
+        if error_result > 0:
+            error_result = xmlerror.XML_ERR_OK
+    else:
+        # keep the original error code, but still release the buffer
+        tree.xmlOutputBufferClose(c_buffer)
+    if writer is None:
+        python.PyEval_RestoreThread(state)
+    else:
+        # exceptions raised by the file-like object take precedence
+        writer._exc_context._raise_if_stored()
+    if error_result != xmlerror.XML_ERR_OK:
+        _raiseSerialisationError(error_result)
+
+cdef _create_output_buffer(f, const_char* c_enc, int compression,
+                           tree.xmlOutputBuffer** c_buffer_ret):
+    # Create a libxml2 output buffer for 'f' and store it in c_buffer_ret[0].
+    #
+    # f:           a filename (string) or an object with a .write() method
+    # c_enc:       encoding name used to look up the encoding handler
+    # compression: compression level passed on to the file or the writer
+    #
+    # Returns the _FilelikeWriter that wraps a file-like 'f', or None when
+    # 'f' is a filename.
+    # Raises LookupError for an unknown encoding, IOError when the file
+    # cannot be opened and TypeError when 'f' is neither kind of target.
+    cdef tree.xmlOutputBuffer* c_buffer
+    cdef _FilelikeWriter writer
+    enchandler = tree.xmlFindCharEncodingHandler(c_enc)
+    if enchandler is NULL:
+        # The conditional must only select the encoding *name*: without the
+        # parentheses it applied to the whole formatted string, so a NULL
+        # encoding produced an empty error message.
+        raise LookupError(u"unknown encoding: '%s'" % (
+            c_enc.decode(u'UTF-8') if c_enc is not NULL else u''))
+    try:
+        if _isString(f):
+            filename8 = _encodeFilename(f)
+            c_buffer = tree.xmlOutputBufferCreateFilename(
+                _cstr(filename8), enchandler, compression)
+            if c_buffer is NULL:
+                return python.PyErr_SetFromErrno(IOError) # raises IOError
+            writer = None
+        elif hasattr(f, 'write'):
+            writer = _FilelikeWriter(f, compression=compression)
+            c_buffer = writer._createOutputBuffer(enchandler)
+        else:
+            raise TypeError(
+                u"File or filename expected, got '%s'" %
+                python._fqtypename(f).decode('UTF-8'))
+    except:
+        # the encoding handler is released here whenever buffer creation fails
+        tree.xmlCharEncCloseFunc(enchandler)
+        raise
+    c_buffer_ret[0] = c_buffer
+    return writer
+
+cdef xmlChar **_convert_ns_prefixes(tree.xmlDict* c_dict, ns_prefixes) except NULL:
+    # Convert a sequence of namespace prefixes into a NULL terminated C array
+    # of prefix strings looked up in c_dict.  Prefixes that are not found in
+    # the dict are skipped.
+    #
+    # The array is allocated with PyMem_Malloc(); the caller must release it
+    # with PyMem_Free().  Raises MemoryError if the allocation fails.
+    cdef size_t i, num_ns_prefixes = len(ns_prefixes)
+    # Need to allocate one extra memory block to handle last NULL entry
+    c_ns_prefixes = <xmlChar **>python.PyMem_Malloc(sizeof(xmlChar*) * (num_ns_prefixes + 1))
+    if c_ns_prefixes is NULL:
+        # without this check, the writes below would dereference NULL
+        raise MemoryError()
+    i = 0
+    try:
+        for prefix in ns_prefixes:
+            prefix_utf = _utf8(prefix)
+            c_prefix = tree.xmlDictExists(c_dict, _xcstr(prefix_utf), len(prefix_utf))
+            if c_prefix:
+                # unknown prefixes do not need to get serialised
+                c_ns_prefixes[i] = <xmlChar*>c_prefix
+                i += 1
+    except:
+        python.PyMem_Free(c_ns_prefixes)
+        raise
+
+    c_ns_prefixes[i] = NULL  # append end marker
+    return c_ns_prefixes
+
+cdef _tofilelikeC14N(f, _Element element, bint exclusive, bint with_comments,
+                     int compression, inclusive_ns_prefixes):
+    # Write the C14N (canonical XML) serialisation of 'element' into 'f',
+    # which is either a filename (string) or an object with a .write()
+    # method.
+    #
+    # Raises TypeError for any other kind of target, re-raises exceptions
+    # stored by a file-like writer, and raises C14NError when the
+    # serialisation reports a negative result.
+    cdef _FilelikeWriter writer = None
+    cdef tree.xmlOutputBuffer* c_buffer
+    cdef xmlChar **c_inclusive_ns_prefixes = NULL
+    cdef char* c_filename
+    cdef xmlDoc* c_base_doc
+    cdef xmlDoc* c_doc
+    cdef int bytes_count, error = 0
+
+    # serialise from a temporary document that has 'element' as its root;
+    # it is destroyed again in the 'finally' clause below
+    c_base_doc = element._c_node.doc
+    c_doc = _fakeRootDoc(c_base_doc, element._c_node)
+    try:
+        c_inclusive_ns_prefixes = (
+            _convert_ns_prefixes(c_doc.dict, inclusive_ns_prefixes)
+            if inclusive_ns_prefixes else NULL)
+
+        if _isString(f):
+            filename8 = _encodeFilename(f)
+            c_filename = _cstr(filename8)
+            with nogil:
+                error = c14n.xmlC14NDocSave(
+                    c_doc, NULL, exclusive, c_inclusive_ns_prefixes,
+                    with_comments, c_filename, compression)
+        elif hasattr(f, 'write'):
+            writer   = _FilelikeWriter(f, compression=compression)
+            c_buffer = writer._createOutputBuffer(NULL)
+            with writer.error_log:
+                bytes_count = c14n.xmlC14NDocSaveTo(
+                    c_doc, NULL, exclusive, c_inclusive_ns_prefixes,
+                    with_comments, c_buffer)
+                error = tree.xmlOutputBufferClose(c_buffer)
+            # a failed serialisation overrides the result of the close call
+            if bytes_count < 0:
+                error = bytes_count
+        else:
+            raise TypeError(u"File or filename expected, got '%s'" %
+                            python._fqtypename(f).decode('UTF-8'))
+    finally:
+        _destroyFakeDoc(c_base_doc, c_doc)
+        if c_inclusive_ns_prefixes is not NULL:
+            python.PyMem_Free(c_inclusive_ns_prefixes)
+
+    # exceptions raised by the file-like object take precedence
+    if writer is not None:
+        writer._exc_context._raise_if_stored()
+
+    if error < 0:
+        # prefer the first message collected in the writer's error log
+        message = u"C14N failed"
+        if writer is not None:
+            errors = writer.error_log
+            if len(errors):
+                message = errors[0].message
+        raise C14NError(message)
+
+# incremental serialisation
+
+cdef class xmlfile:
+    """xmlfile(self, output_file, encoding=None, compression=None)
+
+    A simple mechanism for incremental XML serialisation.
+
+    Usage example::
+
+         with xmlfile("somefile.xml", encoding='utf-8') as xf:
+             xf.write_declaration(standalone=True)
+             xf.write_doctype('<!DOCTYPE root SYSTEM "some.dtd">')
+
+             # generate an element (the root element)
+             with xf.element('root'):
+                  # write a complete Element into the open root element
+                  xf.write(etree.Element('test'))
+
+                  # generate and write more Elements, e.g. through iterparse
+                  for element in generate_some_elements():
+                      # serialise generated elements into the XML file
+                      xf.write(element)
+    """
+    # output_file:   target as passed to the constructor
+    # encoding:      UTF-8 encoded encoding name, or None
+    # compresslevel: compression level, 0 when none was requested
+    # writer:        the writer created by __enter__(), None outside of
+    #                the 'with' block
+    cdef object output_file
+    cdef bytes encoding
+    cdef int compresslevel
+    cdef _IncrementalFileWriter writer
+
+    def __init__(self, output_file not None, encoding=None, compression=None):
+        self.output_file = output_file
+        self.encoding = _utf8orNone(encoding)
+        self.compresslevel = compression or 0
+
+    def __enter__(self):
+        # creates the incremental writer and hands it to the 'with' block
+        assert self.output_file is not None
+        cdef _IncrementalFileWriter writer = _IncrementalFileWriter(
+            self.output_file, self.encoding, self.compresslevel)
+        self.writer = writer
+        return writer
+
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        # closes the writer; errors found while closing are only raised when
+        # the 'with' block itself did not fail with an exception
+        if self.writer is not None:
+            old_writer, self.writer = self.writer, None
+            raise_on_error = exc_type is None
+            old_writer._close(raise_on_error)
+
+# Progress states of _IncrementalFileWriter.  The numeric order matters
+# because the writer compares states with '<', '>' and '>='.
+cdef enum _IncrementalFileWriterStatus:
+    WRITER_STARTING = 0
+    WRITER_DECL_WRITTEN = 1
+    WRITER_DTD_WRITTEN = 2
+    WRITER_IN_ELEMENT = 3
+    WRITER_FINISHED = 4
+
+@cython.final
+@cython.internal
+cdef class _IncrementalFileWriter:
+    # Writer object handed out by xmlfile.__enter__().  It serialises an XML
+    # document piece by piece into a libxml2 output buffer.
+    #
+    # _c_out:         the output buffer; NULL after _close()
+    # _encoding:      encoding name (bytes), b'ASCII' when none was given
+    # _c_encoding:    C string view of _encoding
+    # _target:        result of _create_output_buffer() for the output file
+    # _element_stack: one (ns, name, prefix, flat_namespace_map) tuple per
+    #                 currently open element
+    # _status:        one of the WRITER_* states
+    cdef tree.xmlOutputBuffer* _c_out
+    cdef bytes _encoding
+    cdef const_char* _c_encoding
+    cdef _FilelikeWriter _target
+    cdef list _element_stack
+    cdef int _status
+
+    def __cinit__(self, outfile, bytes encoding, int compresslevel):
+        self._status = WRITER_STARTING
+        self._element_stack = []
+        if encoding is None:
+            encoding = b'ASCII'
+        self._encoding = encoding
+        self._c_encoding = _cstr(encoding) if encoding is not None else NULL
+        self._target = _create_output_buffer(
+            outfile, self._c_encoding, compresslevel, &self._c_out)
+
+    def __dealloc__(self):
+        # releases the buffer if _close() was never called
+        if self._c_out is not NULL:
+            tree.xmlOutputBufferClose(self._c_out)
+
+    def write_declaration(self, version=None, standalone=None, doctype=None):
+        """write_declaration(self, version=None, standalone=None, doctype=None)
+
+        Write an XML declaration and (optionally) a doctype into the file.
+        """
+        assert self._c_out is not NULL
+        cdef const_xmlChar* c_version
+        cdef int c_standalone
+        if self._status >= WRITER_DECL_WRITTEN:
+            raise LxmlSyntaxError("XML declaration already written")
+        version = _utf8orNone(version)
+        c_version = _xcstr(version) if version is not None else NULL
+        doctype = _utf8orNone(doctype)
+        # -1 means "no standalone attribute", see _writeDeclarationToBuffer()
+        if standalone is None:
+            c_standalone = -1
+        else:
+            c_standalone = 1 if standalone else 0
+        _writeDeclarationToBuffer(self._c_out, c_version, self._c_encoding, c_standalone)
+        if doctype is not None:
+            _writeDoctype(self._c_out, _xcstr(doctype))
+            self._status = WRITER_DTD_WRITTEN
+        else:
+            self._status = WRITER_DECL_WRITTEN
+        self._handle_error(self._c_out.error)
+
+    def write_doctype(self, doctype):
+        """write_doctype(self, doctype)
+
+        Writes the given doctype declaration verbatim into the file.
+        """
+        assert self._c_out is not NULL
+        if doctype is None:
+            return
+        if self._status >= WRITER_DTD_WRITTEN:
+            raise LxmlSyntaxError("DOCTYPE already written or cannot write it here")
+        doctype = _utf8(doctype)
+        _writeDoctype(self._c_out, _xcstr(doctype))
+        self._status = WRITER_DTD_WRITTEN
+        self._handle_error(self._c_out.error)
+
+    def element(self, tag, attrib=None, nsmap=None, **_extra):
+        """element(self, tag, attrib=None, nsmap=None, **_extra)
+
+        Returns a context manager that writes an opening and closing tag.
+        """
+        assert self._c_out is not NULL
+        # attributes are collected as (namespace, name, UTF-8 value) tuples;
+        # keyword arguments override entries of 'attrib' with the same name
+        attributes = []
+        if attrib is not None:
+            if isinstance(attrib, (dict, _Attrib)):
+                attrib = attrib.items()
+            for name, value in attrib:
+                if name not in _extra:
+                    ns, name = _getNsTag(name)
+                    attributes.append((ns, name, _utf8(value)))
+        if _extra:
+            for name, value in _extra.iteritems():
+                ns, name = _getNsTag(name)
+                attributes.append((ns, name, _utf8(value)))
+        # nsmap maps prefix => namespace URI; the writer works with the
+        # reversed mapping (namespace URI => prefix)
+        reversed_nsmap = {}
+        if nsmap:
+            for prefix, ns in nsmap.items():
+                if prefix is not None:
+                    prefix = _utf8(prefix)
+                    _prefixValidOrRaise(prefix)
+                reversed_nsmap[_utf8(ns)] = prefix
+        ns, name = _getNsTag(tag)
+        return _FileWriterElement(self, (ns, name, attributes, reversed_nsmap))
+
+    cdef _write_qname(self, bytes name, bytes prefix):
+        # writes "prefix:name", or just "name" when prefix is None
+        if prefix is not None:
+            tree.xmlOutputBufferWrite(self._c_out, len(prefix), _cstr(prefix))
+            tree.xmlOutputBufferWrite(self._c_out, 1, ':')
+        tree.xmlOutputBufferWrite(self._c_out, len(name), _cstr(name))
+
+    cdef _write_start_element(self, element_config):
+        # Writes the opening tag described by element_config, a tuple
+        # (ns, name, attributes, nsmap) as built by element(), and pushes
+        # the element onto the stack of open elements.
+        if self._status > WRITER_IN_ELEMENT:
+            raise LxmlSyntaxError("cannot append trailing element to complete XML document")
+        ns, name, attributes, nsmap = element_config
+        flat_namespace_map, new_namespaces = self._collect_namespaces(nsmap)
+        prefix = self._find_prefix(ns, flat_namespace_map, new_namespaces)
+        tree.xmlOutputBufferWrite(self._c_out, 1, '<')
+        self._write_qname(name, prefix)
+        self._write_attributes_and_namespaces(
+            attributes, flat_namespace_map, new_namespaces)
+        tree.xmlOutputBufferWrite(self._c_out, 1, '>')
+        self._handle_error(self._c_out.error)
+
+        self._element_stack.append((ns, name, prefix, flat_namespace_map))
+        self._status = WRITER_IN_ELEMENT
+
+    cdef _write_attributes_and_namespaces(self, list attributes,
+                                          dict flat_namespace_map,
+                                          list new_namespaces):
+        # Writes the namespace declarations (sorted) followed by the
+        # attributes of an opening tag.
+        if attributes:
+            # _find_prefix() may append to new_namespaces => build them first
+            attributes = [
+                (self._find_prefix(ns, flat_namespace_map, new_namespaces), name, value)
+                for ns, name, value in attributes ]
+        if new_namespaces:
+            new_namespaces.sort()
+            self._write_attributes_list(new_namespaces)
+        if attributes:
+            self._write_attributes_list(attributes)
+
+    cdef _write_attributes_list(self, list attributes):
+        # writes each (prefix, name, value) tuple as ' prefix:name="value"',
+        # passing the value through xmlOutputBufferWriteEscape()
+        for prefix, name, value in attributes:
+            tree.xmlOutputBufferWrite(self._c_out, 1, ' ')
+            self._write_qname(name, prefix)
+            tree.xmlOutputBufferWrite(self._c_out, 2, '="')
+            tree.xmlOutputBufferWriteEscape(self._c_out, _xcstr(value), NULL)
+            tree.xmlOutputBufferWrite(self._c_out, 1, '"')
+
+    cdef _write_end_element(self, element_config):
+        # Writes the closing tag of the innermost open element.
+        # element_config must describe that same element (same namespace
+        # and name), otherwise LxmlSyntaxError is raised.
+        if self._status != WRITER_IN_ELEMENT:
+            raise LxmlSyntaxError("not in an element")
+        if not self._element_stack or self._element_stack[-1][:2] != element_config[:2]:
+            raise LxmlSyntaxError("inconsistent exit action in context manager")
+
+        name, prefix = self._element_stack.pop()[1:3]
+        tree.xmlOutputBufferWrite(self._c_out, 2, '</')
+        self._write_qname(name, prefix)
+        tree.xmlOutputBufferWrite(self._c_out, 1, '>')
+
+        # closing the outermost element completes the document
+        if not self._element_stack:
+            self._status = WRITER_FINISHED
+        self._handle_error(self._c_out.error)
+
+    cdef _find_prefix(self, bytes href, dict flat_namespaces_map, list new_namespaces):
+        # Returns the prefix to use for namespace 'href' (None for no
+        # namespace).  For a namespace without a mapping, the first unused
+        # prefix of the form 'ns0', 'ns1', ... is registered in
+        # flat_namespaces_map and its declaration appended to new_namespaces.
+        if href is None:
+            return None
+        if href in flat_namespaces_map:
+            return flat_namespaces_map[href]
+        # need to create a new prefix
+        prefixes = flat_namespaces_map.values()
+        i = 0
+        while True:
+            prefix = _utf8('ns%d' % i)
+            if prefix not in prefixes:
+                new_namespaces.append((b'xmlns', prefix, href))
+                flat_namespaces_map[href] = prefix
+                return prefix
+            i += 1
+
+    cdef _collect_namespaces(self, dict nsmap):
+        # nsmap maps namespace URI => prefix (None for the default
+        # namespace).  Returns a tuple of
+        #   - the flat namespace map that is in effect inside the element
+        #     (own declarations merged with those of the parent element)
+        #   - the list of declarations to write on the element itself, as
+        #     (prefix, name, value) attribute tuples
+        new_namespaces = []
+        flat_namespaces_map = {}
+        for ns, prefix in nsmap.iteritems():
+            flat_namespaces_map[ns] = prefix
+            if prefix is None:
+                new_namespaces.append((None, b'xmlns', ns))
+            else:
+                new_namespaces.append((b'xmlns', prefix, ns))
+        # merge in flat namespace map of parent
+        if self._element_stack:
+            for ns, prefix in (<dict>self._element_stack[-1][-1]).iteritems():
+                if flat_namespaces_map.get(ns) is None:
+                    # unknown or empty prefix => prefer a 'real' prefix
+                    flat_namespaces_map[ns] = prefix
+        return flat_namespaces_map, new_namespaces
+
+    def write(self, *args, bint with_tail=True, bint pretty_print=False):
+        """write(self, *args, with_tail=True, pretty_print=False)
+
+        Write subtrees or strings into the file.
+        """
+        assert self._c_out is not NULL
+        for content in args:
+            if _isString(content):
+                # outside of an element, only whitespace is accepted, and
+                # only as long as the document is not complete yet
+                if self._status != WRITER_IN_ELEMENT:
+                    if self._status > WRITER_IN_ELEMENT or content.strip():
+                        raise LxmlSyntaxError("not in an element")
+                content = _utf8(content)
+                tree.xmlOutputBufferWriteEscape(self._c_out, _xcstr(content), NULL)
+            elif iselement(content):
+                if self._status > WRITER_IN_ELEMENT:
+                    raise LxmlSyntaxError("cannot append trailing element to complete XML document")
+                _writeNodeToBuffer(self._c_out, (<_Element>content)._c_node,
+                                   self._c_encoding, NULL, OUTPUT_METHOD_XML,
+                                   False, False, pretty_print, with_tail, False)
+                # an element written at the top level is the root element
+                # and thus completes the document
+                if (<_Element>content)._c_node.type == tree.XML_ELEMENT_NODE:
+                    if not self._element_stack:
+                        self._status = WRITER_FINISHED
+            else:
+                raise TypeError("got invalid input value of type %s, expected string or Element" % type(content))
+            self._handle_error(self._c_out.error)
+
+    cdef _close(self, bint raise_on_error):
+        # Closes the output buffer.  With raise_on_error, an empty document
+        # or unclosed elements raise LxmlSyntaxError *before* the buffer is
+        # closed, and a failure of the close itself is reported as well.
+        if raise_on_error:
+            if self._status < WRITER_IN_ELEMENT:
+                raise LxmlSyntaxError("no content written")
+            if self._element_stack:
+                raise LxmlSyntaxError("pending open tags on close")
+        error_result = self._c_out.error
+        if error_result == xmlerror.XML_ERR_OK:
+            # a positive result of the close call is treated as success
+            error_result = tree.xmlOutputBufferClose(self._c_out)
+            if error_result > 0:
+                error_result = xmlerror.XML_ERR_OK
+        else:
+            tree.xmlOutputBufferClose(self._c_out)
+        self._status = WRITER_FINISHED
+        self._c_out = NULL
+        del self._element_stack[:]
+        if raise_on_error:
+            self._handle_error(error_result)
+
+    cdef _handle_error(self, int error_result):
+        # Raises for any result other than XML_ERR_OK; an exception stored
+        # by the file-like target takes precedence over the generic
+        # serialisation error.
+        if error_result != xmlerror.XML_ERR_OK:
+            if self._target is not None:
+                self._target._exc_context._raise_if_stored()
+            _raiseSerialisationError(error_result)
+
+@cython.final
+@cython.internal
+@cython.freelist(8)
+cdef class _FileWriterElement:
+    # Context manager returned by _IncrementalFileWriter.element(): entering
+    # it writes the opening tag, leaving it writes the closing tag.
+    #
+    # _element: the element configuration passed on to the writer
+    # _writer:  the writer that created this object
+    cdef object _element
+    cdef _IncrementalFileWriter _writer
+
+    def __cinit__(self, _IncrementalFileWriter writer not None, element_config):
+        self._writer = writer
+        self._element = element_config
+
+    def __enter__(self):
+        self._writer._write_start_element(self._element)
+
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        # the closing tag is written regardless of exc_type
+        self._writer._write_end_element(self._element)
diff --git a/lib/lxml/tests/__init__.py b/lib/lxml/tests/__init__.py
new file mode 100644
index 00000000..85dfe70d
--- /dev/null
+++ b/lib/lxml/tests/__init__.py
@@ -0,0 +1,4 @@
+"""
+The lxml test suite for lxml, ElementTree and cElementTree.
+"""
+
diff --git a/lib/lxml/tests/common_imports.py b/lib/lxml/tests/common_imports.py
new file mode 100644
index 00000000..e04b7d64
--- /dev/null
+++ b/lib/lxml/tests/common_imports.py
@@ -0,0 +1,303 @@
+import os
+import os.path
+import re
+import gc
+import sys
+import unittest
+
+try:
+    import urlparse
+except ImportError:
+    import urllib.parse as urlparse 
+
+try:
+    from urllib import pathname2url
+except:
+    from urllib.request import pathname2url
+
+from lxml import etree
+
+def make_version_tuple(version_string):
+    """Split a version string into a tuple of numbers and other parts.
+
+    Runs of digits are converted to ints, every other run of characters
+    (dots excluded) is kept as a string: '2.3beta1' -> (2, 3, 'beta', 1).
+    """
+    def _as_number_if_possible(part):
+        try:
+            return int(part)
+        except ValueError:
+            return part
+
+    parts = re.findall('([0-9]+|[^0-9.]+)', version_string)
+    return tuple([_as_number_if_possible(part) for part in parts])
+
+# True when running on PyPy.  sys.implementation (Python 3.3+) is a
+# namespace object, so the interpreter name must be read from its 'name'
+# attribute; comparing the object itself to a string is never true.
+# The 'pypy_version_info' check covers interpreters without
+# sys.implementation.
+IS_PYPY = (getattr(getattr(sys, 'implementation', None), 'name', None) == 'pypy' or
+           getattr(sys, 'pypy_version_info', None) is not None)
+
+# True when running on Python 3 or later.
+IS_PYTHON3 = sys.version_info[0] >= 3
+
+# Pure Python ElementTree: standard library first, then the stand-alone
+# package; None if neither can be imported.
+try:
+    from xml.etree import ElementTree # Python 2.5+
+except ImportError:
+    try:
+        from elementtree import ElementTree # standard ET
+    except ImportError:
+        ElementTree = None
+
+# (0,0,0) stands for "not available / version unknown"
+ET_VERSION = (0,0,0)
+if hasattr(ElementTree, 'VERSION'):
+    ET_VERSION = make_version_tuple(ElementTree.VERSION)
+
+# C accelerated ElementTree, located the same way.
+try:
+    from xml.etree import cElementTree # Python 2.5+
+except ImportError:
+    try:
+        import cElementTree # standard ET
+    except ImportError:
+        cElementTree = None
+
+CET_VERSION = (0,0,0)
+if hasattr(cElementTree, 'VERSION'):
+    CET_VERSION = make_version_tuple(cElementTree.VERSION)
+
+def filter_by_version(test_class, version_dict, current_version):
+    """Disable the tests of a class that need a newer library version.
+
+    'version_dict' maps attribute names of 'test_class' to the minimum
+    version tuple they require.  Every attribute whose requirement is
+    greater than 'current_version' is replaced by a method that does
+    nothing.  Names without an entry require (0,0,0).
+    """
+    def dummy_test_method(self):
+        pass
+
+    no_requirement = (0,0,0)
+    for attr_name in dir(test_class):
+        if version_dict.get(attr_name, no_requirement) > current_version:
+            setattr(test_class, attr_name, dummy_test_method)
+
+# Use the doctest module of the standard library if it provides everything
+# the test suite needs; otherwise fall back to the bundled copy.
+try:
+    import doctest
+    # check if the system version has everything we need
+    doctest.DocFileSuite
+    doctest.DocTestParser
+    doctest.NORMALIZE_WHITESPACE
+    doctest.ELLIPSIS
+except (ImportError, AttributeError):
+    # we need our own version to make it work (Python 2.3?)
+    import local_doctest as doctest
+
+# Make 'sorted' available as an attribute of this module: a fallback
+# implementation where the builtin is missing, the builtin itself otherwise
+# (locals() is the module namespace at this level).
+try:
+    sorted
+except NameError:
+    def sorted(seq, **kwargs):
+        seq = list(seq)
+        seq.sort(**kwargs)
+        return seq
+else:
+    locals()['sorted'] = sorted
+
+
+# Same for 'next'; the fallback calls the .next() method of the iterator.
+try:
+    next
+except NameError:
+    def next(it):
+        return it.next()
+else:
+    locals()['next'] = next
+
+
+# 'skipif' is pytest's marker if pytest is installed, otherwise a
+# decorator factory that returns the decorated function unchanged.
+try:
+    import pytest
+except ImportError:
+    class skipif(object):
+        "Using a class because a function would bind into a method when used in classes"
+        def __init__(self, *args): pass
+        def __call__(self, func, *args): return func
+else:
+    skipif = pytest.mark.skipif
+
+def _get_caller_relative_path(filename, frame_depth=2):
+    """Resolve 'filename' relative to the directory of a calling module.
+
+    'frame_depth' selects the stack frame (counted from this function)
+    whose module is used; modules without a '__file__' attribute resolve
+    relative to the empty path.  The result is normalised.
+    """
+    caller_globals = sys._getframe(frame_depth).f_globals
+    module = sys.modules[caller_globals['__name__']]
+    module_dir = os.path.dirname(getattr(module, '__file__', ''))
+    return os.path.normpath(os.path.join(module_dir, filename))
+
+# String/bytes helpers and the doctest loader differ between Python 3 and
+# Python 2.  Both branches define the same set of public names: unicode,
+# _str, _bytes, StringIO, BytesIO, doctest_parser and make_doctest.
+if sys.version_info[0] >= 3:
+    # Python 3
+    from builtins import str as unicode
+    def _str(s, encoding="UTF-8"):
+        # text literals are already unicode strings
+        return s
+    def _bytes(s, encoding="UTF-8"):
+        return s.encode(encoding)
+    from io import StringIO, BytesIO as _BytesIO
+    def BytesIO(*args):
+        # accept a text string as initial content by encoding it as UTF-8
+        if args and isinstance(args[0], str):
+            args = (args[0].encode("UTF-8"),)
+        return _BytesIO(*args)
+
+    doctest_parser = doctest.DocTestParser()
+    # rewrite Python 2 syntax in the doctest source: drop the u'' string
+    # prefix and turn "except X, e:" into "except X as e:"
+    _fix_unicode = re.compile(r'(\s+)u(["\'])').sub
+    _fix_exceptions = re.compile(r'(.*except [^(]*),\s*(.*:)').sub
+    def make_doctest(filename):
+        # 'filename' is resolved relative to the module calling make_doctest
+        filename = _get_caller_relative_path(filename)
+        doctests = read_file(filename)
+        doctests = _fix_unicode(r'\1\2', doctests)
+        doctests = _fix_exceptions(r'\1 as \2', doctests)
+        return doctest.DocTestCase(
+            doctest_parser.get_doctest(
+                doctests, {}, os.path.basename(filename), filename, 0))
+else:
+    # Python 2
+    from __builtin__ import unicode
+    def _str(s, encoding="UTF-8"):
+        return unicode(s, encoding=encoding)
+    def _bytes(s, encoding="UTF-8"):
+        # plain string literals are already byte strings
+        return s
+    from StringIO import StringIO
+    BytesIO = StringIO
+
+    doctest_parser = doctest.DocTestParser()
+    # rewrite Python 3 syntax in the doctest source: strip the module path
+    # from exception names in tracebacks, turn "except X as e:" into
+    # "except X, e:" and drop the b'' string prefix
+    _fix_traceback = re.compile(r'^(\s*)(?:\w+\.)+(\w*(?:Error|Exception|Invalid):)', re.M).sub
+    _fix_exceptions = re.compile(r'(.*except [^(]*)\s+as\s+(.*:)').sub
+    _fix_bytes = re.compile(r'(\s+)b(["\'])').sub
+    def make_doctest(filename):
+        # 'filename' is resolved relative to the module calling make_doctest
+        filename = _get_caller_relative_path(filename)
+        doctests = read_file(filename)
+        doctests = _fix_traceback(r'\1\2', doctests)
+        doctests = _fix_exceptions(r'\1, \2', doctests)
+        doctests = _fix_bytes(r'\1\2', doctests)
+        return doctest.DocTestCase(
+            doctest_parser.get_doctest(
+                doctests, {}, os.path.basename(filename), filename, 0))
+
+# unittest.skipIf where available; otherwise a minimal stand-in that
+# replaces the test method by None when the condition holds and keeps it
+# unchanged when it does not.
+try:
+    skipIf = unittest.skipIf
+except AttributeError:
+    def skipIf(condition, why,
+               _skip=lambda test_method: None,
+               _keep=lambda test_method: test_method):
+        decorator = _keep
+        if condition:
+            decorator = _skip
+        return decorator
+
+class HelperTestCase(unittest.TestCase):
+    """Base class for test cases, providing parse/serialise helpers."""
+
+    def tearDown(self):
+        # run a garbage collection after each test
+        gc.collect()
+
+    def parse(self, text, parser=None):
+        """Parse the byte string 'text' and return the resulting tree."""
+        return etree.parse(BytesIO(text), parser=parser)
+
+    def _rootstring(self, tree):
+        """Serialise the root of 'tree' with all spaces and newlines removed."""
+        serialised = etree.tostring(tree.getroot())
+        without_spaces = serialised.replace(_bytes(' '), _bytes(''))
+        return without_spaces.replace(_bytes('\n'), _bytes(''))
+
+    # assertFalse doesn't exist in Python 2.3
+    try:
+        unittest.TestCase.assertFalse
+    except AttributeError:
+        assertFalse = unittest.TestCase.failIf
+        
+class SillyFileLike:
+    """Minimal file-like object that serves a byte string through read()."""
+
+    def __init__(self, xml_data=_bytes('<foo><bar/></foo>')):
+        self.xml_data = xml_data
+
+    def read(self, amount=None):
+        """Return up to 'amount' bytes, or all remaining data if not given.
+
+        Returns an empty byte string once the data is used up.
+        """
+        remaining = self.xml_data
+        if not remaining:
+            return _bytes('')
+        if amount:
+            self.xml_data = remaining[amount:]
+            return remaining[:amount]
+        self.xml_data = _bytes('')
+        return remaining
+
+class LargeFileLike:
+    """File-like object that generates a nested XML document on the fly.
+
+    Each <root> element contains 'children' nested <root> elements, down
+    to a nesting level of 'depth', with text runs of 'charlen' characters
+    in between.
+    """
+
+    def __init__(self, charlen=100, depth=4, children=5):
+        self.data = BytesIO()
+        self.chars  = _bytes('a') * charlen
+        self.children = range(children)
+        self.more = self.iterelements(depth)
+
+    def iterelements(self, depth):
+        """Generate the document as a sequence of tag and text chunks."""
+        yield _bytes('<root>')
+        remaining_depth = depth - 1
+        if remaining_depth <= 0:
+            yield self.chars
+        else:
+            for _ in self.children:
+                for chunk in self.iterelements(remaining_depth):
+                    yield chunk
+                yield self.chars
+        yield _bytes('</root>')
+
+    def read(self, amount=None):
+        """Return the next 'amount' bytes, or all remaining data if not given."""
+        buf = self.data
+        # pull chunks from the generator until enough data is buffered
+        for chunk in self.more:
+            buf.write(chunk)
+            if amount and buf.tell() >= amount:
+                break
+        result = buf.getvalue()
+        buf.seek(0)
+        buf.truncate()
+        if amount:
+            # keep whatever exceeds the requested amount for the next call
+            buf.write(result[amount:])
+            result = result[:amount]
+        return result
+
+class LargeFileLikeUnicode(LargeFileLike):
+    """Variant of LargeFileLike that produces text instead of bytes."""
+
+    def __init__(self, charlen=100, depth=4, children=5):
+        LargeFileLike.__init__(self, charlen, depth, children)
+        # replace the byte based state set up by the base class
+        self.data = StringIO()
+        self.chars  = _str('a') * charlen
+        self.more = self.iterelements(depth)
+
+    def iterelements(self, depth):
+        """Generate the document as a sequence of tag and text chunks."""
+        yield _str('<root>')
+        remaining_depth = depth - 1
+        if remaining_depth <= 0:
+            yield self.chars
+        else:
+            for _ in self.children:
+                for chunk in self.iterelements(remaining_depth):
+                    yield chunk
+                yield self.chars
+        yield _str('</root>')
+
+def fileInTestDir(name):
+    """Return the path of 'name' inside the directory of this module."""
+    return os.path.join(os.path.dirname(__file__), name)
+
+def path2url(path):
+    """Convert a local file system path into a 'file:' URL."""
+    url_path = pathname2url(path)
+    return urlparse.urljoin('file:', url_path)
+
+def fileUrlInTestDir(name):
+    """Return the 'file:' URL of 'name' inside the directory of this module."""
+    local_path = fileInTestDir(name)
+    return path2url(local_path)
+
+def read_file(name, mode='r'):
+    """Return the complete content of the file 'name', opened with 'mode'."""
+    handle = open(name, mode)
+    try:
+        return handle.read()
+    finally:
+        handle.close()
+
+def write_to_file(name, data, mode='w'):
+    """Write 'data' into the file 'name', opened with 'mode'."""
+    handle = open(name, mode)
+    try:
+        handle.write(data)
+    finally:
+        handle.close()
+
+def readFileInTestDir(name, mode='r'):
+    """Return the content of the file 'name' in the directory of this module."""
+    path = fileInTestDir(name)
+    return read_file(path, mode)
+
+def canonicalize(xml):
+    """Parse the byte string 'xml' and return its C14N serialisation."""
+    output = BytesIO()
+    etree.parse(BytesIO(xml)).write_c14n(output)
+    return output.getvalue()
+
+def unentitify(xml):
+    """Replace decimal character references in 'xml' by their characters.
+
+    Every '&#NNN;' reference in the text string 'xml' is replaced by the
+    character with code point NNN.  Returns the resulting string.
+    """
+    # 'unichr' only exists on Python 2; on Python 3, chr() covers the full
+    # Unicode range.  Without the fallback, this function raised NameError
+    # on Python 3 as soon as a reference was found.
+    try:
+        to_char = unichr
+    except NameError:
+        to_char = chr
+    for entity_name, value in re.findall("(&#([0-9]+);)", xml):
+        xml = xml.replace(entity_name, to_char(int(value)))
+    return xml
diff --git a/lib/lxml/tests/dummy_http_server.py b/lib/lxml/tests/dummy_http_server.py
new file mode 100644
index 00000000..d36cb6ea
--- /dev/null
+++ b/lib/lxml/tests/dummy_http_server.py
@@ -0,0 +1,83 @@
+"""
+Simple HTTP request dumper for tests in Python 2.5+.
+"""
+
+import sys
+from contextlib import contextmanager
+
+try:
+    import urlparse
+except ImportError:
+    # Python 3
+    import urllib.parse as urlparse
+
+
+@contextmanager
+def webserver(app, port=0, host=None):
+    """Serve the WSGI callable *app* from a background daemon thread.
+
+    Yields the server's base URL ('http://host:port/'); the server is shut
+    down and closed when the 'with' block exits.  *host* defaults to
+    127.0.0.1.  Pass 0 as port number to dynamically allocate a free port.
+
+    Usage: with webserver(wsgi_app_function, 8080) as host_url:
+               do_ws_calls(host_url)
+    """
+    server = build_web_server(app, port, host or '127.0.0.1')
+    host, port = server.socket.getsockname()  # the address actually bound
+
+    import threading
+    thread = threading.Thread(target=server.serve_forever,
+                              kwargs={'poll_interval': 0.5})
+    thread.daemon = True  # attribute form; Thread.setDaemon() is deprecated
+    thread.start()
+    try:
+        yield 'http://%s:%s/' % (host, port)  # yield control to 'with' body
+    finally:
+        server.shutdown()
+        server.server_close()
+
+
+try:
+    from SocketServer import ThreadingMixIn
+except ImportError:
+    # Python 3
+    from socketserver import ThreadingMixIn
+
+import wsgiref.simple_server as wsgiserver
+class WebServer(ThreadingMixIn, wsgiserver.WSGIServer):
+    """Threaded WSGI server; mixin first so its process_request() is used."""
+    daemon_threads = True  # request threads must never block shutdown/exit
+
+
+class _RequestHandler(wsgiserver.WSGIRequestHandler):
+    """WSGI request handler that logs nothing and avoids stderr."""
+    def get_stderr(self):
+        return sys.stdout  # don't write to stderr
+
+    def log_message(self, format, *args):
+        # Intentionally a no-op: per-request log messages are dropped.
+        pass  # don't log messages
+
+
+def build_web_server(app, port, host=None):
+    # Create (but do not start) a WebServer for *app*; host defaults to ''.
+    return wsgiserver.make_server(
+        host or '', port, app,
+        server_class=WebServer,
+        handler_class=_RequestHandler)
+
+
+class HTTPRequestCollector(object):
+    """WSGI app that records each request and sends a canned response."""
+    def __init__(self, response_data, response_code=200, headers=()):
+        self.requests = []
+        self.response_data = response_data
+        self.response_code = response_code
+        self.headers = list(headers or ())
+
+    def __call__(self, environ, start_response):
+        query = urlparse.parse_qsl(environ.get('QUERY_STRING'))
+        self.requests.append((environ.get('PATH_INFO'), query))
+        start_response('%s OK' % self.response_code, self.headers)
+        return [self.response_data]
diff --git a/lib/lxml/tests/include/test_xinclude.xml b/lib/lxml/tests/include/test_xinclude.xml
new file mode 100644
index 00000000..1cc05cf8
--- /dev/null
+++ b/lib/lxml/tests/include/test_xinclude.xml
@@ -0,0 +1,4 @@
+<doc xmlns:xi="http://www.w3.org/2001/XInclude">
+<foo/>
+<xi:include href="../test.xml" />
+</doc>
\ No newline at end of file
diff --git a/lib/lxml/tests/shakespeare.html b/lib/lxml/tests/shakespeare.html
new file mode 100644
index 00000000..821ca6ac
--- /dev/null
+++ b/lib/lxml/tests/shakespeare.html
@@ -0,0 +1,526 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+	"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en" debug="true">
+<head>
+	<meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>
+</head>
+
+<body>
+	
+	<div id="test">
+	<div class="dialog">
+	<h2>As You Like It</h2>
+	<div id="playwright">
+
+	  by William Shakespeare
+
+
+	</div>
+	<div class="dialog scene thirdClass" id="scene1">
+
+	  <h3>ACT I, SCENE III. A room in the palace.</h3>
+
+	  <div class="dialog">
+	  <div class="direction">Enter CELIA and ROSALIND</div>
+
+	  </div>
+
+	  <div id="speech1" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.1">Why, cousin! why, Rosalind! Cupid have mercy! not a word?</div>
+
+	  </div>
+
+	  <div id="speech2" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.2">Not one to throw at a dog.</div>
+
+	  </div>
+
+	  <div id="speech3" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.3">No, thy words are too precious to be cast away upon</div>
+
+	  <div id="scene1.3.4">curs; throw some of them at me; come, lame me with reasons.</div>
+
+	  </div>
+
+	  <div id="speech4" class="character">ROSALIND</div>
+
+	  <div id="speech5" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.8">But is all this for your father?</div>
+
+	  </div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.5">Then there were two cousins laid up; when the one</div>
+	  <div id="scene1.3.6">should be lamed with reasons and the other mad</div>
+
+	  <div id="scene1.3.7">without any.</div>
+	  </div>
+
+	  <div id="speech6" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.9">No, some of it is for my child's father. O, how</div>
+
+	  <div id="scene1.3.10">full of briers is this working-day world!</div>
+
+	  </div>
+
+	  <div id="speech7" class="character">CELIA</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.11">They are but burs, cousin, thrown upon thee in</div>
+	  <div id="scene1.3.12">holiday foolery: if we walk not in the trodden</div>
+
+	  <div id="scene1.3.13">paths our very petticoats will catch them.</div>
+
+	  </div>
+
+	  <div id="speech8" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.14">I could shake them off my coat: these burs are in my heart.</div>
+	  </div>
+
+	  <div id="speech9" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.15">Hem them away.</div>
+
+	  </div>
+
+	  <div id="speech10" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.16">I would try, if I could cry 'hem' and have him.</div>
+	  </div>
+
+	  <div id="speech11" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.17">Come, come, wrestle with thy affections.</div>
+
+	  </div>
+
+	  <div id="speech12" class="character">ROSALIND</div>
+	  <div class="dialog">
+	  <div id="scene1.3.18">O, they take the part of a better wrestler than myself!</div>
+
+	  </div>
+
+	  <div id="speech13" class="character">CELIA</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.19">O, a good wish upon you! you will try in time, in</div>
+	  <div id="scene1.3.20">despite of a fall. But, turning these jests out of</div>
+	  <div id="scene1.3.21">service, let us talk in good earnest: is it</div>
+
+	  <div id="scene1.3.22">possible, on such a sudden, you should fall into so</div>
+
+	  <div id="scene1.3.23">strong a liking with old Sir Rowland's youngest son?</div>
+
+	  </div>
+
+	  <div id="speech14" class="character">ROSALIND</div>
+	  <div class="dialog">
+	  <div id="scene1.3.24">The duke my father loved his father dearly.</div>
+
+	  </div>
+
+	  <div id="speech15" class="character">CELIA</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.25">Doth it therefore ensue that you should love his son</div>
+
+	  <div id="scene1.3.26">dearly? By this kind of chase, I should hate him,</div>
+
+	  <div id="scene1.3.27">for my father hated his father dearly; yet I hate</div>
+
+	  <div id="scene1.3.28">not Orlando.</div>
+
+	  </div>
+
+	  <div id="speech16" class="character">ROSALIND</div>
+
+	  <div title="wtf" class="dialog">
+
+	  <div id="scene1.3.29">No, faith, hate him not, for my sake.</div>
+
+	  </div>
+
+	  <div id="speech17" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.30">Why should I not? doth he not deserve well?</div>
+
+	  </div>
+
+	  <div id="speech18" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.31">Let me love him for that, and do you love him</div>
+	  <div id="scene1.3.32">because I do. Look, here comes the duke.</div>
+	  </div>
+
+	  <div id="speech19" class="character">CELIA</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.33">With his eyes full of anger.</div>
+	  <div class="direction">Enter DUKE FREDERICK, with Lords</div>
+	  </div>
+
+	  <div id="speech20" class="character">DUKE FREDERICK</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.34">Mistress, dispatch you with your safest haste</div>
+
+	  <div id="scene1.3.35">And get you from our court.</div>
+	  </div>
+
+	  <div id="speech21" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.36">Me, uncle?</div>
+
+	  </div>
+
+	  <div id="speech22" class="character">DUKE FREDERICK</div>
+	  <div class="dialog">
+	  <div id="scene1.3.37">You, cousin</div>
+
+	  <div id="scene1.3.38">Within these ten days if that thou be'st found</div>
+
+	  <div id="scene1.3.39">So near our public court as twenty miles,</div>
+
+	  <div id="scene1.3.40">Thou diest for it.</div>
+
+	  </div>
+
+	  <div id="speech23" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.41">                  I do beseech your grace,</div>
+
+	  <div id="scene1.3.42">Let me the knowledge of my fault bear with me:</div>
+	  <div id="scene1.3.43">If with myself I hold intelligence</div>
+
+	  <div id="scene1.3.44">Or have acquaintance with mine own desires,</div>
+
+	  <div id="scene1.3.45">If that I do not dream or be not frantic,--</div>
+
+	  <div id="scene1.3.46">As I do trust I am not--then, dear uncle,</div>
+
+	  <div id="scene1.3.47">Never so much as in a thought unborn</div>
+
+	  <div id="scene1.3.48">Did I offend your highness.</div>
+
+	  </div>
+
+	  <div id="speech24" class="character">DUKE FREDERICK</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.49">Thus do all traitors:</div>
+
+	  <div id="scene1.3.50">If their purgation did consist in words,</div>
+
+	  <div id="scene1.3.51">They are as innocent as grace itself:</div>
+
+	  <div id="scene1.3.52">Let it suffice thee that I trust thee not.</div>
+
+	  </div>
+
+	  <div id="speech25" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.53">Yet your mistrust cannot make me a traitor:</div>
+
+	  <div id="scene1.3.54">Tell me whereon the likelihood depends.</div>
+
+	  </div>
+
+	  <div id="speech26" class="character">DUKE FREDERICK</div>
+	  <div class="dialog">
+
+	  <div id="scene1.3.55">Thou art thy father's daughter; there's enough.</div>
+
+	  </div>
+
+	  <div id="speech27" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.56">So was I when your highness took his dukedom;</div>
+	  <div id="scene1.3.57">So was I when your highness banish'd him:</div>
+
+	  <div id="scene1.3.58">Treason is not inherited, my lord;</div>
+
+	  <div id="scene1.3.59">Or, if we did derive it from our friends,</div>
+
+	  <div id="scene1.3.60">What's that to me? my father was no traitor:</div>
+
+	  <div id="scene1.3.61">Then, good my liege, mistake me not so much</div>
+	  <div id="scene1.3.62">To think my poverty is treacherous.</div>
+
+	  </div>
+
+	  <div id="speech28" class="character">CELIA</div>
+	  <div class="dialog">
+
+	  <div id="scene1.3.63">Dear sovereign, hear me speak.</div>
+
+	  </div>
+
+	  <div id="speech29" class="character">DUKE FREDERICK</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.64">Ay, Celia; we stay'd her for your sake,</div>
+	  <div id="scene1.3.65">Else had she with her father ranged along.</div>
+
+	  </div>
+
+	  <div id="speech30" class="character">CELIA</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.66">I did not then entreat to have her stay;</div>
+	  <div id="scene1.3.67">It was your pleasure and your own remorse:</div>
+	  <div id="scene1.3.68">I was too young that time to value her;</div>
+
+	  <div id="scene1.3.69">But now I know her: if she be a traitor,</div>
+
+	  <div id="scene1.3.70">Why so am I; we still have slept together,</div>
+
+	  <div id="scene1.3.71">Rose at an instant, learn'd, play'd, eat together,</div>
+	  <div id="scene1.3.72">And wheresoever we went, like Juno's swans,</div>
+
+	  <div id="scene1.3.73">Still we went coupled and inseparable.</div>
+	  </div>
+
+	  <div id="speech31" class="character">DUKE FREDERICK</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.74">She is too subtle for thee; and her smoothness,</div>
+	  <div id="scene1.3.75">Her very silence and her patience</div>
+	  <div id="scene1.3.76">Speak to the people, and they pity her.</div>
+	  <div id="scene1.3.77">Thou art a fool: she robs thee of thy name;</div>
+
+	  <div id="scene1.3.78">And thou wilt show more bright and seem more virtuous</div>
+
+	  <div id="scene1.3.79">When she is gone. Then open not thy lips:</div>
+	  <div id="scene1.3.80">Firm and irrevocable is my doom</div>
+	  <div id="scene1.3.81">Which I have pass'd upon her; she is banish'd.</div>
+	  </div>
+
+	  <div id="speech32" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.82">Pronounce that sentence then on me, my liege:</div>
+	  <div id="scene1.3.83">I cannot live out of her company.</div>
+	  </div>
+
+	  <div id="speech33" class="character">DUKE FREDERICK</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.84">You are a fool. You, niece, provide yourself:</div>
+
+	  <div id="scene1.3.85">If you outstay the time, upon mine honour,</div>
+	  <div id="scene1.3.86">And in the greatness of my word, you die.</div>
+	  <div class="direction">Exeunt DUKE FREDERICK and Lords</div>
+	  </div>
+
+	  <div id="speech34" class="character">CELIA</div>
+	  <div class="dialog">
+
+	  <div id="scene1.3.87">O my poor Rosalind, whither wilt thou go?</div>
+
+	  <div id="scene1.3.88">Wilt thou change fathers? I will give thee mine.</div>
+	  <div id="scene1.3.89">I charge thee, be not thou more grieved than I am.</div>
+
+	  </div>
+
+	  <div id="speech35" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.90">I have more cause.</div>
+	  </div>
+
+	  <div id="speech36" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.91">                  Thou hast not, cousin;</div>
+
+	  <div id="scene1.3.92">Prithee be cheerful: know'st thou not, the duke</div>
+
+	  <div id="scene1.3.93">Hath banish'd me, his daughter?</div>
+
+	  </div>
+
+	  <div id="speech37" class="character">ROSALIND</div>
+	  <div class="dialog">
+	  <div id="scene1.3.94">That he hath not.</div>
+
+	  </div>
+
+	  <div id="speech38" class="character">CELIA</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.95">No, hath not? Rosalind lacks then the love</div>
+
+	  <div id="scene1.3.96">Which teacheth thee that thou and I am one:</div>
+	  <div id="scene1.3.97">Shall we be sunder'd? shall we part, sweet girl?</div>
+
+	  <div id="scene1.3.98">No: let my father seek another heir.</div>
+
+	  <div id="scene1.3.99">Therefore devise with me how we may fly,</div>
+
+	  <div id="scene1.3.100">Whither to go and what to bear with us;</div>
+	  <div id="scene1.3.101">And do not seek to take your change upon you,</div>
+	  <div id="scene1.3.102">To bear your griefs yourself and leave me out;</div>
+
+	  <div id="scene1.3.103">For, by this heaven, now at our sorrows pale,</div>
+
+	  <div id="scene1.3.104">Say what thou canst, I'll go along with thee.</div>
+
+	  </div>
+
+	  <div id="speech39" class="character">ROSALIND</div>
+	  <div class="dialog">
+
+	  <div id="scene1.3.105">Why, whither shall we go?</div>
+
+	  </div>
+
+	  <div id="speech40" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.106">To seek my uncle in the forest of Arden.</div>
+	  </div>
+
+	  <div id="speech41" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.107">Alas, what danger will it be to us,</div>
+
+	  <div id="scene1.3.108">Maids as we are, to travel forth so far!</div>
+	  <div id="scene1.3.109">Beauty provoketh thieves sooner than gold.</div>
+
+	  </div>
+
+	  <div id="speech42" class="character">CELIA</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.110">I'll put myself in poor and mean attire</div>
+
+	  <div id="scene1.3.111">And with a kind of umber smirch my face;</div>
+	  <div id="scene1.3.112">The like do you: so shall we pass along</div>
+
+	  <div id="scene1.3.113">And never stir assailants.</div>
+
+	  </div>
+
+	  <div id="speech43" class="character">ROSALIND</div>
+	  <div class="dialog">
+
+	  <div id="scene1.3.114">Were it not better,</div>
+
+	  <div id="scene1.3.115">Because that I am more than common tall,</div>
+
+	  <div id="scene1.3.116">That I did suit me all points like a man?</div>
+
+	  <div id="scene1.3.117">A gallant curtle-axe upon my thigh,</div>
+
+	  <div id="scene1.3.118">A boar-spear in my hand; and--in my heart</div>
+
+	  <div id="scene1.3.119">Lie there what hidden woman's fear there will--</div>
+
+	  <div id="scene1.3.120">We'll have a swashing and a martial outside,</div>
+
+	  <div id="scene1.3.121">As many other mannish cowards have</div>
+
+	  <div id="scene1.3.122">That do outface it with their semblances.</div>
+
+	  </div>
+
+	  <div id="speech44" class="character">CELIA</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.123">What shall I call thee when thou art a man?</div>
+	  </div>
+
+	  <div id="speech45" class="character">ROSALIND</div>
+
+	  <div class="dialog">
+	  <div id="scene1.3.124">I'll have no worse a name than Jove's own page;</div>
+
+	  <div id="scene1.3.125">And therefore look you call me Ganymede.</div>
+
+	  <div id="scene1.3.126">But what will you be call'd?</div>
+
+	  </div>
+
+	  <div id="speech46" class="character">CELIA</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.127">Something that hath a reference to my state</div>
+	  <div id="scene1.3.128">No longer Celia, but Aliena.</div>
+
+	  </div>
+
+	  <div id="speech47" class="character">ROSALIND</div>
+	  <div class="dialog">
+
+	  <div id="scene1.3.129">But, cousin, what if we assay'd to steal</div>
+
+	  <div id="scene1.3.130">The clownish fool out of your father's court?</div>
+
+	  <div id="scene1.3.131">Would he not be a comfort to our travel?</div>
+
+	  </div>
+
+	  <div id="speech48" class="character">CELIA</div>
+
+	  <div class="dialog">
+
+	  <div id="scene1.3.132">He'll go along o'er the wide world with me;</div>
+
+	  <div id="scene1.3.133">Leave me alone to woo him. Let's away,</div>
+	  <div id="scene1.3.134">And get our jewels and our wealth together,</div>
+
+	  <div id="scene1.3.135">Devise the fittest time and safest way</div>
+
+	  <div id="scene1.3.136">To hide us from pursuit that will be made</div>
+
+	  <div id="scene1.3.137">After my flight. Now go we in content</div>
+
+	  <div id="scene1.3.138">To liberty and not to banishment.</div>
+	  <div class="direction">Exeunt</div>
+
+	  </div>
+
+	</div>
+	</div>
+</div>
+</body>
+
+</html>
\ No newline at end of file
diff --git a/lib/lxml/tests/test-document.xslt b/lib/lxml/tests/test-document.xslt
new file mode 100644
index 00000000..5d80c4b6
--- /dev/null
+++ b/lib/lxml/tests/test-document.xslt
@@ -0,0 +1,10 @@
+<?xml version="1.0"?>
+<xsl:stylesheet version="1.0"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+
+  <xsl:template match="/">
+    <test>
+      <xsl:copy-of select="document('')"/>
+    </test>
+  </xsl:template>
+</xsl:stylesheet>
diff --git a/lib/lxml/tests/test-string.xml b/lib/lxml/tests/test-string.xml
new file mode 100644
index 00000000..25ae1809
--- /dev/null
+++ b/lib/lxml/tests/test-string.xml
@@ -0,0 +1,2 @@
+<?xml version="1.0"?>
+<a>Søk på nettet</a>
diff --git a/lib/lxml/tests/test.dtd b/lib/lxml/tests/test.dtd
new file mode 100644
index 00000000..bb620304
--- /dev/null
+++ b/lib/lxml/tests/test.dtd
@@ -0,0 +1,11 @@
+<!ELEMENT a (b)>
+<!ATTLIST a
+    default (valueA|valueB) "valueA"
+>
+
+<!ELEMENT b EMPTY>
+<!ATTLIST b
+    default (valueA|valueB) "valueB"
+>
+
+<!ENTITY c "&#42;">
diff --git a/lib/lxml/tests/test.sch b/lib/lxml/tests/test.sch
new file mode 100644
index 00000000..9fc4815b
--- /dev/null
+++ b/lib/lxml/tests/test.sch
@@ -0,0 +1,8 @@
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
diff --git a/lib/lxml/tests/test.xml b/lib/lxml/tests/test.xml
new file mode 100644
index 00000000..2eccc292
--- /dev/null
+++ b/lib/lxml/tests/test.xml
@@ -0,0 +1,2 @@
+<!DOCTYPE a SYSTEM "test.dtd">
+<a><b></b></a>
diff --git a/lib/lxml/tests/test.xsd b/lib/lxml/tests/test.xsd
new file mode 100644
index 00000000..9a085b32
--- /dev/null
+++ b/lib/lxml/tests/test.xsd
@@ -0,0 +1,8 @@
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
diff --git a/lib/lxml/tests/test1.rng b/lib/lxml/tests/test1.rng
new file mode 100644
index 00000000..bef4d00c
--- /dev/null
+++ b/lib/lxml/tests/test1.rng
@@ -0,0 +1,6 @@
+<grammar ns="http://www.w3.org/1999/xhtml"
+         xmlns="http://relaxng.org/ns/structure/1.0">
+
+<include href="test2.rng"/>
+
+</grammar>
diff --git a/lib/lxml/tests/test1.xslt b/lib/lxml/tests/test1.xslt
new file mode 100644
index 00000000..f25763e1
--- /dev/null
+++ b/lib/lxml/tests/test1.xslt
@@ -0,0 +1,9 @@
+<xsl:stylesheet 
+  xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
+<xsl:include href="test2.xslt" />
+
+<xsl:template match="/">
+<p>Foo</p>
+</xsl:template>
+
+</xsl:stylesheet>
diff --git a/lib/lxml/tests/test2.rng b/lib/lxml/tests/test2.rng
new file mode 100644
index 00000000..f6d03897
--- /dev/null
+++ b/lib/lxml/tests/test2.rng
@@ -0,0 +1,13 @@
+<grammar xmlns="http://relaxng.org/ns/structure/1.0">
+
+<start>
+  <ref name="a" />
+</start>
+
+<define name="a">
+  <element name="a">
+  <text/>
+  </element>
+</define>
+
+</grammar>
diff --git a/lib/lxml/tests/test2.xslt b/lib/lxml/tests/test2.xslt
new file mode 100644
index 00000000..5c01e21a
--- /dev/null
+++ b/lib/lxml/tests/test2.xslt
@@ -0,0 +1,8 @@
+<xsl:stylesheet 
+  xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
+
+<xsl:template match="hello">
+<p>hello</p>
+</xsl:template>
+
+</xsl:stylesheet>
diff --git a/lib/lxml/tests/test_broken.xml b/lib/lxml/tests/test_broken.xml
new file mode 100644
index 00000000..3dd455a3
--- /dev/null
+++ b/lib/lxml/tests/test_broken.xml
@@ -0,0 +1 @@
+<a><b></c></b></a>
\ No newline at end of file
diff --git a/lib/lxml/tests/test_builder.py b/lib/lxml/tests/test_builder.py
new file mode 100644
index 00000000..e09edb60
--- /dev/null
+++ b/lib/lxml/tests/test_builder.py
@@ -0,0 +1,38 @@
+# -*- coding: utf-8 -*-
+import unittest
+
+"""
+Tests that ElementMaker works properly.
+"""
+
+import sys, os.path
+from lxml import etree
+from lxml.builder import E
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import HelperTestCase, BytesIO, _bytes
+
+class BuilderTestCase(HelperTestCase):  # argument handling of lxml.builder.E
+    etree = etree
+
+    def test_build_from_xpath_result(self):
+        class StringSubclass(str): pass  # a str subclass must work as text
+        wrapped = E.b(StringSubclass('Hello'))
+        self.assertEqual(_bytes('<b>Hello</b>'), etree.tostring(wrapped))
+
+    def test_unknown_type_raises(self):
+        class UnknownType(object):
+            pass
+        self.assertRaises(TypeError, E.b, UnknownType())  # E.b(UnknownType())
+
+
+def test_suite():
+    # unittest.makeSuite() was removed in Python 3.13; use the default loader.
+    loader = unittest.defaultTestLoader
+    return unittest.TestSuite([loader.loadTestsFromTestCase(BuilderTestCase)])
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_classlookup.py b/lib/lxml/tests/test_classlookup.py
new file mode 100644
index 00000000..a4277daf
--- /dev/null
+++ b/lib/lxml/tests/test_classlookup.py
@@ -0,0 +1,405 @@
+# -*- coding: utf-8 -*-
+
+"""
+Tests for different Element class lookup mechanisms.
+"""
+
+
+import unittest, os.path, sys, gc
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, HelperTestCase, SillyFileLike, fileInTestDir
+from common_imports import canonicalize, _bytes, _str, BytesIO, StringIO
+
+xml_str = _bytes('''\
+<root xmlns="myNS" xmlns:other="otherNS">
+  <c1 a1="A1" a2="A2" other:a3="A3">
+    <c2 a1="C2">0</c2>
+    <c2>1</c2>
+    <other:c2>2</other:c2>
+  </c1>
+</root>''')
+
+
+class ProxyTestCase(HelperTestCase):
+    """Basic tests for element proxy behaviour: the same Python object must
+    be handed out for the same XML node, and the *Base classes instantiate."""
+    etree = etree
+
+    def test_proxy_reuse(self):
+        root = etree.XML('<a><b><c/></b></a>')
+        b = root.find('b')
+        self.assertTrue(b is root[0])  # find() and indexing give one object
+
+    def test_proxy_reuse_after_gc(self):
+        root = etree.XML('<a><b><c/></b></a>')
+        b = root.find('b')
+        self.assertTrue(self.etree.iselement(b))
+        gc.collect()  # 'b' is still referenced here, so identity must hold
+        self.assertTrue(b is root[0])
+
+    def test_proxy_reuse_after_del_root(self):
+        root = etree.XML('<a><b><c/></b></a>')
+        b = root.find('b')
+        self.assertTrue(self.etree.iselement(b))
+        c = b.find('c')
+        self.assertTrue(self.etree.iselement(c))
+        del root  # only the 'b' and 'c' proxies stay referenced
+        gc.collect()
+        self.assertTrue(b[0] is c)
+
+    def test_proxy_hashing(self):
+        root = etree.XML('<a><b><c/></b></a>')
+        old_elements = set(root.iter())  # keeps all three proxies referenced
+        elements = root.iter()  # second iterator, consumed after 'del root'
+        del root
+        gc.collect()
+
+        missing = len(old_elements)
+        self.assertEqual(3, missing)
+        for new in elements:
+            for old in old_elements:
+                if old == new:
+                    self.assertTrue(old is new)  # equal must mean identical
+                    missing -= 1
+                    break
+            else:  # for/else: no stored proxy compared equal to 'new'
+                self.assertTrue(False, "element '%s' is missing" % new.tag)
+        self.assertEqual(0, missing)
+
+    def test_element_base(self):
+        el = self.etree.ElementBase()
+        self.assertEqual('ElementBase', el.tag)  # tag taken from class name
+        root = self.etree.ElementBase()
+        root.append(el)
+        self.assertEqual('ElementBase', root[0].tag)
+
+    def test_element_base_children(self):
+        el = self.etree.ElementBase(etree.ElementBase())  # child as argument
+        self.assertEqual('ElementBase', el.tag)
+        self.assertEqual(1, len(el))
+        self.assertEqual('ElementBase', el[0].tag)
+
+        root = self.etree.ElementBase()
+        root.append(el)
+        self.assertEqual('ElementBase', root[0].tag)
+        self.assertEqual('ElementBase', root[0][0].tag)
+
+    def test_comment_base(self):
+        el = self.etree.CommentBase('some text')
+        self.assertEqual(self.etree.Comment, el.tag)  # tag is the factory
+        self.assertEqual('some text', el.text)
+        root = self.etree.Element('root')
+        root.append(el)
+        self.assertEqual('some text', root[0].text)
+
+    def test_pi_base(self):
+        el = self.etree.PIBase('the target', 'some text')
+        self.assertEqual(self.etree.ProcessingInstruction, el.tag)
+        self.assertEqual('some text', el.text)
+        root = self.etree.Element('root')
+        root.append(el)
+        self.assertEqual('some text', root[0].text)
+
+
+class ClassLookupTestCase(HelperTestCase):
+    """Test cases for different Element class lookup mechanisms.
+    """
+    etree = etree
+
+    def tearDown(self):
+        etree.set_element_class_lookup()  # presumably resets the global lookup
+        super(ClassLookupTestCase, self).tearDown()
+
+    def test_namespace_lookup(self):
+        class TestElement(etree.ElementBase):
+            FIND_ME = "namespace class"
+
+        ns_lookup = etree.ElementNamespaceClassLookup()
+        etree.set_element_class_lookup(ns_lookup)
+        # NOTE(review): the None key presumably registers the default class
+        # for every tag in "myNS" -- confirm against the lxml documentation.
+        ns_lookup.get_namespace("myNS")[None] = TestElement
+
+        root = etree.XML(xml_str)
+        self.assertEqual(root.FIND_ME, TestElement.FIND_ME)
+        c1 = root[0]
+        self.assertEqual(c1.FIND_ME, TestElement.FIND_ME)
+        # the last child, <other:c2>, is in "otherNS" and must stay plain
+        self.assertFalse(hasattr(c1[-1], 'FIND_ME'))
+
+    def test_default_class_lookup(self):  # one class per node kind
+        class TestElement(etree.ElementBase):
+            FIND_ME = "default element"
+        class TestComment(etree.CommentBase):
+            FIND_ME = "default comment"
+        class TestPI(etree.PIBase):
+            FIND_ME = "default pi"
+
+        parser = etree.XMLParser()
+
+        lookup = etree.ElementDefaultClassLookup(
+            element=TestElement, comment=TestComment, pi=TestPI)
+        parser.set_element_class_lookup(lookup)  # set on this parser only
+
+        root = etree.XML(_bytes("""<?xml version='1.0'?>
+        <root>
+          <?myPI?>
+          <!-- hi -->
+        </root>
+        """), parser)
+
+        self.assertEqual("default element", root.FIND_ME)
+        self.assertEqual("default pi", root[0].FIND_ME)  # <?myPI?>
+        self.assertEqual("default comment", root[1].FIND_ME)  # <!-- hi -->
+
+    def test_default_class_lookup_pull_parser(self):  # same, fed in pieces
+        class TestElement(etree.ElementBase):
+            FIND_ME = "default element"
+        class TestComment(etree.CommentBase):
+            FIND_ME = "default comment"
+        class TestPI(etree.PIBase):
+            FIND_ME = "default pi"
+
+        parser = etree.XMLPullParser(events=('start', 'end', 'comment', 'pi'))
+        lookup = etree.ElementDefaultClassLookup(
+            element=TestElement, comment=TestComment, pi=TestPI)
+        parser.set_element_class_lookup(lookup)
+
+        events_seen = []  # (event name, FIND_ME of its node), in order
+
+        def add_events(events):
+            for ev, el in events:
+                events_seen.append((ev, el.FIND_ME))
+
+        parser.feed("""<?xml version='1.0'?>
+        <root>
+          <?myPI?>
+        """)
+        add_events(parser.read_events())  # drain events after every chunk
+
+        parser.feed("<!-- hi -->")
+        add_events(parser.read_events())
+
+        parser.feed("</root>")
+        root = parser.close()
+        add_events(parser.read_events())
+
+        self.assertEqual([
+            ('start',   "default element"),
+            ('pi',      "default pi"),
+            ('comment', "default comment"),
+            ('end',     "default element"),
+        ], events_seen)
+
+        self.assertEqual("default element", root.FIND_ME)
+        self.assertEqual("default pi", root[0].FIND_ME)  # <?myPI?>
+        self.assertEqual("default comment", root[1].FIND_ME)  # <!-- hi -->
+
+    def test_evil_class_lookup(self):  # lookup() returning odd values
+        class MyLookup(etree.CustomElementClassLookup):
+            def lookup(self, t, d, ns, name):
+                if name == 'none':
+                    return None  # no class chosen; parsing must still work
+                elif name == 'obj':
+                    return object()  # not a class: must end in a TypeError
+                else:
+                    return etree.ElementBase
+
+        parser = etree.XMLParser()
+        parser.set_element_class_lookup(MyLookup())
+
+        root = etree.XML(_bytes('<none/>'), parser)
+        self.assertEqual('none', root.tag)
+
+        self.assertRaises(
+            TypeError,
+            etree.XML, _bytes("<obj />"), parser)
+
+        root = etree.XML(_bytes('<root/>'), parser)  # still usable afterwards
+        self.assertEqual('root', root.tag)
+
+    def test_class_lookup_type_mismatch(self):
+        class MyLookup(etree.CustomElementClassLookup):
+            def lookup(self, t, d, ns, name):  # wrong kind for all but <root>
+                if t == 'element':
+                    if name == 'root':
+                        return etree.ElementBase
+                    return etree.CommentBase
+                elif t == 'comment':
+                    return etree.PIBase
+                elif t == 'PI':
+                    return etree.EntityBase
+                elif t == 'entity':
+                    return etree.ElementBase
+                else:
+                    raise ValueError('got type %s' % t)
+
+        parser = etree.XMLParser(resolve_entities=False)
+        parser.set_element_class_lookup(MyLookup())
+
+        root = etree.XML(_bytes('<root></root>'), parser)
+        self.assertEqual('root', root.tag)
+        self.assertEqual(etree.ElementBase, type(root))
+
+        root = etree.XML(_bytes("<root><test/></root>"), parser)
+        self.assertRaises(TypeError, root.__getitem__, 0)  # element->Comment
+
+        root = etree.XML(_bytes("<root><!-- test --></root>"), parser)
+        self.assertRaises(TypeError, root.__getitem__, 0)  # comment->PI
+
+        root = etree.XML(_bytes("<root><?test?></root>"), parser)
+        self.assertRaises(TypeError, root.__getitem__, 0)  # PI->Entity
+
+        root = etree.XML(
+            _bytes('<!DOCTYPE root [<!ENTITY myent "ent">]>'
+                   '<root>&myent;</root>'),
+            parser)
+        self.assertRaises(TypeError, root.__getitem__, 0)  # entity->Element
+
+        root = etree.XML(_bytes('<root><root/></root>'), parser)
+        self.assertEqual('root', root[0].tag)  # matching kind is accepted
+
+    def test_attribute_based_lookup(self):
+        # the class is chosen by the value of the "a1" attribute
+        class TestElement(etree.ElementBase):
+            FIND_ME = "attribute_based"
+
+        classes_by_value = {"A1" : TestElement}
+        attr_lookup = etree.AttributeBasedElementClassLookup(
+            "a1", classes_by_value)
+        etree.set_element_class_lookup(attr_lookup)
+
+        doc = etree.XML(xml_str)
+        # only doc[0] is expected to pick up TestElement
+        self.assertFalse(hasattr(doc, 'FIND_ME'))
+        self.assertEqual(doc[0].FIND_ME, TestElement.FIND_ME)
+        self.assertFalse(hasattr(doc[0][0], 'FIND_ME'))
+
+    def test_custom_lookup(self):
+        # a globally installed custom lookup supplies TestElement for 'c1' only
+        class TestElement(etree.ElementBase):
+            FIND_ME = "custom"
+
+        class MyLookup(etree.CustomElementClassLookup):
+            def lookup(self, t, d, ns, name):
+                # falls through to an implicit None for any other name
+                if name == 'c1':
+                    return TestElement
+
+        etree.set_element_class_lookup(MyLookup())
+        doc = etree.XML(xml_str)
+        self.assertFalse(hasattr(doc, 'FIND_ME'))
+        self.assertEqual(doc[0].FIND_ME, TestElement.FIND_ME)
+        self.assertFalse(hasattr(doc[0][1], 'FIND_ME'))
+
+    def test_custom_lookup_ns_fallback(self):
+        # ElementNamespaceClassLookup wraps MyLookup; both contribute classes below
+        class TestElement1(etree.ElementBase):
+            FIND_ME = "custom"
+
+        class TestElement2(etree.ElementBase):
+            FIND_ME = "nsclasses"
+
+        class MyLookup(etree.CustomElementClassLookup):
+            def lookup(self, t, d, ns, name):
+                if name == 'c1':
+                    return TestElement1
+
+        ns_lookup = etree.ElementNamespaceClassLookup(MyLookup())
+        etree.set_element_class_lookup(ns_lookup)
+
+        # register TestElement2 under the None key of namespace "otherNS"
+        other_ns = ns_lookup.get_namespace("otherNS")
+        other_ns[None] = TestElement2
+
+        doc = etree.XML(xml_str)
+        self.assertFalse(hasattr(doc, 'FIND_ME'))
+        self.assertEqual(doc[0].FIND_ME, TestElement1.FIND_ME)
+        self.assertFalse(hasattr(doc[0][1], 'FIND_ME'))
+        self.assertEqual(doc[0][-1].FIND_ME, TestElement2.FIND_ME)
+
+    def test_parser_based_lookup(self):
+        # with ParserBasedElementClassLookup set globally, only the parser that
+        class TestElement(etree.ElementBase):
+            FIND_ME = "parser_based"
+
+        class MyLookup(etree.CustomElementClassLookup):
+            def lookup(self, t, d, ns, name):
+                return TestElement
+
+        etree.set_element_class_lookup(etree.ParserBasedElementClassLookup())
+
+        custom_parser = etree.XMLParser()
+        custom_parser.set_element_class_lookup(MyLookup())
+
+        # ... was given MyLookup is expected to produce TestElement instances
+        doc = etree.parse(BytesIO(xml_str), custom_parser).getroot()
+        self.assertEqual(doc.FIND_ME, TestElement.FIND_ME)
+        self.assertEqual(doc[0].FIND_ME, TestElement.FIND_ME)
+
+        # no parser argument here, so MyLookup is not involved
+        doc = etree.parse(BytesIO(xml_str)).getroot()
+        self.assertFalse(hasattr(doc, 'FIND_ME'))
+        self.assertFalse(hasattr(doc[0], 'FIND_ME'))
+
+    def test_class_lookup_reentry(self):
+        # call root.find() from inside lookup() and check root[0] stays usable
+        class TestElement(etree.ElementBase):
+            FIND_ME = "here"
+
+        root = None
+        class MyLookup(etree.CustomElementClassLookup):
+            el = None
+            def lookup(self, t, d, ns, name):
+                # root is only bound once XML() below has returned, so the
+                # nested find() happens at most once and never before that
+                if root is not None and self.el is None and name == "a":
+                    self.el = []
+                    self.el.append(root.find(name))
+                return TestElement
+
+        reentry_parser = self.etree.XMLParser()
+        reentry_parser.set_element_class_lookup(MyLookup())
+
+        root = self.etree.XML(
+            _bytes('<root><a>A</a><b xmlns="test">B</b></root>'), reentry_parser)
+
+        first = root[0]
+        self.assertEqual(first.tag, "a")
+        self.assertEqual(root[0].tag, "a")
+        del first
+        self.assertEqual(root[0].tag, "a")
+
+    def test_lookup_without_fallback(self):
+        # a lookup whose __init__ skips the base initialiser must still be usable
+        class Foo(etree.ElementBase):
+            def custom(self):
+                return "test"
+
+        class Lookup(etree.CustomElementClassLookup):
+            def __init__(self):
+                # no super call here, so no fallback is set
+                pass
+
+            def lookup(self, node_type, document, namespace, name):
+                return Foo
+
+        bare_parser = self.etree.XMLParser()
+        bare_parser.set_element_class_lookup(Lookup())
+
+        foo = etree.XML('<foo/>', bare_parser)
+        self.assertEqual("test", foo.custom())
+
+
+def test_suite():
+    """Build a suite from ProxyTestCase and ClassLookupTestCase."""
+    return unittest.TestSuite([
+        unittest.makeSuite(ProxyTestCase),
+        unittest.makeSuite(ClassLookupTestCase)])
+
+if __name__ == '__main__':  # run directly: only print a hint, no tests are executed here
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_css.py b/lib/lxml/tests/test_css.py
new file mode 100644
index 00000000..73fa5d52
--- /dev/null
+++ b/lib/lxml/tests/test_css.py
@@ -0,0 +1,65 @@
+import unittest
+
+import lxml.html
+
+from lxml.tests.common_imports import doctest, HelperTestCase, skipif
+
+try:
+    import cssselect
+except ImportError:
+    cssselect = None
+
+# Fixture markup: one <div> holding an anchor with href and one without.
+HTML = '''
+<div>
+  <a href="foo">link</a>
+  <a>anchor</a>
+</div>
+'''
+
+
+class CSSTestCase(HelperTestCase):
+    """Checks Element.cssselect() match counts on the HTML fixture."""
+    pytestmark = skipif('cssselect is None')
+
+    def test_cssselect(self):
+        div, = lxml.html.fromstring(HTML).xpath('//div')
+
+        def count(selector, expected_count, **kwargs):
+            # compare the number of matches found from the <div> downwards
+            self.assertEqual(len(div.cssselect(selector, **kwargs)), expected_count)
+
+        # plain type selectors
+        for selector, expected in (('div', 1), ('a', 2), ('em', 0)):
+            count(selector, expected)
+        # HTML matches element names case-insensitively ...
+        count('DIV', 1)
+        # ... whereas the XHTML and XML translators do not
+        for language in ('xhtml', 'xml'):
+            count('DIV', 0, translator=language)
+
+        # lxml's :contains() ignores case ...
+        count(':contains("link")', 2)  # matches div and a
+        count(':contains("LInk")', 2)
+        # ... whatever the document language
+        for language in ('xhtml', 'xml'):
+            count(':contains("LInk")', 2, translator=language)
+        # ... while upstream cssselect's own translator is case-sensitive
+        import cssselect
+        count(':contains("link")', 2, translator=cssselect.HTMLTranslator())
+        count(':contains("LInk")', 0, translator=cssselect.HTMLTranslator())
+
+
+def test_suite():
+    """Return the CSS tests, or an empty suite when cssselect is missing."""
+    css_suite = unittest.TestSuite()
+    try:
+        import cssselect
+    except ImportError:
+        # external dependency unavailable: report it and return the empty suite
+        print("Skipping tests in lxml.cssselect - external cssselect package is not installed")
+        return css_suite
+    import lxml.cssselect
+    css_suite.addTests(doctest.DocTestSuite(lxml.cssselect))
+    css_suite.addTests([unittest.makeSuite(CSSTestCase)])
+    return css_suite
diff --git a/lib/lxml/tests/test_doctestcompare.py b/lib/lxml/tests/test_doctestcompare.py
new file mode 100644
index 00000000..5a4fde7c
--- /dev/null
+++ b/lib/lxml/tests/test_doctestcompare.py
@@ -0,0 +1,95 @@
+import sys
+import unittest
+
+from lxml import etree
+from lxml.tests.common_imports import HelperTestCase
+from lxml.doctestcompare import LXMLOutputChecker, PARSE_HTML, PARSE_XML
+
+
+class DummyInput:
+    """Attribute bag: every keyword argument becomes an instance attribute."""
+    def __init__(self, **kw):
+        self.__dict__.update(kw)
+
+
+def indent(elem, level=0):
+    """Re-indent *elem* in place by rewriting blank text/tail whitespace."""
+    pad = "\n" + level*"  "
+    if len(elem):
+        if not (elem.text and elem.text.strip()):
+            elem.text = pad + "  "
+        if not (elem.tail and elem.tail.strip()):
+            elem.tail = pad
+        for child in elem:
+            indent(child, level+1)
+        if not (child.tail and child.tail.strip()):
+            child.tail = pad  # last child: dedent back to this element's level
+    elif level and not (elem.tail and elem.tail.strip()):
+        elem.tail = pad
+
+
+class DoctestCompareTest(HelperTestCase):
+    """Exercises LXMLOutputChecker.collect_diff() on small XML/HTML snippets."""
+    _checker = LXMLOutputChecker()
+
+    def compare(self, want, got, html=False):
+        """Parse both inputs and return the checker's diff, left-stripped."""
+        options = PARSE_XML
+        if html:
+            options = PARSE_HTML
+        parse = self._checker.get_parser(want, got, options)
+        return self._checker.collect_diff(
+            parse(want), parse(got), html, indent=0).lstrip()
+
+    def assert_diff(self, want, got, diff, html=False):
+        """Assert that comparing *want* with *got* yields exactly *diff*."""
+        self.assertEqual(self.compare(want, got, html), diff)
+
+    def assert_nodiff(self, want, got, html=False):
+        """Assert that the diff equals *want*, re-indented and serialised."""
+        expected = etree.fromstring(want)
+        expected.tail = '\n'
+        indent(expected)
+        serialised = etree.tostring(
+            expected, encoding='unicode', method=html and 'html' or 'xml')
+        self.assert_diff(want, got, serialised, html=html)
+
+    def test_equal_input(self):
+        markup = '<p title="expected">Expected</p>'
+        self.assert_nodiff(markup, markup)
+
+    def test_differing_tags(self):
+        # a mismatching tag name is reported inline as "(got: ...)"
+        self.assert_diff('<p title="expected">Expected</p>',
+                         '<b title="expected">Expected</b>',
+                         '<p (got: b) title="expected">Expected</p (got: b)>\n')
+
+    def test_tags_upper_lower_case(self):
+        # in XML mode a pure case difference in the tag name is a mismatch
+        self.assert_diff('<p title="expected">Expected</p>',
+                         '<P title="expected">Expected</P>',
+                         '<p (got: P) title="expected">Expected</p (got: P)>\n')
+
+    def test_tags_upper_lower_case_html(self):
+        # in HTML mode the same kind of case difference produces no diff
+        self.assert_nodiff(
+            '<html><body><p title="expected">Expected</p></body></html>',
+            '<HTML><BODY><P title="expected">Expected</P></BODY></HTML>',
+            html=True)
+
+    def test_differing_attributes(self):
+        # attribute values and text content are both annotated
+        self.assert_diff('<p title="expected">Expected</p>',
+                         '<p title="actual">Actual</p>',
+                         '<p title="expected (got: actual)">Expected (got: Actual)</p>\n')
+
+
+def test_suite():
+    """Return the DoctestCompareTest suite (left empty before Python 2.4)."""
+    if sys.version_info < (2,4):
+        return unittest.TestSuite()
+    return unittest.TestSuite([unittest.makeSuite(DoctestCompareTest)])
+
+
+if __name__ == '__main__':  # executed as a script: hand control to unittest.main()
+    unittest.main()
diff --git a/lib/lxml/tests/test_dtd.py b/lib/lxml/tests/test_dtd.py
new file mode 100644
index 00000000..f4f1c0fa
--- /dev/null
+++ b/lib/lxml/tests/test_dtd.py
@@ -0,0 +1,315 @@
+# -*- coding: utf-8 -*-
+
+"""
+Test cases related to DTD parsing and validation
+"""
+
+import unittest, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir)  # needed for Py3
+
+from common_imports import etree, BytesIO, _bytes
+from common_imports import HelperTestCase, make_doctest, skipIf
+from common_imports import fileInTestDir, fileUrlInTestDir
+
+
+class ETreeDtdTestCase(HelperTestCase):
+    """DTD parsing, validation and introspection tests."""
+    def test_dtd(self):
+        pass  # placeholder: nothing is exercised here
+
+    def test_dtd_file(self):
+        # document and DTD are both loaded through fileInTestDir() paths
+        document = etree.parse(fileInTestDir("test.xml")).getroot()
+
+        file_dtd = etree.DTD(fileInTestDir("test.dtd"))
+        self.assertTrue(file_dtd.validate(document))
+
+    def test_dtd_stringio(self):
+        # the DTD is read from an in-memory stream instead of a file
+        stream_dtd = etree.DTD(BytesIO("<!ELEMENT b EMPTY>"))
+        self.assertTrue(stream_dtd.validate(etree.XML(_bytes("<b/>"))))
+
+    def test_dtd_parse_invalid(self):
+        # with dtd_validation=True this document must fail with XMLSyntaxError
+        validating = etree.XMLParser(dtd_validation=True)
+        dtd_path = fileInTestDir("test.dtd")
+        data = _bytes('<!DOCTYPE b SYSTEM "%s"><b><a/></b>' % dtd_path)
+        self.assertRaises(etree.XMLSyntaxError,
+                          etree.fromstring, data, parser=validating)
+
+    def test_dtd_parse_file_not_found(self):
+        # the name of the missing DTD must show up in the exception's error log
+        missing_dtd = fileUrlInTestDir("__nosuch.dtd")
+        validating = etree.XMLParser(dtd_validation=True)
+        data = _bytes('<!DOCTYPE b SYSTEM "%s"><b><a/></b>' % missing_dtd)
+        self.assertRaises(etree.XMLSyntaxError,
+                          etree.fromstring, data, parser=validating)
+        matching = None
+        try:
+            etree.fromstring(data, parser=validating)
+        except etree.XMLSyntaxError:
+            failure = sys.exc_info()[1]
+            self.assertTrue(failure.error_log)
+            self.assertTrue(validating.error_log)
+            matching = [entry.message for entry in failure.error_log
+                        if missing_dtd in entry.message]
+        self.assertTrue(matching)
+
+    def test_dtd_parse_valid(self):
+        # passes as long as parsing with validation does not raise
+        dtd_url = fileUrlInTestDir("test.dtd")
+        data = '<!DOCTYPE a SYSTEM "%s"><a><b/></a>' % dtd_url
+        etree.fromstring(data, parser=etree.XMLParser(dtd_validation=True))
+
+    def test_dtd_parse_valid_file_url(self):
+        # the DOCTYPE references the DTD through fileUrlInTestDir()
+        dtd_url = fileUrlInTestDir("test.dtd")
+        data = '<!DOCTYPE a SYSTEM "%s"><a><b/></a>' % dtd_url
+        etree.fromstring(data, parser=etree.XMLParser(dtd_validation=True))
+
+    def test_dtd_parse_valid_relative(self):
+        validating = etree.XMLParser(dtd_validation=True)
+        document_url = fileUrlInTestDir("test.xml")
+        data = '<!DOCTYPE a SYSTEM "test.dtd"><a><b/></a>'
+        etree.fromstring(data, parser=validating, base_url=document_url)
+
+    def test_dtd_parse_valid_relative_file_url(self):
+        # relative "test.dtd" reference combined with a base_url for the document
+        data = '<!DOCTYPE a SYSTEM "test.dtd"><a><b/></a>'
+        etree.fromstring(data, parser=etree.XMLParser(dtd_validation=True),
+                         base_url=fileUrlInTestDir("test.xml"))
+
+    def test_dtd_invalid(self):
+        empty_b = etree.DTD(BytesIO("<!ELEMENT b EMPTY>"))
+        nested = etree.XML("<b><a/></b>")
+        self.assertRaises(etree.DocumentInvalid, empty_b.assertValid, nested)
+
+    def test_dtd_assertValid(self):
+        # passes as long as assertValid() does not raise
+        matching_dtd = etree.DTD(BytesIO("<!ELEMENT b (a)><!ELEMENT a EMPTY>"))
+        matching_dtd.assertValid(etree.XML("<b><a/></b>"))
+
+    def test_dtd_internal(self):
+        document = etree.XML(_bytes('''
+        <!DOCTYPE b SYSTEM "none" [
+        <!ELEMENT b (a)>
+        <!ELEMENT a EMPTY>
+        ]>
+        <b><a/></b>
+        '''))
+        internal = etree.ElementTree(document).docinfo.internalDTD
+        self.assertTrue(internal)
+        internal.assertValid(document)
+
+    def test_dtd_internal_invalid(self):
+        document = etree.XML(_bytes('''
+        <!DOCTYPE b SYSTEM "none" [
+        <!ELEMENT b (a)>
+        <!ELEMENT a (c)>
+        <!ELEMENT c EMPTY>
+        ]>
+        <b><a/></b>
+        '''))
+        internal = etree.ElementTree(document).docinfo.internalDTD
+        self.assertTrue(internal)
+        self.assertFalse(internal.validate(document))
+
+    def test_dtd_invalid_duplicate_id(self):
+        document = etree.XML(_bytes('''
+        <a><b id="id1"/><b id="id2"/><b id="id1"/></a>
+        '''))
+        id_dtd = etree.DTD(BytesIO(_bytes("""
+        <!ELEMENT a (b*)>
+        <!ATTLIST b
+            id ID #REQUIRED
+        >
+        <!ELEMENT b EMPTY>
+        """)))
+        self.assertFalse(id_dtd.validate(document))
+        self.assertTrue(id_dtd.error_log)
+        self.assertTrue([entry for entry in id_dtd.error_log
+                         if 'id1' in entry.message])
+
+    def test_dtd_api_internal(self):
+        # inspect element and attribute declarations of an internal subset
+        document = etree.XML(_bytes('''
+        <!DOCTYPE b SYSTEM "none" [
+        <!ATTLIST a
+          attr1 (x | y | z) "z"
+          attr2 CDATA #FIXED "X"
+        >
+        <!ELEMENT b (a)>
+        <!ELEMENT a EMPTY>
+        ]>
+        <b><a/></b>
+        '''))
+        internal = etree.ElementTree(document).docinfo.internalDTD
+        self.assertTrue(internal)
+        internal.assertValid(document)
+
+        seen = []
+        for decl in internal.iterelements():
+            seen.append(decl.name)
+            if decl.name != 'a':
+                # the only other declaration is <b>, which has no ATTLIST
+                self.assertEqual('b', decl.name)
+                self.assertEqual(0, len(decl.attributes()))
+                continue
+            self.assertEqual(2, len(decl.attributes()))
+            for attr in decl.iterattributes():
+                if attr.name == 'attr1':
+                    # declared as (x | y | z) with default "z"
+                    self.assertEqual('enumeration', attr.type)
+                    self.assertEqual('none', attr.default)
+                    self.assertEqual('z', attr.default_value)
+                    self.assertEqual(['x', 'y', 'z'], sorted(attr.values()))
+                else:
+                    self.assertEqual('attr2', attr.name)
+                    self.assertEqual('cdata', attr.type)
+                    self.assertEqual('fixed', attr.default)
+                    self.assertEqual('X', attr.default_value)
+        self.assertEqual(['a', 'b'], sorted(seen))
+        self.assertEqual(2, len(internal.elements()))
+
+    def test_internal_dtds(self):
+        # generate internal subsets with 2-4 elements and 0-3 attributes each
+        for el_count in range(2, 5):
+            for attr_count in range(4):
+                document = etree.XML(_bytes('''
+                <!DOCTYPE el0 SYSTEM "none" [
+                ''' + ''.join(['''
+                <!ATTLIST el%d
+                  attr%d (x | y | z) "z"
+                >
+                ''' % (e, a) for a in range(attr_count) for e in range(el_count)
+                ]) + ''.join(['''
+                <!ELEMENT el%d EMPTY>
+                ''' % e for e in range(1, el_count)
+                ]) + '''
+                ''' + '<!ELEMENT el0 (%s)>' % '|'.join([
+                    'el%d' % e for e in range(1, el_count)]) + '''
+                ]>
+                <el0><el1 %s /></el0>
+                ''' % ' '.join(['attr%d="x"' % a for a in range(attr_count)])))
+                internal = etree.ElementTree(document).docinfo.internalDTD
+                self.assertTrue(internal)
+                internal.assertValid(document)
+                # counters start at -1 so that an empty iteration is caught below
+                last_el = -1
+                for last_el, decl in enumerate(internal.iterelements()):
+                    self.assertEqual(attr_count, len(decl.attributes()))
+                    last_attr = -1
+                    for last_attr, attr in enumerate(decl.iterattributes()):
+                        self.assertEqual('enumeration', attr.type)
+                        self.assertEqual('none', attr.default)
+                        self.assertEqual('z', attr.default_value)
+                        self.assertEqual(['x', 'y', 'z'], sorted(attr.values()))
+                    self.assertEqual(attr_count - 1, last_attr)
+                self.assertEqual(el_count - 1, last_el)
+                self.assertEqual(el_count, len(internal.elements()))
+
+    def test_dtd_broken(self):
+        broken_source = BytesIO("<!ELEMENT b HONKEY>")
+        self.assertRaises(etree.DTDParseError, etree.DTD, broken_source)
+
+    def test_parse_file_dtd(self):
+        # parse test.xml with attribute_defaults=True, then read "default"
+        defaulting = etree.XMLParser(attribute_defaults=True)
+
+        tree = etree.parse(fileInTestDir('test.xml'), defaulting)
+        top = tree.getroot()
+
+        # the root and its first child carry different values
+        self.assertEqual(
+            "valueA", top.get("default"))
+        self.assertEqual(
+            "valueB", top[0].get("default"))
+
+    @skipIf(etree.LIBXML_VERSION == (2, 9, 0),
+            "DTD loading is broken for incremental parsing in libxml2 2.9.0")
+    def test_iterparse_file_dtd_start(self):
+        # 'start' events report valueA before valueB
+        start_events = etree.iterparse(
+            fileInTestDir("test.xml"), events=('start',),
+            attribute_defaults=True)
+        seen_defaults = [node.get("default")
+                         for _event, node in start_events]
+        self.assertEqual(
+            ["valueA", "valueB"], seen_defaults)
+
+    @skipIf(etree.LIBXML_VERSION == (2, 9, 0),
+            "DTD loading is broken for incremental parsing in libxml2 2.9.0")
+    def test_iterparse_file_dtd_end(self):
+        # 'end' events report valueB before valueA
+        end_events = etree.iterparse(
+            fileInTestDir("test.xml"), events=('end',),
+            attribute_defaults=True)
+        seen_defaults = [node.get("default")
+                         for _event, node in end_events]
+        self.assertEqual(
+            ["valueB", "valueA"], seen_defaults)
+
+    def test_dtd_attrs(self):
+        # walk the introspection API: elements, attributes, entities, DTD metadata
+        file_dtd = etree.DTD(fileUrlInTestDir("test.dtd"))
+        # DTD.system_url
+        self.assertTrue(file_dtd.system_url.endswith("test.dtd"))
+
+        # first element declaration and its content model
+        elem_a = file_dtd.elements()[0]
+        self.assertEqual(elem_a.name, "a")
+        self.assertEqual(elem_a.type, "element")
+        self.assertEqual(elem_a.content.name, "b")
+        self.assertEqual(elem_a.content.type, "element")
+        self.assertEqual(elem_a.content.occur, "once")
+
+        default_attr = elem_a.attributes()[0]
+        self.assertEqual(default_attr.name, "default")
+        self.assertEqual(default_attr.type, "enumeration")
+        self.assertEqual(default_attr.values(), ["valueA", "valueB"])
+        self.assertEqual(default_attr.default_value, "valueA")
+
+        elem_b = file_dtd.elements()[1]
+        self.assertEqual(elem_b.name, "b")
+        self.assertEqual(elem_b.type, "empty")
+        self.assertEqual(elem_b.content, None)
+
+        # first entity declaration
+        entity = file_dtd.entities()[0]
+        self.assertEqual(entity.name, "c")
+        self.assertEqual(entity.orig, "&#42;")
+        self.assertEqual(entity.content, "*")
+
+        # DTD.name of an internal subset
+        document = etree.XML(_bytes('''
+        <!DOCTYPE a SYSTEM "none" [
+        <!ELEMENT a EMPTY>
+        ]>
+        <a/>
+        '''))
+        internal = etree.ElementTree(document).docinfo.internalDTD
+        self.assertEqual(internal.name, "a")
+
+        # DTD.name and DTD.system_url when the DOCTYPE uses a relative reference
+        validating = etree.XMLParser(dtd_validation=True)
+        data = '<!DOCTYPE a SYSTEM "test.dtd"><a><b/></a>'
+        validated = etree.fromstring(data, parser=validating,
+                                     base_url=fileUrlInTestDir("test.xml"))
+
+        referenced = validated.getroottree().docinfo.internalDTD
+        self.assertEqual(referenced.name, "a")
+        self.assertEqual(referenced.system_url, "test.dtd")
+
+
+def test_suite():
+    """Combine ETreeDtdTestCase with the doc/validation.txt doctest."""
+    dtd_suite = unittest.TestSuite()
+    dtd_suite.addTests([unittest.makeSuite(ETreeDtdTestCase)])
+    dtd_suite.addTests([make_doctest('../../../doc/validation.txt')])
+    return dtd_suite
+
+if __name__ == '__main__':  # run directly: only print a hint, no tests are executed here
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_elementtree.py b/lib/lxml/tests/test_elementtree.py
new file mode 100644
index 00000000..764a22cc
--- /dev/null
+++ b/lib/lxml/tests/test_elementtree.py
@@ -0,0 +1,4136 @@
+# -*- coding: utf-8 -*-
+
+"""
+Tests for the ElementTree API
+
+Only test cases that apply equally well to etree and ElementTree
+belong here. Note that there is a second test module called test_io.py
+for IO related test cases.
+"""
+
+import unittest
+import os, re, tempfile, copy, operator, gc, sys
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import StringIO, BytesIO, etree
+from common_imports import ElementTree, cElementTree, ET_VERSION, CET_VERSION
+from common_imports import filter_by_version, fileInTestDir, canonicalize, HelperTestCase
+from common_imports import _str, _bytes, unicode, next
+# Skip the cElementTree comparison for versions <= 1.0.7 and on Python >= 3.3.
+if cElementTree is not None and (CET_VERSION <= (1,0,7) or sys.version_info >= (3,3)):
+    cElementTree = None
+# Announce which ElementTree implementations are available for comparison.
+if ElementTree is not None:
+    print("Comparing with ElementTree %s" % getattr(ElementTree, "VERSION", "?"))
+
+if cElementTree is not None:
+    print("Comparing with cElementTree %s" % getattr(cElementTree, "VERSION", "?"))
+
+try:
+    reversed
+except NameError:
+    # Python 2.3 has no reversed() builtin; fall back to a reversed list copy
+    def reversed(seq):
+        """Return the items of *seq* as a new list in reverse order."""
+        return list(seq)[::-1]
+
+class _ETreeTestCaseBase(HelperTestCase):
+    etree = None
+    required_versions_ET = {}
+    required_versions_cET = {}
+
+    def XMLParser(self, **kwargs):
+        try:
+            factory = self.etree.XMLParser
+        except AttributeError:  # only accepted when the module name contains 'ElementTree'
+            assert 'ElementTree' in self.etree.__name__
+            factory = self.etree.TreeBuilder
+        return factory(**kwargs)
+
+    def test_element(self):
+        for _attempt in range(10):  # each new Element must start without text/tail
+            fresh = self.etree.Element('foo')
+            self.assertEqual(fresh.tag, 'foo')
+            self.assertEqual(fresh.text, None)
+            self.assertEqual(fresh.tail, None)
+
+    def test_simple(self):
+        # append() adds children in order; indexing past the end fails
+        Element = self.etree.Element
+        tags = ('one', 'two', 'three')
+        parent = Element('root')
+        for tag in tags:
+            parent.append(Element(tag))
+        self.assertEqual(3, len(parent))
+        for index, tag in enumerate(tags):
+            self.assertEqual(tag, parent[index].tag)
+        # index 3 is one past the last child
+        self.assertRaises(IndexError, operator.getitem, parent, 3)
+
+    # test weird dictionary interaction leading to segfault previously
+    def test_weird_dict_interaction(self):
+        outer = self.etree.Element('root')
+        self.assertEqual(outer.tag, "root")
+        parsed = self.etree.ElementTree(file=BytesIO('<foo>Foo</foo>'))
+        self.assertEqual(parsed.getroot().tag, "foo")
+        self.assertEqual(parsed.getroot().text, "Foo")
+        outer.append(self.etree.Element('baz'))
+        self.assertEqual(outer.tag, "root")
+        self.assertEqual(outer[0].tag, "baz")
+
+    def test_subelement(self):
+        # SubElement() attaches each new child to the given parent
+        make_child = self.etree.SubElement
+        parent = self.etree.Element('root')
+        tags = ('one', 'two', 'three')
+        for tag in tags:
+            make_child(parent, tag)
+
+        self.assertEqual(3, len(parent))
+        # children come back in creation order
+        for index, tag in enumerate(tags):
+            self.assertEqual(tag, parent[index].tag)
+        
+    def test_element_contains(self):
+        # `in` must be true only for an element's own children
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        single = Element('root')
+        SubElement(single, 'one')
+        self.assertTrue(single[0] in single)
+
+        pair = Element('root')
+        SubElement(pair, 'two')
+        SubElement(pair, 'three')
+        self.assertTrue(pair[0] in pair)
+        self.assertTrue(pair[1] in pair)
+        # children of the other tree, and None, are not contained
+        self.assertFalse(single[0] in pair)
+        self.assertFalse(pair[0] in single)
+        self.assertFalse(None in pair)
+
+    def test_element_indexing_with_text(self):
+        # leading text is not a child: only <one> is indexable
+        source = BytesIO('<doc>Test<one>One</one></doc>')
+        tree = self.etree.ElementTree(file=source)
+        top = tree.getroot()
+        self.assertEqual(1, len(top))
+        self.assertEqual('one', top[0].tag)
+        # index 1 is one past the only child
+        self.assertRaises(IndexError, operator.getitem, top, 1)
+        
+    def test_element_indexing_with_text2(self):
+        # the "hm" text between <two> and <three> is not counted as a child
+        data = BytesIO('<doc><one>One</one><two>Two</two>hm<three>Three</three></doc>')
+        tree = self.etree.ElementTree(file=data)
+        top = tree.getroot()
+        self.assertEqual(3, len(top))
+        # children keep their document order
+        self.assertEqual('one', top[0].tag)
+        self.assertEqual('two', top[1].tag)
+        self.assertEqual('three', top[2].tag)
+
+    def test_element_indexing_only_text(self):
+        # an element holding nothing but text has no children
+        source = BytesIO('<doc>Test</doc>')
+        tree = self.etree.ElementTree(file=source)
+        top = tree.getroot()
+
+        self.assertEqual(0, len(top))
+
+    def test_element_indexing_negative(self):
+        # negative indices address children from the end, for get/set/del
+        SubElement = self.etree.SubElement
+        parent = self.etree.Element('a')
+        first = SubElement(parent, 'b')
+        second = SubElement(parent, 'c')
+        third = SubElement(parent, 'd')
+        self.assertEqual(third, parent[-1])
+        self.assertEqual(second, parent[-2])
+        self.assertEqual(first, parent[-3])
+        self.assertRaises(IndexError, operator.getitem, parent, -4)
+        parent[-1] = replacement = self.etree.Element('e')
+        self.assertEqual(replacement, parent[-1])
+        del parent[-1]
+        self.assertEqual(2, len(parent))
+        
+    def test_elementtree(self):
+        # ElementTree(file=...) parses a stream and exposes its root
+        source = BytesIO('<doc><one>One</one><two>Two</two></doc>')
+        tree = self.etree.ElementTree(file=source)
+        top = tree.getroot()
+
+        self.assertEqual(2, len(top))
+        self.assertEqual('one', top[0].tag)
+        self.assertEqual('two', top[1].tag)
+
+    def test_text(self):
+        # character data directly inside an element is its .text
+        source = BytesIO('<doc>This is a text</doc>')
+        tree = self.etree.ElementTree(file=source)
+        top = tree.getroot()
+
+        self.assertEqual('This is a text', top.text)
+
+    def test_text_empty(self):
+        # an element without any content reports .text as None
+        source = BytesIO('<doc></doc>')
+        tree = self.etree.ElementTree(file=source)
+        top = tree.getroot()
+
+        self.assertEqual(None, top.text)
+
+    def test_text_other(self):
+        # text of a child belongs to the child, not to its parent
+        source = BytesIO('<doc><one>One</one></doc>')
+        tree = self.etree.ElementTree(file=source)
+        top = tree.getroot()
+        # <doc> itself has no direct text
+        self.assertEqual(None, top.text)
+        self.assertEqual('One', top[0].text)
+
+    def test_text_escape_in(self):
+        # the &gt; entity must be decoded when reading .text
+        source = BytesIO('<doc>This is &gt; than a text</doc>')
+        tree = self.etree.ElementTree(file=source)
+        top = tree.getroot()
+
+        self.assertEqual('This is > than a text', top.text)
+
+    def test_text_escape_out(self):
+        # markup characters assigned to .text must show up escaped in assertXML()
+        node = self.etree.Element("a")
+        node.text = "<>&"
+
+        expected = _bytes('<a>&lt;&gt;&amp;</a>')
+        self.assertXML(expected, node)
+
+    def test_text_escape_tostring(self):
+        # tostring() must escape <, > and & found in .text
+        node = self.etree.Element("a")
+        node.text = "<>&"
+
+        expected = _bytes('<a>&lt;&gt;&amp;</a>')
+        serialised = self.etree.tostring(node)
+        self.assertEqual(expected, serialised)
+
+    def test_text_str_subclass(self):
+        # an instance of a str subclass must be accepted as .text
+        class strTest(str):
+            pass
+
+        node = self.etree.Element("a")
+        node.text = strTest("text")
+
+        expected = _bytes('<a>text</a>')
+        self.assertXML(expected, node)
+
+    def test_tail(self):
+        # mixed content: text following a child is stored as that child's .tail
+        source = BytesIO('<doc>This is <i>mixed</i> content.</doc>')
+        tree = self.etree.ElementTree(file=source)
+        top = tree.getroot()
+        self.assertEqual(1, len(top))
+        # text before <i> belongs to <doc>, text after it to <i>'s tail
+        self.assertEqual('This is ', top.text)
+        self.assertEqual(None, top.tail)
+        self.assertEqual('mixed', top[0].text)
+        self.assertEqual(' content.', top[0].tail)
+
+    def test_tail_str_subclass(self):
+        # an instance of a str subclass must be accepted as .tail
+        class strTest(str):
+            pass
+
+        parent = self.etree.Element("a")
+        self.etree.SubElement(parent, "t").tail = strTest("tail")
+
+        # the tail is expected right after the child's closing tag
+        expected = _bytes('<a><t></t>tail</a>')
+        self.assertXML(expected, parent)
+
+    def _test_del_tail(self):
+        # this is discouraged for ET compat, should not be tested...
+        # (the name does not start with "test")
+        doc = self.etree.XML(_bytes('<doc>This is <i>mixed</i> content.</doc>'))
+        # initial state: <i> carries the trailing text as its tail
+        self.assertEqual(1, len(doc))
+        self.assertEqual('This is ', doc.text)
+        self.assertEqual(None, doc.tail)
+        self.assertEqual('mixed', doc[0].text)
+        self.assertEqual(' content.', doc[0].tail)
+
+        del doc[0].tail
+        # after deletion the tail reads as None; everything else is unchanged
+        self.assertEqual(1, len(doc))
+        self.assertEqual('This is ', doc.text)
+        self.assertEqual(None, doc.tail)
+        self.assertEqual('mixed', doc[0].text)
+        self.assertEqual(None, doc[0].tail)
+
+        doc[0].tail = "TAIL"
+        # a tail can be assigned again afterwards
+        self.assertEqual(1, len(doc))
+        self.assertEqual('This is ', doc.text)
+        self.assertEqual(None, doc.tail)
+        self.assertEqual('mixed', doc[0].text)
+        self.assertEqual('TAIL', doc[0].tail)
+
+    def test_ElementTree(self):
+        Element = self.etree.Element
+        ElementTree = self.etree.ElementTree
+        
+        el = Element('hoi')
+        doc = ElementTree(el)
+        root = doc.getroot()
+        self.assertEqual(None, root.text)
+        self.assertEqual('hoi', root.tag)
+
+    def test_attrib(self):
+        ElementTree = self.etree.ElementTree
+        
+        f = BytesIO('<doc one="One" two="Two"/>')
+        doc = ElementTree(file=f)
+        root = doc.getroot()
+        self.assertEqual('One', root.attrib['one'])
+        self.assertEqual('Two', root.attrib['two'])
+        self.assertRaises(KeyError, operator.getitem, root.attrib, 'three')
+
+    def test_attrib_get(self):
+        ElementTree = self.etree.ElementTree
+        
+        f = BytesIO('<doc one="One" two="Two"/>')
+        doc = ElementTree(file=f)
+        root = doc.getroot()
+        self.assertEqual('One', root.attrib.get('one'))
+        self.assertEqual('Two', root.attrib.get('two'))
+        self.assertEqual(None, root.attrib.get('three'))
+        self.assertEqual('foo', root.attrib.get('three', 'foo'))
+
+    def test_attrib_dict(self):
+        ElementTree = self.etree.ElementTree
+
+        f = BytesIO('<doc one="One" two="Two"/>')
+        doc = ElementTree(file=f)
+        root = doc.getroot()
+        attrib = dict(root.attrib)
+        self.assertEqual('One', attrib['one'])
+        self.assertEqual('Two', attrib['two'])
+        self.assertRaises(KeyError, operator.getitem, attrib, 'three')
+
+    def test_attrib_copy(self):
+        ElementTree = self.etree.ElementTree
+
+        f = BytesIO('<doc one="One" two="Two"/>')
+        doc = ElementTree(file=f)
+        root = doc.getroot()
+        attrib = copy.copy(root.attrib)
+        self.assertEqual('One', attrib['one'])
+        self.assertEqual('Two', attrib['two'])
+        self.assertRaises(KeyError, operator.getitem, attrib, 'three')
+
+    def test_attrib_deepcopy(self):
+        ElementTree = self.etree.ElementTree
+
+        f = BytesIO('<doc one="One" two="Two"/>')
+        doc = ElementTree(file=f)
+        root = doc.getroot()
+        attrib = copy.deepcopy(root.attrib)
+        self.assertEqual('One', attrib['one'])
+        self.assertEqual('Two', attrib['two'])
+        self.assertRaises(KeyError, operator.getitem, attrib, 'three')
+
+    def test_attributes_get(self):
+        ElementTree = self.etree.ElementTree
+        
+        f = BytesIO('<doc one="One" two="Two"/>')
+        doc = ElementTree(file=f)
+        root = doc.getroot()
+        self.assertEqual('One', root.get('one'))
+        self.assertEqual('Two', root.get('two'))
+        self.assertEqual(None, root.get('three'))
+        self.assertEqual('foo', root.get('three', 'foo'))
+
+    def test_attrib_clear(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc one="One" two="Two"/>'))
+        self.assertEqual('One', root.get('one'))
+        self.assertEqual('Two', root.get('two'))
+        root.attrib.clear()
+        self.assertEqual(None, root.get('one'))
+        self.assertEqual(None, root.get('two'))
+
+    def test_attrib_set_clear(self):
+        Element = self.etree.Element
+        
+        root = Element("root", one="One")
+        root.set("two", "Two")
+        self.assertEqual('One', root.get('one'))
+        self.assertEqual('Two', root.get('two'))
+        root.attrib.clear()
+        self.assertEqual(None, root.get('one'))
+        self.assertEqual(None, root.get('two'))
+
+    def test_attrib_ns_clear(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        attribNS = '{http://foo/bar}x'
+
+        parent = Element('parent')
+        parent.set(attribNS, 'a')
+        child = SubElement(parent, 'child')
+        child.set(attribNS, 'b')
+
+        self.assertEqual('a', parent.get(attribNS))
+        self.assertEqual('b', child.get(attribNS))
+
+        parent.clear()
+        self.assertEqual(None, parent.get(attribNS))
+        self.assertEqual('b', child.get(attribNS))
+
+    def test_attrib_pop(self):
+        ElementTree = self.etree.ElementTree
+        
+        f = BytesIO('<doc one="One" two="Two"/>')
+        doc = ElementTree(file=f)
+        root = doc.getroot()
+        self.assertEqual('One', root.attrib['one'])
+        self.assertEqual('Two', root.attrib['two'])
+
+        self.assertEqual('One', root.attrib.pop('one'))
+
+        self.assertEqual(None, root.attrib.get('one'))
+        self.assertEqual('Two', root.attrib['two'])
+
+    def test_attrib_pop_unknown(self):
+        root = self.etree.XML(_bytes('<doc one="One" two="Two"/>'))
+        self.assertRaises(KeyError, root.attrib.pop, 'NONE')
+
+        self.assertEqual('One', root.attrib['one'])
+        self.assertEqual('Two', root.attrib['two'])
+
+    def test_attrib_pop_default(self):
+        root = self.etree.XML(_bytes('<doc one="One" two="Two"/>'))
+        self.assertEqual('Three', root.attrib.pop('three', 'Three'))
+
+    def test_attrib_pop_empty_default(self):
+        root = self.etree.XML(_bytes('<doc/>'))
+        self.assertEqual('Three', root.attrib.pop('three', 'Three'))
+
+    def test_attrib_pop_invalid_args(self):
+        root = self.etree.XML(_bytes('<doc one="One" two="Two"/>'))
+        self.assertRaises(TypeError, root.attrib.pop, 'One', None, None)
+
+    def test_attribute_update_dict(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta"/>'))
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual(
+            [('alpha', 'Alpha'), ('beta', 'Beta')],
+            items)
+
+        root.attrib.update({'alpha' : 'test', 'gamma' : 'Gamma'})
+
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual(
+            [('alpha', 'test'), ('beta', 'Beta'), ('gamma', 'Gamma')],
+            items)
+
+    def test_attribute_update_sequence(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta"/>'))
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual(
+            [('alpha', 'Alpha'), ('beta', 'Beta')],
+            items)
+
+        root.attrib.update({'alpha' : 'test', 'gamma' : 'Gamma'}.items())
+
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual(
+            [('alpha', 'test'), ('beta', 'Beta'), ('gamma', 'Gamma')],
+            items)
+
+    def test_attribute_update_iter(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta"/>'))
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual(
+            [('alpha', 'Alpha'), ('beta', 'Beta')],
+            items)
+
+        root.attrib.update(iter({'alpha' : 'test', 'gamma' : 'Gamma'}.items()))
+
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual(
+            [('alpha', 'test'), ('beta', 'Beta'), ('gamma', 'Gamma')],
+            items)
+
+    def test_attribute_update_attrib(self):
+        XML = self.etree.XML
+
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta"/>'))
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual(
+            [('alpha', 'Alpha'), ('beta', 'Beta')],
+                                                  items)
+
+        other = XML(_bytes('<doc alpha="test" gamma="Gamma"/>'))
+        root.attrib.update(other.attrib)
+
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual(
+            [('alpha', 'test'), ('beta', 'Beta'), ('gamma', 'Gamma')],
+                                                                     items)
+
+    def test_attribute_keys(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta" gamma="Gamma"/>'))
+        keys = list(root.attrib.keys())
+        keys.sort()
+        self.assertEqual(['alpha', 'beta', 'gamma'], keys)
+
+    def test_attribute_keys2(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta" gamma="Gamma"/>'))
+        keys = list(root.keys())
+        keys.sort()
+        self.assertEqual(['alpha', 'beta', 'gamma'], keys)
+
+    def test_attribute_items2(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta" gamma="Gamma"/>'))
+        items = list(root.items())
+        items.sort()
+        self.assertEqual(
+            [('alpha','Alpha'), ('beta','Beta'), ('gamma','Gamma')],
+            items)
+
+    def test_attribute_keys_ns(self):
+        XML = self.etree.XML
+
+        root = XML(_bytes('<foo bar="Bar" xmlns:ns="http://ns.codespeak.net/test" ns:baz="Baz" />'))
+        keys = list(root.keys())
+        keys.sort()
+        self.assertEqual(['bar', '{http://ns.codespeak.net/test}baz'],
+                          keys)
+        
+    def test_attribute_values(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta" gamma="Gamma"/>'))
+        values = list(root.attrib.values())
+        values.sort()
+        self.assertEqual(['Alpha', 'Beta', 'Gamma'], values)
+
+    def test_attribute_values_ns(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<foo bar="Bar" xmlns:ns="http://ns.codespeak.net/test" ns:baz="Baz" />'))
+        values = list(root.attrib.values())
+        values.sort()
+        self.assertEqual(
+            ['Bar', 'Baz'], values)
+        
+    def test_attribute_items(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta" gamma="Gamma"/>'))
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual([
+            ('alpha', 'Alpha'),
+            ('beta', 'Beta'),
+            ('gamma', 'Gamma'),
+            ], 
+            items)
+
+    def test_attribute_items_ns(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<foo bar="Bar" xmlns:ns="http://ns.codespeak.net/test" ns:baz="Baz" />'))
+        items = list(root.attrib.items())
+        items.sort()
+        self.assertEqual(
+            [('bar', 'Bar'), ('{http://ns.codespeak.net/test}baz', 'Baz')],
+            items)
+
+    def test_attribute_str(self):
+        XML = self.etree.XML
+
+        expected = "{'{http://ns.codespeak.net/test}baz': 'Baz', 'bar': 'Bar'}"
+        alternative = "{'bar': 'Bar', '{http://ns.codespeak.net/test}baz': 'Baz'}"
+        
+        root = XML(_bytes('<foo bar="Bar" xmlns:ns="http://ns.codespeak.net/test" ns:baz="Baz" />'))
+        try:
+            self.assertEqual(expected, str(root.attrib))
+        except AssertionError:
+            self.assertEqual(alternative, str(root.attrib))
+
+    def test_attribute_contains(self):
+        XML = self.etree.XML
+
+        root = XML(_bytes('<foo bar="Bar" xmlns:ns="http://ns.codespeak.net/test" ns:baz="Baz" />'))
+        self.assertEqual(
+            True, 'bar' in root.attrib)
+        self.assertEqual(
+            False, 'baz' in root.attrib)
+        self.assertEqual(
+            False, 'hah' in root.attrib)
+        self.assertEqual(
+            True,
+            '{http://ns.codespeak.net/test}baz' in root.attrib)
+
+    def test_attribute_set(self):
+        Element = self.etree.Element
+
+        root = Element("root")
+        root.set("attr", "TEST")
+        self.assertEqual("TEST", root.get("attr"))
+
+    def test_attrib_as_attrib(self):
+        Element = self.etree.Element
+
+        root = Element("root")
+        root.set("attr", "TEST")
+        self.assertEqual("TEST", root.attrib["attr"])
+
+        root2 = Element("root2", root.attrib)
+        self.assertEqual("TEST", root2.attrib["attr"])
+
+    def test_attribute_iterator(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta" gamma="Gamma" />'))
+        result = []
+        for key in root.attrib:
+            result.append(key)
+        result.sort()
+        self.assertEqual(['alpha', 'beta', 'gamma'], result)
+
+    def test_attribute_manipulation(self):
+        Element = self.etree.Element
+
+        a = Element('a')
+        a.attrib['foo'] = 'Foo'
+        a.attrib['bar'] = 'Bar'
+        self.assertEqual('Foo', a.attrib['foo'])
+        del a.attrib['foo']
+        self.assertRaises(KeyError, operator.getitem, a.attrib, 'foo')
+
+    def test_del_attribute_ns(self):
+        Element = self.etree.Element
+
+        a = Element('a')
+        a.attrib['{http://a/}foo'] = 'Foo'
+        a.attrib['{http://a/}bar'] = 'Bar'
+        self.assertEqual(None, a.get('foo'))
+        self.assertEqual('Foo', a.get('{http://a/}foo'))
+        self.assertEqual('Foo', a.attrib['{http://a/}foo'])
+
+        self.assertRaises(KeyError, operator.delitem, a.attrib, 'foo')
+        self.assertEqual('Foo', a.attrib['{http://a/}foo'])
+
+        del a.attrib['{http://a/}foo']
+        self.assertRaises(KeyError, operator.getitem, a.attrib, 'foo')
+
+    def test_del_attribute_ns_parsed(self):
+        XML = self.etree.XML
+
+        a = XML(_bytes('<a xmlns:nsa="http://a/" nsa:foo="FooNS" foo="Foo" />'))
+
+        self.assertEqual('Foo', a.attrib['foo'])
+        self.assertEqual('FooNS', a.attrib['{http://a/}foo'])
+
+        del a.attrib['foo']
+        self.assertEqual('FooNS', a.attrib['{http://a/}foo'])
+        self.assertRaises(KeyError, operator.getitem, a.attrib, 'foo')
+        self.assertRaises(KeyError, operator.delitem, a.attrib, 'foo')
+
+        del a.attrib['{http://a/}foo']
+        self.assertRaises(KeyError, operator.getitem, a.attrib, '{http://a/}foo')
+        self.assertRaises(KeyError, operator.getitem, a.attrib, 'foo')
+
+        a = XML(_bytes('<a xmlns:nsa="http://a/" foo="Foo" nsa:foo="FooNS" />'))
+
+        self.assertEqual('Foo', a.attrib['foo'])
+        self.assertEqual('FooNS', a.attrib['{http://a/}foo'])
+
+        del a.attrib['foo']
+        self.assertEqual('FooNS', a.attrib['{http://a/}foo'])
+        self.assertRaises(KeyError, operator.getitem, a.attrib, 'foo')
+
+        del a.attrib['{http://a/}foo']
+        self.assertRaises(KeyError, operator.getitem, a.attrib, '{http://a/}foo')
+        self.assertRaises(KeyError, operator.getitem, a.attrib, 'foo')
+
+    def test_XML(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc>This is a text.</doc>'))
+        self.assertEqual(0, len(root))
+        self.assertEqual('This is a text.', root.text)
+
+    def test_XMLID(self):
+        XMLID = self.etree.XMLID
+        XML   = self.etree.XML
+        xml_text = _bytes('''
+        <document>
+          <h1 id="chapter1">...</h1>
+          <p id="note1" class="note">...</p>
+          <p>Regular paragraph.</p>
+          <p xml:id="xmlid">XML:ID paragraph.</p>
+          <p id="warn1" class="warning">...</p>
+        </document>
+        ''')
+
+        root, dic = XMLID(xml_text)
+        root2 = XML(xml_text)
+        self.assertEqual(self._writeElement(root),
+                          self._writeElement(root2))
+        expected = {
+            "chapter1" : root[0],
+            "note1"    : root[1],
+            "warn1"    : root[4]
+            }
+        self.assertEqual(dic, expected)
+
+    def test_fromstring(self):
+        fromstring = self.etree.fromstring
+
+        root = fromstring('<doc>This is a text.</doc>')
+        self.assertEqual(0, len(root))
+        self.assertEqual('This is a text.', root.text)
+
+    required_versions_ET['test_fromstringlist'] = (1,3)
+    def test_fromstringlist(self):
+        fromstringlist = self.etree.fromstringlist
+
+        root = fromstringlist(["<do", "c>T", "hi", "s is",
+                               " a text.<", "/doc", ">"])
+        self.assertEqual(0, len(root))
+        self.assertEqual('This is a text.', root.text)
+
+    required_versions_ET['test_fromstringlist_characters'] = (1,3)
+    def test_fromstringlist_characters(self):
+        fromstringlist = self.etree.fromstringlist
+
+        root = fromstringlist(list('<doc>This is a text.</doc>'))
+        self.assertEqual(0, len(root))
+        self.assertEqual('This is a text.', root.text)
+
+    required_versions_ET['test_fromstringlist_single'] = (1,3)
+    def test_fromstringlist_single(self):
+        fromstringlist = self.etree.fromstringlist
+
+        root = fromstringlist(['<doc>This is a text.</doc>'])
+        self.assertEqual(0, len(root))
+        self.assertEqual('This is a text.', root.text)
+
+    def test_iselement(self):
+        iselement = self.etree.iselement
+        Element = self.etree.Element
+        ElementTree = self.etree.ElementTree
+        XML = self.etree.XML
+        Comment = self.etree.Comment
+        ProcessingInstruction = self.etree.ProcessingInstruction
+        
+        el = Element('hoi')
+        self.assertTrue(iselement(el))
+
+        el2 = XML(_bytes('<foo/>'))
+        self.assertTrue(iselement(el2))
+
+        tree = ElementTree(element=Element('dag'))
+        self.assertTrue(not iselement(tree))
+        self.assertTrue(iselement(tree.getroot()))
+
+        c = Comment('test')
+        self.assertTrue(iselement(c))
+
+        p = ProcessingInstruction("test", "some text")
+        self.assertTrue(iselement(p))
+        
+    def test_iteration(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc><one/><two>Two</two>Hm<three/></doc>'))
+        result = []
+        for el in root:
+            result.append(el.tag)
+        self.assertEqual(['one', 'two', 'three'], result)
+
+    def test_iteration_empty(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc></doc>'))
+        result = []
+        for el in root:
+            result.append(el.tag)
+        self.assertEqual([], result)
+
+    def test_iteration_text_only(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc>Text</doc>'))
+        result = []
+        for el in root:
+            result.append(el.tag)
+        self.assertEqual([], result)
+
+    def test_iteration_crash(self):
+        # this would cause a crash in the past
+        fromstring = self.etree.fromstring
+        root = etree.fromstring('<html><p></p>x</html>')
+        for elem in root:
+            elem.tail = ''
+
+    def test_iteration_reversed(self):
+        XML = self.etree.XML
+        root = XML(_bytes('<doc><one/><two>Two</two>Hm<three/></doc>'))
+        result = []
+        for el in reversed(root):
+            result.append(el.tag)
+        self.assertEqual(['three', 'two', 'one'], result)
+
+    def test_iteration_subelement(self):
+        XML = self.etree.XML
+
+        root = XML(_bytes('<doc><one/><two>Two</two>Hm<three/></doc>'))
+        result = []
+        add = True
+        for el in root:
+            result.append(el.tag)
+            if add:
+                self.etree.SubElement(root, 'four')
+                add = False
+        self.assertEqual(['one', 'two', 'three', 'four'], result)
+
+    def test_iteration_del_child(self):
+        XML = self.etree.XML
+
+        root = XML(_bytes('<doc><one/><two>Two</two>Hm<three/></doc>'))
+        result = []
+        for el in root:
+            result.append(el.tag)
+            del root[-1]
+        self.assertEqual(['one', 'two'], result)
+
+    def test_iteration_double(self):
+        XML = self.etree.XML
+
+        root = XML(_bytes('<doc><one/><two/></doc>'))
+        result = []
+        for el0 in root:
+            result.append(el0.tag)
+            for el1 in root:
+                result.append(el1.tag)
+        self.assertEqual(['one','one', 'two', 'two', 'one', 'two'], result)
+
+    required_versions_ET['test_itertext'] = (1,3)
+    def test_itertext(self):
+        # ET 1.3+
+        XML = self.etree.XML
+        root = XML(_bytes("<root>RTEXT<a></a>ATAIL<b/><c>CTEXT</c>CTAIL</root>"))
+
+        text = list(root.itertext())
+        self.assertEqual(["RTEXT", "ATAIL", "CTEXT", "CTAIL"],
+                          text)
+
+    required_versions_ET['test_itertext_child'] = (1,3)
+    def test_itertext_child(self):
+        # ET 1.3+
+        XML = self.etree.XML
+        root = XML(_bytes("<root>RTEXT<a></a>ATAIL<b/><c>CTEXT</c>CTAIL</root>"))
+
+        text = list(root[2].itertext())
+        self.assertEqual(["CTEXT"],
+                          text)
+
+    def test_findall(self):
+        XML = self.etree.XML
+        root = XML(_bytes('<a><b><c/></b><b/><c><b/></c></a>'))
+        self.assertEqual(len(list(root.findall("c"))), 1)
+        self.assertEqual(len(list(root.findall(".//c"))), 2)
+        self.assertEqual(len(list(root.findall(".//b"))), 3)
+        self.assertEqual(len(list(root.findall(".//b"))[0]), 1)
+        self.assertEqual(len(list(root.findall(".//b"))[1]), 0)
+        self.assertEqual(len(list(root.findall(".//b"))[2]), 0)
+
+    def test_findall_ns(self):
+        XML = self.etree.XML
+        root = XML(_bytes('<a xmlns:x="X" xmlns:y="Y"><x:b><c/></x:b><b/><c><x:b/><b/></c><b/></a>'))
+        self.assertEqual(len(list(root.findall(".//{X}b"))), 2)
+        self.assertEqual(len(list(root.findall(".//b"))), 3)
+        self.assertEqual(len(list(root.findall("b"))), 2)
+
+    def test_element_with_attributes_keywords(self):
+        Element = self.etree.Element
+        
+        el = Element('tag', foo='Foo', bar='Bar')
+        self.assertEqual('Foo', el.attrib['foo'])
+        self.assertEqual('Bar', el.attrib['bar'])
+
+    def test_element_with_attributes(self):
+        Element = self.etree.Element
+        
+        el = Element('tag', {'foo':'Foo', 'bar':'Bar'})
+        self.assertEqual('Foo', el.attrib['foo'])
+        self.assertEqual('Bar', el.attrib['bar'])
+
+    def test_element_with_attributes_ns(self):
+        Element = self.etree.Element
+
+        el = Element('tag', {'{ns1}foo':'Foo', '{ns2}bar':'Bar'})
+        self.assertEqual('Foo', el.attrib['{ns1}foo'])
+        self.assertEqual('Bar', el.attrib['{ns2}bar'])
+
+    def test_subelement_with_attributes(self):
+        Element =  self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        el = Element('tag')
+        SubElement(el, 'foo', {'foo':'Foo'}, baz="Baz")
+        self.assertEqual("Baz", el[0].attrib['baz'])
+        self.assertEqual('Foo', el[0].attrib['foo'])
+
+    def test_subelement_with_attributes_ns(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        el = Element('tag')
+        SubElement(el, 'foo', {'{ns1}foo':'Foo', '{ns2}bar':'Bar'})
+        self.assertEqual('Foo', el[0].attrib['{ns1}foo'])
+        self.assertEqual('Bar', el[0].attrib['{ns2}bar'])
+        
+    def test_write(self):
+        ElementTree = self.etree.ElementTree
+        XML = self.etree.XML
+
+        for i in range(10):
+            f = BytesIO() 
+            root = XML(_bytes('<doc%s>This is a test.</doc%s>' % (i, i)))
+            tree = ElementTree(element=root)
+            tree.write(f)
+            data = f.getvalue()
+            self.assertEqual(
+                _bytes('<doc%s>This is a test.</doc%s>' % (i, i)),
+                canonicalize(data))
+
+    required_versions_ET['test_write_method_html'] = (1,3)
+    def test_write_method_html(self):
+        ElementTree = self.etree.ElementTree
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        html = Element('html')
+        body = SubElement(html, 'body')
+        p = SubElement(body, 'p')
+        p.text = "html"
+        SubElement(p, 'br').tail = "test"
+
+        tree = ElementTree(element=html)
+        f = BytesIO() 
+        tree.write(f, method="html")
+        data = f.getvalue().replace(_bytes('\n'),_bytes(''))
+
+        self.assertEqual(_bytes('<html><body><p>html<br>test</p></body></html>'),
+                          data)
+
+    required_versions_ET['test_write_method_text'] = (1,3)
+    def test_write_method_text(self):
+        ElementTree = self.etree.ElementTree
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        a.text = "A"
+        a.tail = "tail"
+        b = SubElement(a, 'b')
+        b.text = "B"
+        b.tail = "TAIL"
+        c = SubElement(a, 'c')
+        c.text = "C"
+        
+        tree = ElementTree(element=a)
+        f = BytesIO() 
+        tree.write(f, method="text")
+        data = f.getvalue()
+
+        self.assertEqual(_bytes('ABTAILCtail'),
+                          data)
+        
+    def test_write_fail(self):
+        ElementTree = self.etree.ElementTree
+        XML = self.etree.XML
+
+        tree = ElementTree( XML(_bytes('<doc>This is a test.</doc>')) )
+        self.assertRaises(IOError, tree.write,
+                          "definitely////\\-\\nonexisting\\-\\////FILE")
+
+    # this could trigger a crash, apparently because the document
+    # reference was prematurely garbage collected
+    def test_crash(self):
+        Element = self.etree.Element
+        
+        element = Element('tag')
+        for i in range(10):
+            element.attrib['key'] = 'value'
+            value = element.attrib['key']
+            self.assertEqual(value, 'value')
+            
+    # from doctest; for some reason this caused crashes too
+    def test_write_ElementTreeDoctest(self):
+        Element = self.etree.Element
+        ElementTree = self.etree.ElementTree
+        
+        f = BytesIO()
+        for i in range(10):
+            element = Element('tag%s' % i)
+            self._check_element(element)
+            tree = ElementTree(element)
+            tree.write(f)
+            self._check_element_tree(tree)
+
+    def test_subelement_reference(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        el = Element('foo')
+        el2 = SubElement(el, 'bar')
+        el3 = SubElement(el2, 'baz')
+
+        al = Element('foo2')
+        al2 = SubElement(al, 'bar2')
+        al3 = SubElement(al2, 'baz2')
+
+        # now move al2 into el
+        el.append(al2)
+
+        # now change al3 directly
+        al3.text = 'baz2-modified'
+
+        # it should have changed through this route too
+        self.assertEqual(
+            'baz2-modified',
+            el[1][0].text)
+
+    def test_set_text(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        b = SubElement(a, 'b')
+        a.text = 'hoi'
+        self.assertEqual(
+            'hoi',
+            a.text)
+        self.assertEqual(
+            'b',
+            a[0].tag)
+
+    def test_set_text2(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        a.text = 'hoi'
+        b = SubElement(a ,'b')
+        self.assertEqual(
+            'hoi',
+            a.text)
+        self.assertEqual(
+            'b',
+            a[0].tag)
+
+    def test_set_text_none(self):
+        Element = self.etree.Element
+
+        a = Element('a')
+
+        a.text = 'foo'
+        a.text = None
+
+        self.assertEqual(
+            None,
+            a.text)
+        self.assertXML(_bytes('<a></a>'), a)
+        
+    def test_set_text_empty(self):
+        Element = self.etree.Element
+
+        a = Element('a')
+        self.assertEqual(None, a.text)
+
+        a.text = ''
+        self.assertEqual('', a.text)
+        self.assertXML(_bytes('<a></a>'), a)
+        
+    def test_tail1(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        a.tail = 'dag'
+        self.assertEqual('dag',
+                          a.tail)
+        b = SubElement(a, 'b')
+        b.tail = 'hoi'
+        self.assertEqual('hoi',
+                          b.tail)
+        self.assertEqual('dag',
+                          a.tail)
+
+    def test_tail_append(self):
+        Element = self.etree.Element
+        
+        a = Element('a')
+        b = Element('b')
+        b.tail = 'b_tail'
+        a.append(b)
+        self.assertEqual('b_tail',
+                          b.tail)
+
+    def test_tail_set_twice(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        b = SubElement(a, 'b')
+        b.tail = 'foo'
+        b.tail = 'bar'
+        self.assertEqual('bar',
+                          b.tail)
+        self.assertXML(_bytes('<a><b></b>bar</a>'), a)
+        
+    def test_tail_set_none(self):
+        Element = self.etree.Element
+        a = Element('a')
+        a.tail = 'foo'
+        a.tail = None
+        self.assertEqual(
+            None,
+            a.tail)
+        self.assertXML(_bytes('<a></a>'), a)
+
+    required_versions_ET['test_extend'] = (1,3)
+    def test_extend(self):
+        root = self.etree.Element('foo')
+        for i in range(3):
+            element = self.etree.SubElement(root, 'a%s' % i)
+            element.text = "text%d" % i
+            element.tail = "tail%d" % i
+
+        elements = []
+        for i in range(3):
+            new_element = self.etree.Element("test%s" % i)
+            new_element.text = "TEXT%s" % i
+            new_element.tail = "TAIL%s" % i
+            elements.append(new_element)
+
+        root.extend(elements)
+
+        self.assertEqual(
+            ["a0", "a1", "a2", "test0", "test1", "test2"],
+            [ el.tag for el in root ])
+        self.assertEqual(
+            ["text0", "text1", "text2", "TEXT0", "TEXT1", "TEXT2"],
+            [ el.text for el in root ])
+        self.assertEqual(
+            ["tail0", "tail1", "tail2", "TAIL0", "TAIL1", "TAIL2"],
+            [ el.tail for el in root ])
+
+    def test_comment(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        Comment = self.etree.Comment
+
+        a = Element('a')
+        a.append(Comment('foo'))
+        self.assertEqual(a[0].tag, Comment)
+        self.assertEqual(a[0].text, 'foo')
+
+    # ElementTree < 1.3 adds whitespace around comments
+    required_versions_ET['test_comment_text'] = (1,3)
+    def test_comment_text(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        Comment = self.etree.Comment
+        tostring = self.etree.tostring
+
+        a = Element('a')
+        a.append(Comment('foo'))
+        self.assertEqual(a[0].text, 'foo')
+
+        self.assertEqual(
+            _bytes('<a><!--foo--></a>'),
+            tostring(a))
+
+        a[0].text = "TEST"
+        self.assertEqual(a[0].text, 'TEST')
+
+        self.assertEqual(
+            _bytes('<a><!--TEST--></a>'),
+            tostring(a))
+
+    # ElementTree < 1.3 adds whitespace around comments
+    required_versions_ET['test_comment_whitespace'] = (1,3)
+    def test_comment_whitespace(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        Comment = self.etree.Comment
+        tostring = self.etree.tostring
+
+        a = Element('a')
+        a.append(Comment(' foo  '))
+        self.assertEqual(a[0].text, ' foo  ')
+        self.assertEqual(
+            _bytes('<a><!-- foo  --></a>'),
+            tostring(a))
+        
+    def test_comment_nonsense(self):
+        # Element-style accessors on a comment must behave as if it were empty.
+        c = self.etree.Comment('foo')
+        self.assertEqual({}, c.attrib)
+        self.assertEqual([], list(c.keys()))
+        self.assertEqual([], list(c.items()))
+        self.assertEqual(None, c.get('hoi'))
+        self.assertEqual(0, len(c))
+        # Iterating must yield nothing; assert it instead of looping over
+        # `pass`, which could never fail even if children were produced.
+        self.assertEqual([], list(c))
+
+    def test_pi(self):
+        # lxml.etree separates target and text; the node's tag is the
+        # ProcessingInstruction factory and both parts are serialized.
+        etree = self.etree
+        make_pi = etree.ProcessingInstruction
+
+        root = etree.Element('a')
+        root.append(make_pi('foo', 'some more text'))
+        self.assertEqual(root[0].tag, make_pi)
+        expected = _bytes("<a><?foo some more text?></a>")
+        self.assertXML(expected, root)
+
+    def test_processinginstruction(self):
+        # lxml.etree separates target and text; here the node is built
+        # through the etree.PI name and compared against that same object.
+        etree = self.etree
+        make_pi = etree.PI
+
+        root = etree.Element('a')
+        root.append(make_pi('foo', 'some more text'))
+        self.assertEqual(root[0].tag, make_pi)
+        expected = _bytes("<a><?foo some more text?></a>")
+        self.assertXML(expected, root)
+
+    def test_pi_nonsense(self):
+        # Element-style accessors on a PI must behave as if it were empty.
+        pi = self.etree.ProcessingInstruction('foo')
+        self.assertEqual({}, pi.attrib)
+        self.assertEqual([], list(pi.keys()))
+        self.assertEqual([], list(pi.items()))
+        self.assertEqual(None, pi.get('hoi'))
+        self.assertEqual(0, len(pi))
+        # Iterating must yield nothing; assert it instead of looping over
+        # `pass`, which could never fail even if children were produced.
+        self.assertEqual([], list(pi))
+
+    def test_setitem(self):
+        # Index assignment swaps the child; the replaced node stands alone.
+        etree = self.etree
+
+        root = etree.Element('a')
+        old = etree.SubElement(root, 'b')
+        new = etree.Element('c')
+        root[0] = new
+        self.assertEqual(
+            new,
+            root[0])
+        self.assertXML(_bytes('<a><c></c></a>'),
+                       root)
+        self.assertXML(_bytes('<b></b>'),
+                       old)
+        
+    def test_setitem2(self):
+        # Replace five nested children one by one; a displaced grandchild
+        # must still serialize on its own afterwards.
+        etree = self.etree
+        root = etree.Element('a')
+        for index in range(5):
+            child = etree.SubElement(root, 'b%s' % index)
+            grandchild = etree.SubElement(child, 'c')
+        for index in range(5):
+            repl = etree.Element('d')
+            leaf = etree.SubElement(repl, 'e')
+            root[index] = repl
+        self.assertXML(
+            _bytes('<a><d><e></e></d><d><e></e></d><d><e></e></d><d><e></e></d><d><e></e></d></a>'),
+            root)
+        self.assertXML(_bytes('<c></c>'),
+                       grandchild)
+
+    def test_setitem_replace(self):
+        # Overwrite a child that no local variable refers to.
+        etree = self.etree
+
+        root = etree.Element('a')
+        etree.SubElement(root, 'b')
+        replacement = etree.Element('d')
+        root[0] = replacement
+        self.assertXML(_bytes('<a><d></d></a>'), root)
+
+    def test_setitem_indexerror(self):
+        # Assigning to an index past the last child raises IndexError.
+        etree = self.etree
+
+        root = etree.Element('a')
+        only_child = etree.SubElement(root, 'b')
+
+        self.assertRaises(IndexError, operator.setitem, root, 1, etree.Element('c'))
+
+    def test_setitem_tail(self):
+        # The new child's tail is serialized; the old child's tail is not.
+        etree = self.etree
+
+        root = etree.Element('a')
+        old = etree.SubElement(root, 'b')
+        old.tail = 'B2'
+        new = etree.Element('c')
+        new.tail = 'C2'
+
+        root[0] = new
+        self.assertXML(
+            _bytes('<a><c></c>C2</a>'),
+            root)
+
+    def test_tag_write(self):
+        # Assigning .tag renames the element in place; its child is kept.
+        etree = self.etree
+
+        root = etree.Element('a')
+        child = etree.SubElement(root, 'b')
+
+        root.tag = 'c'
+
+        self.assertEqual(
+            'c',
+            root.tag)
+
+        self.assertXML(
+            _bytes('<c><b></b></c>'),
+            root)
+
+    def test_tag_reset_ns(self):
+        # Retagging a namespaced child with a plain name must stick.
+        etree = self.etree
+        serialize = etree.tostring
+
+        root = etree.Element('{a}a')
+        first = etree.SubElement(root, '{a}b')
+        second = etree.SubElement(root, '{b}b')
+
+        self.assertEqual('{a}b', first.tag)
+
+        first.tag = 'c'
+
+        # can't use C14N here!
+        self.assertEqual('c', first.tag)
+        self.assertEqual(_bytes('<c'), serialize(first)[:2])
+        self.assertTrue(_bytes('<c') in serialize(root))
+
+    def test_tag_reset_root_ns(self):
+        # Retagging a namespaced root with a plain name must stick.
+        etree = self.etree
+        serialize = etree.tostring
+
+        root = etree.Element('{a}a')
+        first = etree.SubElement(root, '{a}b')
+        second = etree.SubElement(root, '{b}b')
+
+        root.tag = 'c'
+
+        self.assertEqual(
+            'c',
+            root.tag)
+
+        # can't use C14N here!
+        self.assertEqual('c', root.tag)
+        self.assertEqual(_bytes('<c'), serialize(root)[:2])
+
+    def test_tag_str_subclass(self):
+        # A tag given as an instance of a str subclass is accepted.
+        class strTest(str):
+            pass
+
+        root = self.etree.Element("a")
+        tag = strTest("TAG")
+        root.tag = tag
+        self.assertXML(_bytes('<TAG></TAG>'),
+                       root)
+
+    def test_delitem(self):
+        # Delete children by index until none remain, then reuse one of them.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+
+        del root[1]
+        self.assertXML(
+            _bytes('<a><b></b><d></d></a>'),
+            root)
+
+        del root[0]
+        self.assertXML(
+            _bytes('<a><d></d></a>'),
+            root)
+
+        del root[0]
+        self.assertXML(
+            _bytes('<a></a>'),
+            root)
+        # move deleted element into other tree afterwards
+        target = etree.Element('other')
+        target.append(c)
+        self.assertXML(
+            _bytes('<other><c></c></other>'),
+            target)
+    
+    def test_del_insert(self):
+        # A subtree deleted from its parent can be inserted back unchanged.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        bs = etree.SubElement(b, 'bs')
+        c = etree.SubElement(root, 'c')
+        cs = etree.SubElement(c, 'cs')
+
+        first = root[0]
+        self.assertXML(
+            _bytes('<a><b><bs></bs></b><c><cs></cs></c></a>'),
+            root)
+        self.assertXML(_bytes('<b><bs></bs></b>'), b)
+        self.assertXML(_bytes('<c><cs></cs></c>'), c)
+
+        del root[0]
+        self.assertXML(
+            _bytes('<a><c><cs></cs></c></a>'),
+            root)
+        self.assertXML(_bytes('<b><bs></bs></b>'), b)
+        self.assertXML(_bytes('<c><cs></cs></c>'), c)
+
+        root.insert(0, first)
+        self.assertXML(
+            _bytes('<a><b><bs></bs></b><c><cs></cs></c></a>'),
+            root)
+        self.assertXML(_bytes('<b><bs></bs></b>'), b)
+        self.assertXML(_bytes('<c><cs></cs></c>'), c)
+
+    def test_del_setitem(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        # Remove a child, then assign it over the sibling that moved to index 0.
+        a = Element('a')
+        b = SubElement(a, 'b')
+        bs = SubElement(b, 'bs')
+        c = SubElement(a, 'c')
+        cs = SubElement(c, 'cs')
+
+        el = a[0]  # the <b> subtree
+        del a[0]  # <c> is now the only child of <a>
+        a[0] = el  # <b> takes the place of <c>
+        self.assertXML(
+            _bytes('<a><b><bs></bs></b></a>'),
+            a)
+        self.assertXML(_bytes('<b><bs></bs></b>'), b)
+        self.assertXML(_bytes('<c><cs></cs></c>'), c)  # replaced subtree is intact
+
+    def test_del_setslice(self):
+        # A deleted subtree can be put back through an empty-slice assignment.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        bs = etree.SubElement(b, 'bs')
+        c = etree.SubElement(root, 'c')
+        cs = etree.SubElement(c, 'cs')
+
+        first = root[0]
+        del root[0]
+        root[0:0] = [first]
+        self.assertXML(
+            _bytes('<a><b><bs></bs></b><c><cs></cs></c></a>'),
+            root)
+        self.assertXML(_bytes('<b><bs></bs></b>'), b)
+        self.assertXML(_bytes('<c><cs></cs></c>'), c)
+
+    def test_replace_slice_tail(self):
+        # Children emptied out via slice assignment keep their tail text.
+        root = self.etree.XML(_bytes('<a><b></b>B2<c></c>C2</a>'))
+        first, second = root
+
+        root[:] = []
+
+        self.assertEqual("B2", first.tail)
+        self.assertEqual("C2", second.tail)
+
+    def test_merge_namespaced_subtree_as_slice(self):
+        XML = self.etree.XML
+        root = XML(_bytes(
+            '<foo><bar xmlns:baz="http://huhu"><puh><baz:bump1 /><baz:bump2 /></puh></bar></foo>'))
+        root[:] = root.findall('.//puh') # delete bar from hierarchy
+        # <puh> now hangs directly below <foo>; xmlns:baz was declared on <bar>
+        # previously, this lost a namespace declaration on bump2
+        result = self.etree.tostring(root)
+        foo = self.etree.fromstring(result)
+        # the checks below run against the re-parsed serialization
+        self.assertEqual('puh', foo[0].tag)
+        self.assertEqual('{http://huhu}bump1', foo[0][0].tag)
+        self.assertEqual('{http://huhu}bump2', foo[0][1].tag)
+
+    def test_delitem_tail(self):
+        # Deleting a parsed child also removes its tail text from the parent.
+        source = BytesIO('<a><b></b>B2<c></c>C2</a>')
+        tree = self.etree.ElementTree(file=source)
+        root = tree.getroot()
+        del root[0]
+        self.assertXML(
+            _bytes('<a><c></c>C2</a>'),
+            root)
+        
+    def test_clear(self):
+        # clear() resets text, tail and attributes but leaves the tag alone.
+
+        node = self.etree.Element('a')
+        node.text = 'foo'
+        node.tail = 'bar'
+        node.set('hoi', 'dag')
+        node.clear()
+        self.assertEqual(None, node.text)
+        self.assertEqual(None, node.tail)
+        self.assertEqual(None, node.get('hoi'))
+        self.assertEqual('a', node.tag)
+
+    def test_clear_sub(self):
+        # clear() also drops the children; the removed subtree stays intact.
+        etree = self.etree
+
+        root = etree.Element('a')
+        root.text = 'foo'
+        root.tail = 'bar'
+        root.set('hoi', 'dag')
+        child = etree.SubElement(root, 'b')
+        grandchild = etree.SubElement(child, 'c')
+        root.clear()
+        self.assertEqual(None, root.text)
+        self.assertEqual(None, root.tail)
+        self.assertEqual(None, root.get('hoi'))
+        self.assertEqual('a', root.tag)
+        self.assertEqual(0, len(root))
+        self.assertXML(_bytes('<a></a>'),
+                       root)
+        self.assertXML(_bytes('<b><c></c></b>'),
+                       child)
+    
+    def test_clear_tail(self):
+        # clear() on a parsed root removes children together with their tails.
+        source = BytesIO('<a><b></b>B2<c></c>C2</a>')
+        tree = self.etree.ElementTree(file=source)
+        root = tree.getroot()
+        root.clear()
+        self.assertXML(
+            _bytes('<a></a>'),
+            root)
+
+    def test_insert(self):
+        # insert() places a new child at the front and between siblings.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.Element('d')
+        root.insert(0, d)
+
+        self.assertEqual(
+            d,
+            root[0])
+
+        self.assertXML(
+            _bytes('<a><d></d><b></b><c></c></a>'),
+            root)
+
+        e = etree.Element('e')
+        root.insert(2, e)
+        self.assertEqual(
+            e,
+            root[2])
+        self.assertXML(
+            _bytes('<a><d></d><b></b><e></e><c></c></a>'),
+            root)
+
+    def test_insert_beyond_index(self):
+        # An insert position past the last child puts the node at the end.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.Element('c')
+
+        root.insert(2, c)
+        self.assertEqual(
+            c,
+            root[1])
+        self.assertXML(
+            _bytes('<a><b></b><c></c></a>'),
+            root)
+
+    def test_insert_negative(self):
+        # insert(-1, x) places x just before the current last child.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+
+        d = etree.Element('d')
+        root.insert(-1, d)
+        self.assertEqual(
+            d,
+            root[-2])
+        self.assertXML(
+            _bytes('<a><b></b><d></d><c></c></a>'),
+            root)
+
+    def test_insert_tail(self):
+        # An inserted element brings its tail text along.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+
+        c = etree.Element('c')
+        c.tail = 'C2'
+
+        root.insert(0, c)
+        self.assertXML(
+            _bytes('<a><c></c>C2<b></b></a>'),
+            root)
+        
+    def test_remove(self):
+        # remove() drops the given child; the next sibling moves to index 0.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+
+        root.remove(b)
+        self.assertEqual(
+            c,
+            root[0])
+        self.assertXML(
+            _bytes('<a><c></c></a>'),
+            root)
+        
+    def test_remove_ns(self):
+        # A removed namespaced child still serializes with its namespace.
+        etree = self.etree
+
+        root = etree.Element('{http://test}a')
+        b = etree.SubElement(root, '{http://test}b')
+        c = etree.SubElement(root, '{http://test}c')
+
+        root.remove(b)
+        self.assertXML(
+            _bytes('<ns0:a xmlns:ns0="http://test"><ns0:c></ns0:c></ns0:a>'),
+            root)
+        self.assertXML(
+            _bytes('<ns0:b xmlns:ns0="http://test"></ns0:b>'),
+            b)
+
+    def test_remove_nonexisting(self):
+        # remove() of an element that is not a child raises ValueError.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        stranger = etree.Element('d')
+        self.assertRaises(
+            ValueError, root.remove, stranger)
+
+    def test_remove_tail(self):
+        # The tail leaves the parent with the removed child and stays on it.
+        etree = self.etree
+
+        root = etree.Element('a')
+        child = etree.SubElement(root, 'b')
+        child.tail = 'b2'
+        root.remove(child)
+        self.assertXML(
+            _bytes('<a></a>'),
+            root)
+        self.assertEqual('b2', child.tail)
+
+    def _test_getchildren(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        # NOTE(review): the '_' prefix presumably disables this test - confirm.
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        d = SubElement(b, 'd')
+        e = SubElement(c, 'e')
+        self.assertXML(
+            _bytes('<a><b><d></d></b><c><e></e></c></a>'),
+            a)
+        self.assertEqual(
+            [b, c],
+            a.getchildren())  # direct children only, in document order
+        self.assertEqual(
+            [d],
+            b.getchildren())
+        self.assertEqual(
+            [],
+            d.getchildren())  # a leaf has no children
+
+    def test_makeelement(self):
+        # makeelement() builds a new element with the given tag and attributes.
+
+        factory = self.etree.Element('a')
+        made = factory.makeelement('c', {'hoi':'dag'})
+        self.assertXML(
+            _bytes('<c hoi="dag"></c>'),
+            made)
+
+    required_versions_ET['test_iter'] = (1,3)
+    def test_iter(self):
+        # iter() walks the subtree in document order, starting with itself.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+
+        self.assertEqual(
+            [root, b, d, c, e],
+            list(root.iter()))
+        self.assertEqual(
+            [d],
+            list(d.iter()))
+
+    def test_getiterator(self):
+        # getiterator() walks the subtree in document order, self included.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+
+        self.assertEqual(
+            [root, b, d, c, e],
+            list(root.getiterator()))
+        self.assertEqual(
+            [d],
+            list(d.getiterator()))
+
+    def test_getiterator_empty(self):
+        # A tag filter that matches nothing yields an empty iteration.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+
+        self.assertEqual(
+            [],
+            list(root.getiterator('none')))
+        self.assertEqual(
+            [],
+            list(e.getiterator('none')))
+        self.assertEqual(
+            [e],
+            list(e.getiterator()))
+
+    def test_getiterator_filter(self):
+        # A tag filter matches the start element and descendants alike.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+
+        self.assertEqual(
+            [root],
+            list(root.getiterator('a')))
+        nested = etree.SubElement(e, 'a')
+        self.assertEqual(
+            [root, nested],
+            list(root.getiterator('a')))
+        self.assertEqual(
+            [nested],
+            list(c.getiterator('a')))
+
+    def test_getiterator_filter_all(self):
+        # The '*' filter selects every element of the subtree.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+
+        self.assertEqual(
+            [root, b, d, c, e],
+            list(root.getiterator('*')))
+
+    def test_getiterator_filter_comment(self):
+        # Passing the Comment factory as the filter selects comment nodes
+        # only, in document order.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        inner = etree.Comment("TEST-b")
+        b.append(inner)
+
+        self.assertEqual(
+            [inner],
+            list(root.getiterator(etree.Comment)))
+
+        outer = etree.Comment("TEST-a")
+        root.append(outer)
+
+        self.assertEqual(
+            [inner, outer],
+            list(root.getiterator(etree.Comment)))
+
+        self.assertEqual(
+            [inner],
+            list(b.getiterator(etree.Comment)))
+
+    def test_getiterator_filter_pi(self):
+        # Passing the ProcessingInstruction factory as the filter selects
+        # processing instructions only, in document order.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        inner = etree.ProcessingInstruction("TEST-b")
+        b.append(inner)
+
+        self.assertEqual(
+            [inner],
+            list(root.getiterator(etree.ProcessingInstruction)))
+
+        outer = etree.ProcessingInstruction("TEST-a")
+        root.append(outer)
+
+        self.assertEqual(
+            [inner, outer],
+            list(root.getiterator(etree.ProcessingInstruction)))
+
+        self.assertEqual(
+            [inner],
+            list(b.getiterator(etree.ProcessingInstruction)))
+
+    def test_getiterator_with_text(self):
+        # Text and tail content on every node must not disturb traversal.
+        etree = self.etree
+
+        a = etree.Element('a')
+        a.text = 'a'
+        b = etree.SubElement(a, 'b')
+        b.text = 'b'
+        b.tail = 'b1'
+        c = etree.SubElement(a, 'c')
+        c.text = 'c'
+        c.tail = 'c1'
+        d = etree.SubElement(b, 'd')
+        d.text = 'd'  # set on d itself so that every node carries text
+        d.tail = 'd1'
+        e = etree.SubElement(c, 'e')
+        e.text = 'e'
+        e.tail = 'e1'
+
+        self.assertEqual(
+            [a, b, d, c, e],
+            list(a.getiterator()))
+        #self.assertEqual(
+        #    [d],
+        #    list(d.getiterator()))
+
+    def test_getiterator_filter_with_text(self):
+        # Tag filtering must work when every node carries text and tail.
+        etree = self.etree
+
+        a = etree.Element('a')
+        a.text = 'a'
+        b = etree.SubElement(a, 'b')
+        b.text = 'b'
+        b.tail = 'b1'
+        c = etree.SubElement(a, 'c')
+        c.text = 'c'
+        c.tail = 'c1'
+        d = etree.SubElement(b, 'd')
+        d.text = 'd'  # set on d itself so that every node carries text
+        d.tail = 'd1'
+        e = etree.SubElement(c, 'e')
+        e.text = 'e'
+        e.tail = 'e1'
+
+        self.assertEqual(
+            [a],
+            list(a.getiterator('a')))
+        a2 = etree.SubElement(e, 'a')
+        self.assertEqual(
+            [a, a2],
+            list(a.getiterator('a')))
+        self.assertEqual(
+            [a2],
+            list(e.getiterator('a')))
+
+    def test_getslice(self):
+        # Slicing an element returns its children with list-like clamping.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+
+        self.assertEqual(
+            [b, c],
+            root[0:2])
+        self.assertEqual(
+            [b, c, d],
+            root[:])
+        self.assertEqual(
+            [b, c, d],
+            root[:10])
+        self.assertEqual(
+            [b],
+            root[0:1])
+        self.assertEqual(
+            [],
+            root[10:12])
+
+    def test_getslice_negative(self):
+        # Negative slice bounds count from the end of the child list.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+
+        self.assertEqual(
+            [d],
+            root[-1:])
+        self.assertEqual(
+            [c, d],
+            root[-2:])
+        self.assertEqual(
+            [c],
+            root[-2:-1])
+        self.assertEqual(
+            [b, c],
+            root[-3:-1])
+        self.assertEqual(
+            [b, c],
+            root[-3:2])
+
+    def test_getslice_step(self):
+        # Extended slices with positive and negative steps select children.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+        e = etree.SubElement(root, 'e')
+
+        self.assertEqual(
+            [e,d,c,b],
+            root[::-1])
+        self.assertEqual(
+            [b,d],
+            root[::2])
+        self.assertEqual(
+            [e,c],
+            root[::-2])
+        self.assertEqual(
+            [d,c],
+            root[-2:0:-1])
+        self.assertEqual(
+            [e],
+            root[:1:-2])
+
+    def test_getslice_text(self):
+        # Text and tail content between children does not show up in slices.
+
+        source = BytesIO('<a><b>B</b>B1<c>C</c>C1</a>')
+        tree = self.etree.ElementTree(file=source)
+        root = tree.getroot()
+        b = root[0]
+        c = root[1]
+        self.assertEqual(
+            [b, c],
+            root[:])
+        self.assertEqual(
+            [b],
+            root[0:1])
+        self.assertEqual(
+            [c],
+            root[1:])
+
+    def test_comment_getitem_getslice(self):
+        # A comment child occupies an index like any element: it appears in
+        # slices, can be fetched by index and can be replaced by assignment.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        note = etree.Comment('foo')
+        root.append(note)
+        c = etree.SubElement(root, 'c')
+        self.assertEqual(
+            [b, note, c],
+            root[:])
+        self.assertEqual(
+            note,
+            root[1])
+        root[1] = new = etree.Element('new')
+        self.assertEqual(
+            new,
+            root[1])
+        self.assertXML(
+            _bytes('<a><b></b><new></new><c></c></a>'),
+            root)
+        
+    def test_delslice(self):
+        # Deleting a slice removes exactly the children it covers.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+        e = etree.SubElement(root, 'e')
+
+        del root[1:3]
+        self.assertEqual(
+            [b, e],
+            list(root))
+
+    def test_delslice_negative1(self):
+        # A negative stop bound in a deleted slice counts from the end.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+        e = etree.SubElement(root, 'e')
+
+        del root[1:-1]
+        self.assertEqual(
+            [b, e],
+            list(root))
+
+    def test_delslice_negative2(self):
+        # Both bounds of a deleted slice may be negative.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+        e = etree.SubElement(root, 'e')
+
+        del root[-3:-1]
+        self.assertEqual(
+            [b, e],
+            list(root))
+
+    def test_delslice_step(self):
+        # Deleting an extended slice removes every second child from index 1.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+        e = etree.SubElement(root, 'e')
+
+        del root[1::2]
+        self.assertEqual(
+            [b, d],
+            list(root))
+
+    def test_delslice_step_negative(self):
+        # Deleting the full reversed slice removes every child.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+        e = etree.SubElement(root, 'e')
+
+        del root[::-1]
+        self.assertEqual(
+            [],
+            list(root))
+
+    def test_delslice_step_negative2(self):
+        # A step of -2 deletes every second child counted from the end.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+        e = etree.SubElement(root, 'e')
+
+        del root[::-2]
+        self.assertEqual(
+            [b, d],
+            list(root))
+
+    def test_delslice_child_tail(self):
+        # Deleting a slice of parsed children takes their tail text along.
+        source = BytesIO('<a><b></b>B2<c></c>C2<d></d>D2<e></e>E2</a>')
+        tree = self.etree.ElementTree(file=source)
+        root = tree.getroot()
+        del root[1:3]
+        self.assertXML(
+            _bytes('<a><b></b>B2<e></e>E2</a>'),
+            root)
+
+    def test_delslice_tail(self):
+        # Children removed by a full slice deletion keep their tail text.
+        root = self.etree.XML(_bytes('<a><b></b>B2<c></c>C2</a>'))
+        first, second = root
+
+        del root[:]
+
+        self.assertEqual("B2", first.tail)
+        self.assertEqual("C2", second.tail)
+
+    def test_delslice_memory(self):
+        # this could trigger a crash: only the grandchild stays referenced
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(b, 'c')
+        del b # no more reference to b
+        del a[:]  # detaches <b>, which no Python name refers to any more
+        self.assertEqual('c', c.tag)  # <c> must still be usable afterwards
+        
+    def test_setslice(self):
+        # Replacing a one-child slice with three elements grows the list.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+
+        e = etree.Element('e')
+        f = etree.Element('f')
+        g = etree.Element('g')
+
+        replacement = [e, f, g]
+        root[1:2] = replacement
+        self.assertEqual(
+            [b, e, f, g, d],
+            list(root))
+
+    def test_setslice_all(self):
+        # Assigning to the full slice replaces every existing child.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+
+        e = etree.Element('e')
+        f = etree.Element('f')
+        g = etree.Element('g')
+
+        replacement = [e, f, g]
+        root[:] = replacement
+        self.assertEqual(
+            [e, f, g],
+            list(root))
+
+    def test_setslice_all_empty(self):
+        # Full-slice assignment on a childless element just adds the items.
+        etree = self.etree
+
+        root = etree.Element('a')
+
+        e = etree.Element('e')
+        f = etree.Element('f')
+        g = etree.Element('g')
+
+        replacement = [e, f, g]
+        root[:] = replacement
+        self.assertEqual(
+            [e, f, g],
+            list(root))
+
+    def test_setslice_all_replace(self):
+        # Reassigning the element's own children in the same order is a no-op.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+
+        same_children = [b, c, d]
+        root[:] = same_children
+        self.assertEqual(
+            [b, c, d],
+            list(root))
+        
+    def test_setslice_all_replace_reversed(self):
+        # Reassigning the element's own children reversed reorders them.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+
+        reordered = [d, c, b]
+        root[:] = reordered
+        self.assertEqual(
+            [d, c, b],
+            list(root))
+
+    def test_setslice_all_replace_reversed_ns1(self):
+        # Reordering children keeps tags and namespaced attribute names.
+        etree = self.etree
+
+        root = etree.Element('{ns}a')
+        b = etree.SubElement(root, '{ns}b', {'{ns1}a1': 'test'})
+        c = etree.SubElement(root, '{ns}c', {'{ns2}a2': 'test'})
+        d = etree.SubElement(root, '{ns}d', {'{ns3}a3': 'test'})
+
+        reordered = [d, c, b]
+        root[:] = reordered
+        self.assertEqual(
+            [d, c, b],
+            list(root))
+        self.assertEqual(
+            ['{ns}d', '{ns}c', '{ns}b'],
+            [ node.tag for node in root ])
+
+        self.assertEqual(
+            [['{ns3}a3'], ['{ns2}a2'], ['{ns1}a1']],
+            [ list(node.attrib.keys()) for node in root ])
+
+    def test_setslice_all_replace_reversed_ns2(self):
+        # Reordering children keeps namespaced tags and attribute names.
+        etree = self.etree
+
+        root = etree.Element('{ns}a')
+        b = etree.SubElement(root, '{ns1}b', {'{ns}a1': 'test'})
+        c = etree.SubElement(root, '{ns2}c', {'{ns}a2': 'test'})
+        d = etree.SubElement(root, '{ns3}d', {'{ns}a3': 'test'})
+
+        reordered = [d, c, b]
+        root[:] = reordered
+        self.assertEqual(
+            [d, c, b],
+            list(root))
+        self.assertEqual(
+            ['{ns3}d', '{ns2}c', '{ns1}b'],
+            [ node.tag for node in root ])
+
+        self.assertEqual(
+            [['{ns}a3'], ['{ns}a2'], ['{ns}a1']],
+            [ list(node.attrib.keys()) for node in root ])
+
+    def test_setslice_beyond_end(self):
+        # Slice bounds clamp as on a list: a start past the end appends and
+        # an empty slice at 0 prepends.  Named apart from test_setslice_end,
+        # which a later definition in this class would otherwise shadow.
+        etree = self.etree
+
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+
+        e = etree.Element('e')
+        f = etree.Element('f')
+        g = etree.Element('g')
+        h = etree.Element('h')
+
+        a[99:] = [e, f]
+        self.assertEqual(
+            [b, c, e, f],
+            list(a))
+
+        a[:0] = [g, h]
+        self.assertEqual(
+            [g, h, b, c, e, f],
+            list(a))
+
+    def test_setslice_single(self):
+        # One-for-one slice replacement, first at the front, then at the end.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+
+        e = etree.Element('e')
+        f = etree.Element('f')
+
+        replacement = [e]
+        root[0:1] = replacement
+        self.assertEqual(
+            [e, c],
+            list(root))
+
+        replacement = [f]
+        root[1:2] = replacement
+        self.assertEqual(
+            [e, f],
+            list(root))
+
+    def test_setslice_tail(self):
+        # Slice replacement swaps tails along with the elements.
+        etree = self.etree
+        source = BytesIO('<a><b></b>B2<c></c>C2<d></d>D2<e></e>E2</a>')
+        tree = etree.ElementTree(file=source)
+        root = tree.getroot()
+        x = etree.Element('x')
+        y = etree.Element('y')
+        z = etree.Element('z')
+        x.tail = 'X2'
+        y.tail = 'Y2'
+        z.tail = 'Z2'
+        root[1:3] = [x, y, z]
+        self.assertXML(
+            _bytes('<a><b></b>B2<x></x>X2<y></y>Y2<z></z>Z2<e></e>E2</a>'),
+            root)
+
+    def test_setslice_negative(self):
+        # A negative stop bound selects the middle child for replacement.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+
+        x = etree.Element('x')
+        y = etree.Element('y')
+
+        root[1:-1] = [x, y]
+        self.assertEqual(
+            [b, x, y, d],
+            list(root))
+
+    def test_setslice_negative2(self):
+        # An empty slice (1:-2 on three children) inserts without removing.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+
+        x = etree.Element('x')
+        y = etree.Element('y')
+
+        root[1:-2] = [x, y]
+        self.assertEqual(
+            [b, x, y, c, d],
+            list(root))
+
+    def test_setslice_end(self):
+        # Assigning to the slice that starts right after the last child appends.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+        d = etree.SubElement(root, 'd')
+
+        e = etree.Element('e')
+        f = etree.Element('f')
+        g = etree.Element('g')
+
+        appended = [e, f, g]
+        root[3:] = appended
+        self.assertEqual(
+            [b, c, d, e, f, g],
+            list(root))
+        
+    def test_setslice_empty(self):
+        # Full-slice assignment on a childless element simply adds the
+        # given elements as its children, in order.
+        make_element = self.etree.Element
+
+        parent = make_element('a')
+        children = [make_element('b'), make_element('c')]
+
+        parent[:] = children
+
+        self.assertEqual(children,
+                         list(parent))
+
+    def test_tail_elementtree_root(self):
+        # Wrapping an element in an ElementTree must not discard the
+        # tail text previously set on that element.
+        etree = self.etree
+
+        root = etree.Element('a')
+        root.tail = 'A2'
+        tree = etree.ElementTree(element=root)
+        self.assertEqual('A2', root.tail)
+
+    def test_elementtree_getiterator(self):
+        # ElementTree.getiterator() walks the whole tree in document
+        # order, starting with the root element itself.
+        etree = self.etree
+
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+        tree = etree.ElementTree(element=a)
+
+        document_order = [a, b, d, c, e]
+        visited = list(tree.getiterator())
+        self.assertEqual(document_order, visited)
+
+    def test_elementtree_getiterator_filter(self):
+        # getiterator(tag) yields only the elements with a matching tag,
+        # including ones added to the tree after it was wrapped.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+        tree = etree.ElementTree(element=a)
+
+        matches = list(tree.getiterator('a'))
+        self.assertEqual([a], matches)
+
+        # a second, deeply nested <a> must be found as well
+        nested_a = etree.SubElement(e, 'a')
+        matches = list(tree.getiterator('a'))
+        self.assertEqual([a, nested_a], matches)
+
+    def test_ns_access(self):
+        # Parsed prefixed names are exposed in '{uri}local' notation.
+        ns = 'http://xml.infrae.com/1'
+        source = BytesIO('<x:a xmlns:x="%s"><x:b></x:b></x:a>' % ns)
+        root = self.etree.ElementTree(file=source).getroot()
+
+        expected_root_tag = '{%s}a' % ns
+        self.assertEqual(expected_root_tag, root.tag)
+        expected_child_tag = '{%s}b' % ns
+        self.assertEqual(expected_child_tag, root[0].tag)
+
+    def test_ns_access2(self):
+        # Same local name under two prefixes: each child must report the
+        # namespace URI its own prefix is bound to.
+        ns = 'http://xml.infrae.com/1'
+        ns2 = 'http://xml.infrae.com/2'
+        markup = '<x:a xmlns:x="%s" xmlns:y="%s"><x:b></x:b><y:b></y:b></x:a>'
+        tree = self.etree.ElementTree(file=BytesIO(markup % (ns, ns2)))
+        root = tree.getroot()
+
+        # children are checked in document order: x:b first, then y:b
+        self.assertEqual('{%s}a' % ns, root.tag)
+        self.assertEqual('{%s}b' % ns, root[0].tag)
+        self.assertEqual('{%s}b' % ns2, root[1].tag)
+
+    def test_ns_setting(self):
+        # Tags given in '{uri}local' notation at creation time must be
+        # reported back unchanged, including on repeated access.
+        etree = self.etree
+        ns = 'http://xml.infrae.com/1'
+        ns2 = 'http://xml.infrae.com/2'
+
+        tag_a = '{%s}a' % ns
+        tag_b = '{%s}b' % ns2
+        tag_c = '{%s}c' % ns
+
+        a = etree.Element(tag_a)
+        b = etree.SubElement(a, tag_b)
+        c = etree.SubElement(a, tag_c)
+
+        # every tag is checked twice in a row
+        for _ in range(2):
+            self.assertEqual(tag_a, a.tag)
+            self.assertEqual(tag_b, b.tag)
+            self.assertEqual(tag_c, c.tag)
+
+    def test_ns_tag_parse(self):
+        # A default namespace applies to unprefixed element names, while
+        # prefixed names resolve through their own declaration.
+        parse_tree = self.etree.ElementTree
+        default_ns = 'http://xml.infrae.com/1'
+        prefixed_ns = 'http://xml.infrae.com/2'
+        markup = '<a xmlns="%s" xmlns:x="%s"><x:b></x:b><b></b></a>'
+
+        source = BytesIO(markup % (default_ns, prefixed_ns))
+        root = parse_tree(file=source).getroot()
+
+        # root: default namespace
+        self.assertEqual('{%s}a' % default_ns, root.tag)
+        # first child <x:b>: prefixed namespace
+        self.assertEqual('{%s}b' % prefixed_ns, root[0].tag)
+        # second child <b>: default namespace again
+        self.assertEqual('{%s}b' % default_ns, root[1].tag)
+
+    def test_ns_attr(self):
+        # Namespaced attributes can be set and read back by '{uri}name'.
+        ns = 'http://xml.infrae.com/1'
+        ns2 = 'http://xml.infrae.com/2'
+        foo_key = '{%s}foo' % ns
+        bar_key = '{%s}bar' % ns2
+
+        elem = self.etree.Element('a')
+        elem.set(foo_key, 'Foo')
+        elem.set(bar_key, 'Bar')
+        self.assertEqual('Foo', elem.get(foo_key))
+        self.assertEqual('Bar', elem.get(bar_key))
+
+        # The generated prefixes may be handed out in either order, so
+        # accept both ns0/ns1 assignments in the serialised form.
+        first = '<a xmlns:ns0="%s" xmlns:ns1="%s" ns0:foo="Foo" ns1:bar="Bar"></a>'
+        second = '<a xmlns:ns0="%s" xmlns:ns1="%s" ns1:foo="Foo" ns0:bar="Bar"></a>'
+        try:
+            self.assertXML(_bytes(first % (ns, ns2)), elem)
+        except AssertionError:
+            self.assertXML(_bytes(second % (ns2, ns)), elem)
+
+    def test_ns_move(self):
+        Element = self.etree.Element
+        one = self.etree.fromstring(
+            _bytes('<foo><bar xmlns:ns="http://a.b.c"><ns:baz/></bar></foo>'))
+        baz = one[0][0]
+        # move <ns:baz> out of its source tree into a freshly created one
+        two = Element('root')
+        two.append(baz)
+        # Dropping every reference to the source tree used to crash or fail,
+        # because the namespace was not moved along with the element.
+        del one, baz
+        self.assertEqual('{http://a.b.c}baz', two[0].tag)
+
+    def test_ns_decl_tostring(self):
+        # Serialising <ns:baz> alone must emit, exactly once, the xmlns:ns
+        # declaration that the source document makes on its parent <bar>.
+        markup = _bytes('<foo><bar xmlns:ns="http://a.b.c"><ns:baz/></bar></foo>')
+        root = self.etree.XML(markup)
+        baz = root[0][0]
+        serialised = self.etree.tostring(baz)
+        xmlns_re = _bytes("xmlns(?::[a-z0-9]+)?=[\"']([^\"']+)[\"']")
+        self.assertEqual([_bytes("http://a.b.c")], re.findall(xmlns_re, serialised))
+
+    def test_ns_decl_tostring_default(self):
+        # Serialising <baz> alone must emit, exactly once, the default
+        # namespace declaration made on its parent <bar>.
+        markup = _bytes('<foo><bar xmlns="http://a.b.c"><baz/></bar></foo>')
+        root = self.etree.XML(markup)
+        baz = root[0][0]
+        serialised = self.etree.tostring(baz)
+        xmlns_re = _bytes("xmlns(?::[a-z0-9]+)?=[\"']([^\"']+)[\"']")
+        self.assertEqual([_bytes("http://a.b.c")], re.findall(xmlns_re, serialised))
+        
+    def test_ns_decl_tostring_root(self):
+        # Serialising <ns:baz> alone must emit, exactly once, the xmlns:ns
+        # declaration that the source document makes on the root <foo>.
+        markup = _bytes('<foo xmlns:ns="http://a.b.c"><bar><ns:baz/></bar></foo>')
+        root = self.etree.XML(markup)
+        baz = root[0][0]
+        serialised = self.etree.tostring(baz)
+
+        xmlns_re = _bytes("xmlns(?::[a-z0-9]+)?=[\"']([^\"']+)[\"']")
+        self.assertEqual([_bytes("http://a.b.c")], re.findall(xmlns_re, serialised))
+        
+    def test_ns_decl_tostring_element(self):
+        # For a tree built through the API, serialising the inner element
+        # must declare its namespace exactly once.
+        etree = self.etree
+
+        root = etree.Element("foo")
+        bar = etree.SubElement(root, "{http://a.b.c}bar")
+        baz = etree.SubElement(bar, "{http://a.b.c}baz")
+        serialised = etree.tostring(baz)
+
+        xmlns_re = _bytes("xmlns(?::[a-z0-9]+)?=[\"']([^\"']+)[\"']")
+        self.assertEqual([_bytes("http://a.b.c")], re.findall(xmlns_re, serialised))
+
+    def test_attribute_xmlns_move(self):
+        # An xml:id attribute must survive, unchanged and unduplicated,
+        # when its element is appended to another element.
+        make_element = self.etree.Element
+        xml_id = "{http://www.w3.org/XML/1998/namespace}id"
+
+        root = make_element('element')
+        subelement = make_element('subelement', {xml_id: "foo"})
+
+        # state before the move
+        self.assertEqual(1, len(subelement.attrib))
+        self.assertEqual("foo", subelement.get(xml_id))
+
+        root.append(subelement)
+
+        # state after the move
+        self.assertEqual(1, len(subelement.attrib))
+        expected_items = list({xml_id: "foo"}.items())
+        self.assertEqual(expected_items, list(subelement.attrib.items()))
+        self.assertEqual("foo", subelement.get(xml_id))
+
+    def test_namespaces_after_serialize(self):
+        # A subtree serialised on its own must re-parse with the same
+        # namespace-qualified tag.
+        etree = self.etree
+        ns_href = "http://a.b.c"
+        markup = '<foo><bar xmlns:ns="%s"><ns:baz/></bar></foo>' % ns_href
+
+        one = etree.parse(BytesIO(markup))
+        baz = one.getroot()[0][0]
+        reparsed = etree.parse(BytesIO(etree.tostring(baz))).getroot()
+        self.assertEqual('{%s}baz' % ns_href, reparsed.tag)
+
+    def test_attribute_namespace_roundtrip(self):
+        # The default namespace and prefix x share one URI.  A namespaced
+        # attribute must still be written with a prefix (':a=') so that
+        # it re-parses into the same namespace.
+        etree = self.etree
+        ns_href = "http://a.b.c"
+        attr_key = '{%s}a' % ns_href
+        markup = '<root xmlns="%s" xmlns:x="%s"><el x:a="test" /></root>'
+
+        root = etree.fromstring(_bytes(markup % (ns_href, ns_href)))
+        self.assertEqual('test', root[0].get(attr_key))
+
+        xml2 = etree.tostring(root)
+        self.assertTrue(_bytes(':a=') in xml2, xml2)
+        self.assertEqual('test', etree.fromstring(xml2)[0].get(attr_key))
+
+    def test_attribute_namespace_roundtrip_replaced(self):
+        # The default namespace and prefix x share one URI.  After the
+        # attribute value is replaced through the API, the attribute must
+        # still be written with a prefix (':a=') and re-parse correctly.
+        etree = self.etree
+        ns_href = "http://a.b.c"
+        attr_key = '{%s}a' % ns_href
+        markup = '<root xmlns="%s" xmlns:x="%s"><el x:a="test" /></root>'
+
+        root = etree.fromstring(_bytes(markup % (ns_href, ns_href)))
+        self.assertEqual('test', root[0].get(attr_key))
+
+        root[0].set(attr_key, 'TEST')
+
+        xml2 = etree.tostring(root)
+        self.assertTrue(_bytes(':a=') in xml2, xml2)
+        self.assertEqual('TEST', etree.fromstring(xml2)[0].get(attr_key))
+
+    required_versions_ET['test_register_namespace'] = (1,3)
+    def test_register_namespace(self):
+        # ET 1.3+
+        # register_namespace() replaces the generated ns0 prefix with the
+        # registered one for elements serialised afterwards.
+        etree = self.etree
+        prefix = 'TESTPREFIX'
+        namespace = 'http://seriously.unknown/namespace/URI'
+        tag = '{%s}test' % namespace
+
+        generated = '<ns0:test xmlns:ns0="%s"></ns0:test>' % namespace
+        self.assertEqual(_bytes(generated), self._writeElement(etree.Element(tag)))
+
+        etree.register_namespace(prefix, namespace)
+        registered = '<%s:test xmlns:%s="%s"></%s:test>' % (
+            prefix, prefix, namespace, prefix)
+        self.assertEqual(_bytes(registered), self._writeElement(etree.Element(tag)))
+        self.assertRaises(ValueError, etree.register_namespace, 'ns25', namespace)
+
+    def test_tostring(self):
+        # tostring() on the root serialises the whole tree; canonicalize()
+        # is applied before comparing with the expected markup.
+        etree = self.etree
+
+        root = etree.Element('a')
+        b = etree.SubElement(root, 'b')
+        c = etree.SubElement(root, 'c')
+
+        serialised = canonicalize(etree.tostring(root))
+        self.assertEqual(_bytes('<a><b></b><c></c></a>'), serialised)
+
+    def test_tostring_element(self):
+        # tostring() on a child serialises only that child's subtree.
+        etree = self.etree
+
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(c, 'd')
+
+        b_markup = canonicalize(etree.tostring(b))
+        self.assertEqual(_bytes('<b></b>'), b_markup)
+        c_markup = canonicalize(etree.tostring(c))
+        self.assertEqual(_bytes('<c><d></d></c>'), c_markup)
+        
+    def test_tostring_element_tail(self):
+        # The tail text of an element is serialised right after it; both
+        # the '<b/>' and '<b />' spellings of the empty tag are accepted.
+        etree = self.etree
+
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(c, 'd')
+        b.tail = 'Foo'
+
+        serialised = etree.tostring(b)
+        self.assertTrue(serialised in (_bytes('<b/>Foo'), _bytes('<b />Foo')))
+
+    required_versions_ET['test_tostring_method_html'] = (1,3)
+    def test_tostring_method_html(self):
+        # With method="html", the empty <br> element is serialised without
+        # an end tag or a self-closing slash.
+        etree = self.etree
+
+        html = etree.Element('html')
+        body = etree.SubElement(html, 'body')
+        paragraph = etree.SubElement(body, 'p')
+        paragraph.text = "html"
+        line_break = etree.SubElement(paragraph, 'br')
+        line_break.tail = "test"
+        expected = _bytes('<html><body><p>html<br>test</p></body></html>')
+        self.assertEqual(expected, etree.tostring(html, method="html"))
+
+    required_versions_ET['test_tostring_method_text'] = (1,3)
+    def test_tostring_method_text(self):
+        # method="text" concatenates text and tail content in document
+        # order, including the tail of the serialised element itself.
+        etree = self.etree
+
+        root = etree.Element('a')
+        root.text = "A"
+        root.tail = "tail"
+        first = etree.SubElement(root, 'b')
+        first.text = "B"
+        first.tail = "TAIL"
+        second = etree.SubElement(root, 'c')
+        second.text = "C"
+
+        text_only = etree.tostring(root, method="text")
+        self.assertEqual(_bytes('ABTAILCtail'), text_only)
+
+    def test_iterparse(self):
+        # By default only 'end' events are reported, children before their
+        # parent; .root is None before iteration starts.
+        source = BytesIO('<a><b></b><c/></a>')
+
+        context = self.etree.iterparse(source)
+        self.assertEqual(None, context.root)
+
+        events = list(context)
+        root = context.root
+        expected = [('end', root[0]), ('end', root[1]), ('end', root)]
+        self.assertEqual(expected, events)
+
+    def test_iterparse_file(self):
+        # iterparse() is handed the location of test.xml, not an open file
+        context = self.etree.iterparse(fileInTestDir("test.xml"))
+        self.assertEqual(None, context.root)
+
+        events = list(context)
+        root = context.root
+
+        expected = [('end', root[0]), ('end', root)]
+        self.assertEqual(expected, events)
+
+    def test_iterparse_start(self):
+        # With events=('start',) elements are reported as they are opened,
+        # i.e. parents before their children.
+        source = BytesIO('<a><b></b><c/></a>')
+        context = self.etree.iterparse(source, events=('start',))
+        events = list(context)
+        root = context.root
+
+        expected = [('start', root), ('start', root[0]), ('start', root[1])]
+        self.assertEqual(expected, events)
+
+    def test_iterparse_start_end(self):
+        # 'start' and 'end' events nest like the elements they describe.
+        source = BytesIO('<a><b></b><c/></a>')
+        context = self.etree.iterparse(source, events=('start','end'))
+        events = list(context)
+        root = context.root
+        expected = [('start', root)]
+        expected += [('start', root[0]), ('end', root[0])]
+        expected += [('start', root[1]), ('end', root[1])]
+        expected += [('end', root)]
+        self.assertEqual(expected, events)
+
+    def test_iterparse_clear(self):
+        # Clearing every element as soon as its 'end' event arrives must
+        # leave a root without any children.
+        source = BytesIO('<a><b></b><c/></a>')
+        context = self.etree.iterparse(source)
+
+        for _event, finished in context:
+            finished.clear()
+
+        remaining_children = len(context.root)
+        self.assertEqual(0, remaining_children)
+
+    def test_iterparse_large(self):
+        # One 'end' event is expected per <b> child plus one for the root.
+        CHILD_COUNT = 12345
+        children = '<b>test</b>' * CHILD_COUNT
+        source = BytesIO('<a>%s</a>' % children)
+
+        seen = 0
+        for _event, _element in self.etree.iterparse(source):
+            seen += 1
+        self.assertEqual(seen, CHILD_COUNT + 1)
+
+    def test_iterparse_attrib_ns(self):
+        # Attributes set on elements during their 'start' event must still
+        # be there after parsing; namespace events are reported around the
+        # elements that declare a namespace.
+        source = BytesIO('<a xmlns="http://ns1/"><b><c xmlns="http://ns2/"/></b></a>')
+        attr_name = '{http://testns/}bla'
+        requested = ('start','end','start-ns','end-ns')
+
+        seen_events = []
+        context = self.etree.iterparse(source, events=requested)
+        for event, elem in context:
+            seen_events.append(event)
+            # tag every started element except the root
+            if event == 'start' and elem.tag != '{http://ns1/}a':
+                elem.set(attr_name, 'value')
+
+        expected_events = [
+            'start-ns', 'start', 'start', 'start-ns', 'start',
+            'end', 'end-ns', 'end', 'end', 'end-ns']
+        self.assertEqual(expected_events, seen_events)
+
+        # the root was skipped above, its first child was not
+        root = context.root
+        self.assertEqual(None, root.get(attr_name))
+        self.assertEqual('value', root[0].get(attr_name))
+
+    def test_iterparse_getiterator(self):
+        # At its 'end' event an element's complete subtree is available:
+        # <d> has 1 node, <b> 2, <c> 1 and the root <a> all 4.
+        source = BytesIO('<a><b><d/></b><c/></a>')
+
+        subtree_sizes = [
+            len(list(elem.getiterator()))
+            for _event, elem in self.etree.iterparse(source)]
+
+        self.assertEqual([1,2,1,4], subtree_sizes)
+
+    def test_iterparse_move_elements(self):
+        # Moves the children of an iterparse()d root into a new element.
+        # All calls go through self.etree so the library under test is used.
+        etree = self.etree
+        source = BytesIO('<a><b><d/></b><c/></a>')
+        # exhaust the parser; the last element reported is the root
+        for _event, node in etree.iterparse(source):
+            pass
+        root = etree.Element('new_root', {})
+        root[:] = node[:]
+
+        self.assertEqual(['b', 'c'], [el.tag for el in root])
+
+    def test_iterparse_cdata(self):
+        # CDATA content is exposed as plain text and serialised without
+        # the CDATA wrapper.
+        etree = self.etree
+        context = etree.iterparse(BytesIO('<root><![CDATA[test]]></root>'))
+        texts = [elem.text for _event, elem in context]
+
+        self.assertEqual(['test'], texts)
+        self.assertEqual(_bytes('<root>test</root>'), etree.tostring(context.root))
+
+    def test_parse_file(self):
+        # from file: parse() is given the location of test.xml directly
+        path = fileInTestDir('test.xml')
+        root = self.etree.parse(path).getroot()
+
+        expected = _bytes('<a><b></b></a>')
+        self.assertXML(expected, root)
+
+    def test_parse_file_nonexistent(self):
+        # parsing 'notthere.xml' from the test directory must raise IOError
+        self.assertRaises(IOError, self.etree.parse, fileInTestDir('notthere.xml'))
+
+    def test_parse_error_none(self):
+        # None is not an acceptable source for parse()
+        self.assertRaises(TypeError, self.etree.parse, None)
+
+    required_versions_ET['test_parse_error'] = (1,3)
+    def test_parse_error(self):
+        # ET < 1.3 raises ExpatError
+        # (the markup is not well-formed: </c> closes an element never opened)
+        broken = BytesIO('<a><b></c></b></a>')
+        self.assertRaises(SyntaxError, self.etree.parse, broken)
+        broken.close()
+
+    required_versions_ET['test_parse_error_from_file'] = (1,3)
+    def test_parse_error_from_file(self):
+        f = open(fileInTestDir('test_broken.xml'), 'rb')  # from file
+        try:  # the handle is closed even when the assertion fails
+            self.assertRaises(SyntaxError, self.etree.parse, f)
+        finally:
+            f.close()
+
+    def test_parse_file_object(self):
+        # from file object; the handle is released even if parse() raises
+        f = open(fileInTestDir('test.xml'), 'rb')
+        try:
+            tree = self.etree.parse(f)
+        finally:
+            f.close()
+        # the tree is checked only after its source file was closed
+        self.assertXML(_bytes('<a><b></b></a>'), tree.getroot())
+
+    def test_parse_stringio(self):
+        # parse() reads from an in-memory byte stream; the resulting tree
+        # is checked after that stream has been closed.
+        stream = BytesIO('<a><b></b></a>')
+        tree = self.etree.parse(stream)
+        stream.close()
+
+        expected = _bytes('<a><b></b></a>')
+        self.assertXML(expected, tree.getroot())
+
+    def test_parse_cdata(self):
+        # CDATA sections are read as plain text and are not re-emitted as
+        # CDATA when the element is serialised.
+        etree = self.etree
+        root = etree.XML(_bytes('<root><![CDATA[test]]></root>'))
+        self.assertEqual('test', root.text)
+        self.assertEqual(_bytes('<root>test</root>'), etree.tostring(root))
+
+    def test_parse_with_encoding(self):
+        # this can fail in libxml2 <= 2.6.22
+        declared_ascii = '<?xml version="1.0" encoding="ascii"?><html/>'
+        tree = self.etree.parse(BytesIO(declared_ascii))
+        expected = _bytes('<html></html>')
+        self.assertXML(expected, tree.getroot())
+
+    def test_encoding(self):
+        # non-ASCII text must serialise to its UTF-8 byte sequence
+        elem = self.etree.Element('a')
+        text = _str('Søk på nettet')
+        elem.text = text
+
+        expected = _str('<a>Søk på nettet</a>').encode('UTF-8')
+        self.assertXML(expected, elem, 'utf-8')
+
+    def test_encoding_exact(self):
+        # ElementTree.write() with encoding='utf-8' must emit exactly the
+        # UTF-8 encoded markup (line breaks aside).
+        etree = self.etree
+
+        elem = etree.Element('a')
+        elem.text = _str('Søk på nettet')
+
+        out = BytesIO()
+        etree.ElementTree(element=elem).write(out, encoding='utf-8')
+        written = out.getvalue().replace(_bytes('\n'),_bytes(''))
+        self.assertEqual(_str('<a>Søk på nettet</a>').encode('UTF-8'), written)
+
+    def test_parse_file_encoding(self):
+        # from file: test-string.xml is expected to hold the non-ASCII text
+        path = fileInTestDir('test-string.xml')
+        root = self.etree.parse(path).getroot()
+
+        expected = _str('<a>Søk på nettet</a>').encode('UTF-8')
+        self.assertXML(expected, root, 'UTF-8')
+
+    def test_parse_file_object_encoding(self):
+        # from file object; the handle is released even if parse() raises
+        f = open(fileInTestDir('test-string.xml'), 'rb')
+        try:
+            tree = self.etree.parse(f)
+        finally:
+            f.close()
+        expected = _str('<a>Søk på nettet</a>').encode('UTF-8')
+        self.assertXML(expected, tree.getroot(), 'UTF-8')
+
+    def test_encoding_8bit_latin1(self):
+        # Writing with encoding='iso-8859-1' must announce that encoding in
+        # the XML declaration and encode the text accordingly.
+        etree = self.etree
+
+        a = etree.Element('a')
+        a.text = _str('Søk på nettet')
+
+        f = BytesIO()
+        etree.ElementTree(element=a).write(f, encoding='iso-8859-1')
+        result = f.getvalue()
+        self.assertEncodingDeclaration(result, _bytes('iso-8859-1'))
+
+        # compare only what follows the declaration, ignoring line breaks
+        body = result.split(_bytes('?>'), 1)[-1].replace(_bytes('\n'),_bytes(''))
+        self.assertEqual(_str('<a>Søk på nettet</a>').encode('iso-8859-1'), body)
+
+    required_versions_ET['test_parse_encoding_8bit_explicit'] = (1,3)
+    def test_parse_encoding_8bit_explicit(self):
+        # Undeclared Latin-1 input is rejected by the default parser but is
+        # decoded correctly once the parser is told the encoding.
+        etree = self.etree
+        text = _str('Søk på nettet')
+        xml_latin1 = (_str('<a>%s</a>') % text).encode('iso-8859-1')
+
+        # no encoding information at all: the parser must refuse the bytes
+        self.assertRaises(etree.ParseError, etree.parse, BytesIO(xml_latin1))
+
+        # explicit parser encoding: the text round-trips
+        latin1_parser = self.XMLParser(encoding="iso-8859-1")
+        root = etree.parse(BytesIO(xml_latin1), latin1_parser).getroot()
+        self.assertEqual(root.text, text)
+
+    required_versions_ET['test_parse_encoding_8bit_override'] = (1,3)
+    def test_parse_encoding_8bit_override(self):
+        # The parser's explicit encoding must take precedence over a wrong
+        # encoding named in the XML declaration.
+        etree = self.etree
+        text = _str('Søk på nettet')
+        wrong_declaration = _str("<?xml version='1.0' encoding='UTF-8'?>")
+        document = _str('%s<a>%s</a>') % (wrong_declaration, text)
+        xml_latin1 = document.encode('iso-8859-1')
+
+        # trusting the UTF-8 declaration fails on the Latin-1 bytes
+        self.assertRaises(etree.ParseError, etree.parse, BytesIO(xml_latin1))
+
+        # overriding it on the parser decodes the text correctly
+        latin1_parser = self.XMLParser(encoding="iso-8859-1")
+        root = etree.parse(BytesIO(xml_latin1), latin1_parser).getroot()
+        self.assertEqual(root.text, text)
+
+    def _test_wrong_unicode_encoding(self):
+        # raise error on wrong encoding declaration in unicode strings
+        # (the leading underscore keeps unittest's default loader from running it)
+        declaration = _str('<?xml version="1.0" encoding="iso-8859-1"?>')
+        test_utf = declaration + _str('<a>Søk på nettet</a>')
+        self.assertRaises(SyntaxError, self.etree.XML, test_utf)
+
+    def test_encoding_write_default_encoding(self):
+        # Without an explicit encoding, write() emits ASCII and represents
+        # non-ASCII characters as numeric character references.
+        etree = self.etree
+
+        elem = etree.Element('a')
+        elem.text = _str('Søk på nettet')
+
+        out = BytesIO()
+        etree.ElementTree(element=elem).write(out)
+        data = out.getvalue().replace(_bytes('\n'),_bytes(''))
+
+        expected = _str('<a>Søk på nettet</a>').encode('ASCII', 'xmlcharrefreplace')
+        self.assertEqual(expected, data)
+
+    def test_encoding_tostring(self):
+        # tostring(encoding='utf-8') returns the UTF-8 encoded markup
+        etree = self.etree
+
+        elem = etree.Element('a')
+        elem.text = _str('Søk på nettet')
+        expected = _str('<a>Søk på nettet</a>').encode('UTF-8')
+        self.assertEqual(expected, etree.tostring(elem, encoding='utf-8'))
+
+    def test_encoding_tostring_unknown(self):
+        # an unknown encoding name must raise LookupError
+        etree = self.etree
+
+        elem = etree.Element('a')
+        elem.text = _str('Søk på nettet')
+        self.assertRaises(
+            LookupError, etree.tostring, elem, encoding='Invalid Encoding')
+
+    def test_encoding_tostring_sub(self):
+        # encoding a child element serialises that child only
+        etree = self.etree
+
+        parent = etree.Element('a')
+        child = etree.SubElement(parent, 'b')
+        child.text = _str('Søk på nettet')
+
+        expected = _str('<b>Søk på nettet</b>').encode('UTF-8')
+        self.assertEqual(expected, etree.tostring(child, encoding='utf-8'))
+
+    def test_encoding_tostring_sub_tail(self):
+        # the child's tail is included in the output and encoded as well
+        etree = self.etree
+
+        parent = etree.Element('a')
+        child = etree.SubElement(parent, 'b')
+        child.text = _str('Søk på nettet')
+        child.tail = _str('Søk')
+
+        expected = _str('<b>Søk på nettet</b>Søk').encode('UTF-8')
+        self.assertEqual(expected, etree.tostring(child, encoding='utf-8'))
+        
+    def test_encoding_tostring_default_encoding(self):
+        # Without an explicit encoding, tostring() escapes non-ASCII
+        # characters as numeric character references (&#248; and &#229;).
+        etree = self.etree
+
+        elem = etree.Element('a')
+        elem.text = _str('Søk på nettet')
+
+        serialised = etree.tostring(elem)
+
+        expected = _bytes('<a>S&#248;k p&#229; nettet</a>')
+        self.assertEqual(expected, serialised)
+
+    def test_encoding_sub_tostring_default_encoding(self):
+        # Serialising only a child without an explicit encoding must
+        # escape non-ASCII characters as numeric character references.
+        etree = self.etree
+
+        parent = etree.Element('a')
+        child = etree.SubElement(parent, 'b')
+        child.text = _str('Søk på nettet')
+
+        serialised = etree.tostring(child)
+
+        expected = _bytes('<b>S&#248;k p&#229; nettet</b>')
+        self.assertEqual(expected, serialised)
+
+    def test_encoding_8bit_xml(self):
+        # a declared iso-8859-1 encoding must be honoured when parsing bytes
+        utext = _str('Søk på nettet')
+        prologue = _bytes('<?xml version="1.0" encoding="iso-8859-1" ?>')
+        body = (_str('<p>%s</p>') % utext).encode('iso-8859-1')
+        parsed = self.etree.XML(prologue + body)
+        self.assertEqual(utext, parsed.text)
+
+    def test_encoding_utf8_bom(self):
+        # A UTF-8 byte order mark in front of the declaration must be skipped.
+        utext = _str('Søk på nettet')
+        uxml = (_str('<?xml version="1.0" encoding="UTF-8"?>') +
+                _str('<p>%s</p>') % utext)
+        bom = _bytes('\\xEF\\xBB\\xBF').decode("unicode_escape").encode("latin1")
+        tree = self.etree.XML(bom + uxml.encode("utf-8"))  # library under test
+        self.assertEqual(utext, tree.text)
+
+    def test_encoding_8bit_parse_stringio(self):
+        # parse() must honour the iso-8859-1 encoding declared in the stream
+        utext = _str('Søk på nettet')
+        prologue = _bytes('<?xml version="1.0" encoding="iso-8859-1" ?>')
+        body = (_str('<p>%s</p>') % utext).encode('iso-8859-1')
+        root = self.etree.parse(BytesIO(prologue + body)).getroot()
+        self.assertEqual(utext, root.text)
+
+    def test_deepcopy_elementtree(self):
+        # deepcopy() of an ElementTree yields a new tree object with its
+        # own copy of the root element.
+        etree = self.etree
+        root = etree.Element('a')
+        root.text = "Foo"
+        atree = etree.ElementTree(root)
+        btree = copy.deepcopy(atree)
+
+        self.assertEqual("Foo", atree.getroot().text)
+        self.assertEqual("Foo", btree.getroot().text)
+        self.assertFalse(btree is atree)
+        self.assertFalse(btree.getroot() is atree.getroot())
+
+    def test_deepcopy(self):
+        # A deep copy is independent of its source: changing the copy leaves
+        # the source untouched, and the copy outlives the source.
+        original = self.etree.Element('a')
+        original.text = 'Foo'
+
+        duplicate = copy.deepcopy(original)
+        self.assertEqual('Foo', duplicate.text)
+
+        duplicate.text = 'Bar'
+        self.assertEqual('Bar', duplicate.text)
+        self.assertEqual('Foo', original.text)
+
+        del original
+        self.assertEqual('Bar', duplicate.text)
+
+    def test_deepcopy_tail(self):
+        # The tail text is copied along by deepcopy() and is independent
+        # of the source afterwards, even once the source is deleted.
+        original = self.etree.Element('a')
+        original.tail = 'Foo'
+
+        duplicate = copy.deepcopy(original)
+        self.assertEqual('Foo', duplicate.tail)
+
+        duplicate.tail = 'Bar'
+        self.assertEqual('Bar', duplicate.tail)
+        self.assertEqual('Foo', original.tail)
+
+        del original
+        self.assertEqual('Bar', duplicate.tail)
+
+    def test_deepcopy_subelement(self):
+        # Deep-copying a child copies its text and tail; modifying the
+        # copy does not affect the original child.
+        etree = self.etree
+        root = etree.Element('root')
+        original = etree.SubElement(root, 'a')
+        original.text = 'FooText'
+        original.tail = 'FooTail'
+
+        duplicate = copy.deepcopy(original)
+        self.assertEqual('FooText', duplicate.text)
+        self.assertEqual('FooTail', duplicate.tail)
+
+        duplicate.text = 'BarText'
+        duplicate.tail = 'BarTail'
+        self.assertEqual('BarTail', duplicate.tail)
+        self.assertEqual('FooTail', original.tail)
+        self.assertEqual('BarText', duplicate.text)
+        self.assertEqual('FooText', original.text)
+
+        del original
+        self.assertEqual('BarTail', duplicate.tail)
+        self.assertEqual('BarText', duplicate.text)
+
+    def test_deepcopy_namespaces(self):
+        root = self.etree.XML(_bytes('''<doc xmlns="dns" xmlns:t="tns">
+        <parent><node t:foo="bar" /></parent>
+        </doc>'''))
+        # the namespaced attribute must be readable on copies of both the
+        # parent element and the attribute's own element
+        expected = root[0][0].get('{tns}foo')
+        parent_copy = copy.deepcopy(root[0])
+        self.assertEqual(expected, parent_copy[0].get('{tns}foo'))
+        self.assertEqual(expected, copy.deepcopy(root[0][0]).get('{tns}foo'))
+        
+    def test_deepcopy_append(self):
+        # previously caused a crash
+        # (appending to both an element and its deep copy)
+        etree = self.etree
+
+        original = etree.Element('a')
+        duplicate = copy.deepcopy(original)
+        original.append( etree.Element('C') )
+        duplicate.append( etree.Element('X') )
+
+        # spaces are stripped so that '<C />' and '<C/>' compare equal
+        for elem, expected in ((original, '<a><C/></a>'), (duplicate, '<a><X/></a>')):
+            compact = etree.tostring(elem).replace(_bytes(' '), _bytes(''))
+            self.assertEqual(_bytes(expected), compact)
+
+    def test_deepcopy_comment(self):
+        # previously caused a crash
+        # not supported by ET < 1.3!
+        original = self.etree.Comment("ONE")
+        duplicate = copy.deepcopy(original)
+
+        # changing the copy must leave the source comment untouched
+        duplicate.text = "ANOTHER"
+
+        self.assertEqual('ONE',     original.text)
+        self.assertEqual('ANOTHER', duplicate.text)
+
+    def test_shallowcopy(self):
+        # copy.copy() of an element: text assigned to the copy afterwards
+        # must not show up on the source element.
+        original = self.etree.Element('a')
+        original.text = 'Foo'
+
+        duplicate = copy.copy(original)
+        self.assertEqual('Foo', duplicate.text)
+
+        duplicate.text = 'Bar'
+        self.assertEqual('Bar', duplicate.text)
+        self.assertEqual('Foo', original.text)
+        # XXX ElementTree will share nodes, but lxml.etree won't..
+
+    def test_shallowcopy_elementtree(self):
+        # A shallow copy of an ElementTree is a distinct tree object that
+        # still refers to the very same root element.
+        etree = self.etree
+
+        root = etree.Element('a')
+        root.text = 'Foo'
+        atree = etree.ElementTree(root)
+        btree = copy.copy(atree)
+        self.assertFalse(btree is atree)
+        self.assertTrue(btree.getroot() is atree.getroot())
+        self.assertEqual('Foo', atree.getroot().text)
+
+    def _test_element_boolean(self):
+        # deprecated as of ET 1.3/lxml 2.0
+        # An element is truthy only if it has children; text, tail and
+        # attributes alone leave it falsy.
+        etree = self.etree
+        elem = etree.Element('foo')
+        self.assertEqual(False, bool(elem))
+        etree.SubElement(elem, 'bar')
+        self.assertEqual(True, bool(elem))
+
+        with_text, with_tail, with_attr = [etree.Element('foo') for _ in range(3)]
+        with_text.text = 'hey'
+        with_tail.tail = 'bar'
+        with_attr.set('bar', 'Bar')
+        for childless in (with_text, with_tail, with_attr):
+            self.assertEqual(False, bool(childless))
+
+    def test_multiple_elementrees(self):
+        # Several ElementTree wrappers may share elements; creating a new
+        # wrapper must not change what the earlier ones serialise to.
+        etree = self.etree
+        whole = _bytes('<a><b/></a>')
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        t = etree.ElementTree(a)
+        self.assertEqual(self._rootstring(t), whole)
+        t1 = etree.ElementTree(a)
+        for tree in (t1, t):
+            self.assertEqual(self._rootstring(tree), whole)
+
+        t2 = etree.ElementTree(b)
+        self.assertEqual(self._rootstring(t2), _bytes('<b/>'))
+        for tree in (t1, t):
+            self.assertEqual(self._rootstring(tree), whole)
+
+    def test_qname(self):
+        # a QName object is accepted wherever a tag name is expected
+        qname = self.etree.QName('myns', 'a')
+        parent = self.etree.Element(qname)
+        child = self.etree.SubElement(parent, qname)
+        for elem in (parent, child):
+            self.assertEqual(elem.tag, "{myns}a")
+
+    def test_qname_cmp(self):
+        etree = self.etree
+        qname1 = etree.QName('myns', 'a')
+        qname2 = etree.QName('myns', 'a')
+        self.assertEqual(qname1, "{myns}a")
+        self.assertEqual("{myns}a", qname2)
+        self.assertEqual(qname1, qname1)
+        self.assertEqual(qname1, qname2)
+
+    def test_qname_attribute_getset(self):
+        etree = self.etree
+        qname = etree.QName('myns', 'a')
+
+        a = etree.Element(qname)
+        a.set(qname, "value")
+
+        self.assertEqual(a.get(qname), "value")
+        self.assertEqual(a.get("{myns}a"), "value")
+
+    def test_qname_attrib(self):
+        etree = self.etree
+        qname = etree.QName('myns', 'a')
+
+        a = etree.Element(qname)
+        a.attrib[qname] = "value"
+
+        self.assertEqual(a.attrib[qname], "value")
+        self.assertEqual(a.attrib.get(qname), "value")
+
+        self.assertEqual(a.attrib["{myns}a"], "value")
+        self.assertEqual(a.attrib.get("{myns}a"), "value")
+
+    def test_qname_attribute_resolve(self):
+        etree = self.etree
+        qname = etree.QName('http://myns', 'a')
+        a = etree.Element(qname)
+        a.set(qname, qname)
+
+        self.assertXML(
+            _bytes('<ns0:a xmlns:ns0="http://myns" ns0:a="ns0:a"></ns0:a>'),
+            a)
+
+    def test_qname_attribute_resolve_new(self):
+        etree = self.etree
+        qname = etree.QName('http://myns', 'a')
+        a = etree.Element('a')
+        a.set('a', qname)
+
+        self.assertXML(
+            _bytes('<a xmlns:ns0="http://myns" a="ns0:a"></a>'),
+            a)
+
+    def test_qname_attrib_resolve(self):
+        etree = self.etree
+        qname = etree.QName('http://myns', 'a')
+        a = etree.Element(qname)
+        a.attrib[qname] = qname
+
+        self.assertXML(
+            _bytes('<ns0:a xmlns:ns0="http://myns" ns0:a="ns0:a"></ns0:a>'),
+            a)
+
+    def test_parser_version(self):
+        etree = self.etree
+        parser = etree.XMLParser()
+        if hasattr(parser, "version"):
+            # ElementTree 1.3+, cET
+            self.assertTrue(re.match("[^ ]+ [0-9.]+", parser.version))
+
+    # feed parser interface
+
+    def test_feed_parser_bytes(self):
+        parser = self.XMLParser()
+
+        parser.feed(_bytes('<?xml version='))
+        parser.feed(_bytes('"1.0"?><ro'))
+        parser.feed(_bytes('ot><'))
+        parser.feed(_bytes('a test="works"/'))
+        parser.feed(_bytes('></root'))
+        parser.feed(_bytes('>'))
+
+        root = parser.close()
+
+        self.assertEqual(root.tag, "root")
+        self.assertEqual(root[0].tag, "a")
+        self.assertEqual(root[0].get("test"), "works")
+
+    def test_feed_parser_unicode(self):
+        parser = self.XMLParser()
+
+        parser.feed(_str('<ro'))
+        parser.feed(_str('ot><'))
+        parser.feed(_str('a test="works"/'))
+        parser.feed(_str('></root'))
+        parser.feed(_str('>'))
+
+        root = parser.close()
+
+        self.assertEqual(root.tag, "root")
+        self.assertEqual(root[0].tag, "a")
+        self.assertEqual(root[0].get("test"), "works")
+
+    required_versions_ET['test_feed_parser_error_close_empty'] = (1,3)
+    def test_feed_parser_error_close_empty(self):
+        ParseError = self.etree.ParseError
+        parser = self.XMLParser()
+        self.assertRaises(ParseError, parser.close)
+
+    required_versions_ET['test_feed_parser_error_close_incomplete'] = (1,3)
+    def test_feed_parser_error_close_incomplete(self):
+        ParseError = self.etree.ParseError
+        parser = self.XMLParser()
+
+        parser.feed('<?xml version=')
+        parser.feed('"1.0"?><ro')
+
+        self.assertRaises(ParseError, parser.close)
+
+    required_versions_ET['test_feed_parser_error_broken'] = (1,3)
+    def test_feed_parser_error_broken(self):
+        ParseError = self.etree.ParseError
+        parser = self.XMLParser()
+
+        parser.feed('<?xml version=')
+        parser.feed('"1.0"?><ro')
+        try:
+            parser.feed('<><><><><><><')
+        except ParseError:
+            # can raise, but not required before close()
+            pass
+
+        self.assertRaises(ParseError, parser.close)
+
+    required_versions_ET['test_feed_parser_error_position'] = (1,3)
+    def test_feed_parser_error_position(self):
+        parser = self.XMLParser()
+        try:
+            parser.close()  # no input was fed, so closing has to fail
+        except self.etree.ParseError:
+            e = sys.exc_info()[1]
+            self.assertTrue(e.code not in (None, 0))
+            self.assertTrue(isinstance(e.position, tuple))
+            self.assertTrue(e.position >= (0, 0))
+        else:
+            self.fail("ParseError not raised by close() on empty parser")
+
+    # parser target interface
+
+    required_versions_ET['test_parser_target_property'] = (1,3)
+    def test_parser_target_property(self):
+        class Target(object):
+            pass
+
+        target = Target()
+        parser = self.XMLParser(target=target)
+
+        self.assertEqual(target, parser.target)
+
+    def test_parser_target_tag(self):
+        assertEqual = self.assertEqual
+        assertFalse  = self.assertFalse
+
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start")
+                assertFalse(attrib)
+                assertEqual("TAG", tag)
+            def end(self, tag):
+                events.append("end")
+                assertEqual("TAG", tag)
+            def close(self):
+                return "DONE"
+
+        parser = self.XMLParser(target=Target())
+
+        parser.feed("<TAG/>")
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual(["start", "end"], events)
+
+    def test_parser_target_error_in_start(self):
+        assertEqual = self.assertEqual
+
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start")
+                assertEqual("TAG", tag)
+                raise ValueError("TEST")
+            def end(self, tag):
+                events.append("end")
+                assertEqual("TAG", tag)
+            def close(self):
+                return "DONE"
+
+        parser = self.XMLParser(target=Target())
+
+        try:
+            parser.feed("<TAG/>")
+        except ValueError:
+            self.assertTrue('TEST' in str(sys.exc_info()[1]))
+        else:
+            self.assertTrue(False)
+        if 'lxml' in self.etree.__name__:
+            self.assertEqual(["start"], events)
+        else:
+            # cElementTree calls end() as well
+            self.assertTrue("start" in events)
+
+    def test_parser_target_error_in_end(self):
+        assertEqual = self.assertEqual
+
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start")
+                assertEqual("TAG", tag)
+            def end(self, tag):
+                events.append("end")
+                assertEqual("TAG", tag)
+                raise ValueError("TEST")
+            def close(self):
+                return "DONE"
+
+        parser = self.XMLParser(target=Target())
+
+        try:
+            parser.feed("<TAG/>")
+        except ValueError:
+            self.assertTrue('TEST' in str(sys.exc_info()[1]))
+        else:
+            self.assertTrue(False)
+        self.assertEqual(["start", "end"], events)
+
+    def test_parser_target_error_in_close(self):
+        assertEqual = self.assertEqual
+
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start")
+                assertEqual("TAG", tag)
+            def end(self, tag):
+                events.append("end")
+                assertEqual("TAG", tag)
+            def close(self):
+                raise ValueError("TEST")
+
+        parser = self.XMLParser(target=Target())
+
+        try:
+            parser.feed("<TAG/>")
+            parser.close()
+        except ValueError:
+            self.assertTrue('TEST' in str(sys.exc_info()[1]))
+        else:
+            self.assertTrue(False)
+        self.assertEqual(["start", "end"], events)
+
+    def test_parser_target_error_in_start_and_close(self):
+        assertEqual = self.assertEqual
+
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start")
+                assertEqual("TAG", tag)
+                raise IndexError("TEST-IE")
+            def end(self, tag):
+                events.append("end")
+                assertEqual("TAG", tag)
+            def close(self):
+                raise ValueError("TEST-VE")
+
+        parser = self.XMLParser(target=Target())
+
+        try:
+            parser.feed("<TAG/>")
+            parser.close()
+        except IndexError:
+            if 'lxml' in self.etree.__name__:
+                # we try not to swallow the initial exception in Py2
+                self.assertTrue(sys.version_info[0] < 3)
+            self.assertTrue('TEST-IE' in str(sys.exc_info()[1]))
+        except ValueError:
+            if 'lxml' in self.etree.__name__:
+                self.assertTrue(sys.version_info[0] >= 3)
+            self.assertTrue('TEST-VE' in str(sys.exc_info()[1]))
+        else:
+            self.assertTrue(False)
+
+        if 'lxml' in self.etree.__name__:
+            self.assertEqual(["start"], events)
+        else:
+            # cElementTree calls end() as well
+            self.assertTrue("start" in events)
+
+    def test_elementtree_parser_target(self):
+        assertEqual = self.assertEqual
+        assertFalse  = self.assertFalse
+        Element = self.etree.Element
+
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start")
+                assertFalse(attrib)
+                assertEqual("TAG", tag)
+            def end(self, tag):
+                events.append("end")
+                assertEqual("TAG", tag)
+            def close(self):
+                return Element("DONE")
+        # the tree root is expected to be whatever the target's close() returns
+        parser = self.XMLParser(target=Target())
+        tree = self.etree.ElementTree()
+        tree.parse(BytesIO(_bytes("<TAG/>")), parser=parser)
+        # BytesIO is fed bytes (via _bytes), as the byte-feeding tests do
+        self.assertEqual("DONE", tree.getroot().tag)
+        self.assertEqual(["start", "end"], events)
+
+    def test_parser_target_attrib(self):
+        assertEqual = self.assertEqual
+
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start-" + tag)
+                for name, value in attrib.items():
+                    assertEqual(tag + name, value)
+            def end(self, tag):
+                events.append("end-" + tag)
+            def close(self):
+                return "DONE"
+
+        parser = self.XMLParser(target=Target())
+
+        parser.feed('<root a="roota" b="rootb"><sub c="subc"/></root>')
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual(["start-root", "start-sub", "end-sub", "end-root"],
+                          events)
+
+    def test_parser_target_data(self):
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start-" + tag)
+            def end(self, tag):
+                events.append("end-" + tag)
+            def data(self, data):
+                events.append("data-" + data)
+            def close(self):
+                return "DONE"
+
+        parser = self.XMLParser(target=Target())
+
+        parser.feed('<root>A<sub/>B</root>')
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual(["start-root", "data-A", "start-sub",
+                           "end-sub", "data-B", "end-root"],
+                          events)
+
+    def test_parser_target_entity(self):
+        events = []
+        class Target(object):
+            def __init__(self):
+                self._data = []
+            def _flush_data(self):
+                if self._data:
+                    events.append("data-" + ''.join(self._data))
+                    del self._data[:]
+            def start(self, tag, attrib):
+                self._flush_data()
+                events.append("start-" + tag)
+            def end(self, tag):
+                self._flush_data()
+                events.append("end-" + tag)
+            def data(self, data):
+                self._data.append(data)
+            def close(self):
+                self._flush_data()
+                return "DONE"
+
+        parser = self.XMLParser(target=Target())
+
+        dtd = '''
+            <!DOCTYPE root [
+            <!ELEMENT root (sub*)>
+            <!ELEMENT sub (#PCDATA)>
+            <!ENTITY ent "an entity">
+        ]>
+        '''
+        parser.feed(dtd+'<root><sub/><sub>this is &ent;</sub><sub/></root>')
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual(["start-root", "start-sub", "end-sub", "start-sub",
+                           "data-this is an entity",
+                           "end-sub", "start-sub", "end-sub", "end-root"],
+                          events)
+
+    required_versions_ET['test_parser_target_entity_unknown'] = (1,3)
+    def test_parser_target_entity_unknown(self):
+        events = []
+        class Target(object):
+            def __init__(self):
+                self._data = []
+            def _flush_data(self):
+                if self._data:
+                    events.append("data-" + ''.join(self._data))
+                    del self._data[:]
+            def start(self, tag, attrib):
+                self._flush_data()
+                events.append("start-" + tag)
+            def end(self, tag):
+                self._flush_data()
+                events.append("end-" + tag)
+            def data(self, data):
+                self._data.append(data)
+            def close(self):
+                self._flush_data()
+                return "DONE"
+
+        parser = self.XMLParser(target=Target())
+
+        def feed():
+            parser.feed('<root><sub/><sub>some &ent;</sub><sub/></root>')
+            parser.close()
+
+        self.assertRaises(self.etree.ParseError, feed)
+
+    def test_treebuilder(self):
+        builder = self.etree.TreeBuilder()
+        el = builder.start("root", {'a':'A', 'b':'B'})
+        self.assertEqual("root", el.tag)
+        self.assertEqual({'a':'A', 'b':'B'}, el.attrib)
+        builder.data("ROOTTEXT")
+        el = builder.start("child", {'x':'X', 'y':'Y'})
+        self.assertEqual("child", el.tag)
+        self.assertEqual({'x':'X', 'y':'Y'}, el.attrib)
+        builder.data("CHILDTEXT")
+        el = builder.end("child")
+        self.assertEqual("child", el.tag)
+        self.assertEqual({'x':'X', 'y':'Y'}, el.attrib)
+        self.assertEqual("CHILDTEXT", el.text)
+        self.assertEqual(None, el.tail)
+        builder.data("CHILDTAIL")
+        root = builder.end("root")
+
+        self.assertEqual("root", root.tag)
+        self.assertEqual("ROOTTEXT", root.text)
+        self.assertEqual("CHILDTEXT", root[0].text)
+        self.assertEqual("CHILDTAIL", root[0].tail)
+
+    def test_treebuilder_target(self):
+        parser = self.XMLParser(target=self.etree.TreeBuilder())
+        parser.feed('<root>ROOTTEXT<child>CHILDTEXT</child>CHILDTAIL</root>')
+        root = parser.close()
+
+        self.assertEqual("root", root.tag)
+        self.assertEqual("ROOTTEXT", root.text)
+        self.assertEqual("CHILDTEXT", root[0].text)
+        self.assertEqual("CHILDTAIL", root[0].tail)
+
+    # helper methods
+
+    def _writeElement(self, element, encoding='us-ascii'):
+        """Serialise element in memory and return the result
+        in canonicalized form, ready for comparison.
+        """
+        return canonicalize(self.etree.tostring(element, encoding=encoding))
+
+    def _writeElementFile(self, element, encoding='us-ascii'):
+        """Write out element for comparison, using real file.
+
+        Serialises into a temporary file, reads the bytes back and returns
+        them canonicalized; the temporary file is removed again afterwards.
+        """
+        handle, filename = tempfile.mkstemp()
+        try:
+            tree = self.etree.ElementTree(element=element)
+            with open(filename, 'wb') as f:
+                tree.write(f, encoding=encoding)
+            with open(filename, 'rb') as f:
+                data = f.read()
+        finally:
+            os.close(handle)
+            os.remove(filename)
+        return canonicalize(data)
+
+    def assertXML(self, expected, element, encoding='us-ascii'):
+        """Serialise element and compare the output with expected.
+
+        Checked twice: once serialised in memory, once via a real file.
+        """
+        if isinstance(expected, unicode):
+            expected = expected.encode(encoding)
+        for write in (self._writeElement, self._writeElementFile):
+            self.assertEqual(expected, write(element, encoding))
+
+    def assertEncodingDeclaration(self, result, encoding):
+        """Assert that the XML declaration of result names encoding.
+        """
+        enc_re = r"<\?xml[^>]+ encoding=[\"']([^\"']+)[\"']"
+        # match with a bytes pattern unless the serialised result is a str
+        pattern = enc_re if isinstance(result, str) else _bytes(enc_re)
+        found = re.match(pattern, result)
+        self.assertTrue(found)
+        declared = found.group(1)
+        self.assertEqual(declared.upper(), encoding.upper())
+        
+    def _rootstring(self, tree):  # serialised root, spaces and newlines removed
+        xml = self.etree.tostring(tree.getroot())
+        return xml.replace(_bytes(' '), _bytes('')).replace(_bytes('\n'), _bytes(''))
+
+    def _check_element_tree(self, tree):
+        self._check_element(tree.getroot())
+        
+    def _check_element(self, element):
+        # an element has to expose these four attributes
+        for name in ('tag', 'attrib', 'text', 'tail'):
+            self.assertTrue(hasattr(element, name))
+        self._check_string(element.tag)
+        self._check_mapping(element.attrib)
+        # text and tail may be None; only check them when they are set
+        if element.text is not None:
+            self._check_string(element.text)
+        if element.tail is not None:
+            self._check_string(element.tail)
+        
+    def _check_string(self, string):
+        len(string)
+        for char in string:
+            self.assertEqual(1, len(char))
+        new_string = string + ""
+        new_string = string + " "
+        string[:0]
+
+    def _check_mapping(self, mapping):
+        len(mapping)
+        keys = mapping.keys()
+        values = mapping.values()
+        items = mapping.items()
+        for key in keys:
+            item = mapping[key]
+        mapping["key"] = "value"
+        self.assertEqual("value", mapping["key"])
+
+
+class _XMLPullParserTest(unittest.TestCase):
+    etree = None
+
+    def _feed(self, parser, data, chunk_size=None):
+        if chunk_size is not None:  # feed consecutive chunk_size slices
+            for start in range(0, len(data), chunk_size):
+                parser.feed(data[start:start + chunk_size])
+            return
+        parser.feed(data)
+
+    def _close_and_return_root(self, parser):
+        # ElementTree's API is a bit unwieldy in Py3.4, so its parser is
+        # closed through a private helper rather than close().
+        use_private = 'ElementTree' in self.etree.__name__
+        if use_private:
+            return parser._close_and_return_root()
+        return parser.close()
+
+    def assert_event_tags(self, parser, expected):
+        # compare the events read from the parser as (action, tag) pairs
+        seen = [(action, elem.tag) for action, elem in parser.read_events()]
+        self.assertEqual(seen, expected)
+
+    def test_simple_xml(self):
+        for chunk_size in (None, 1, 5):
+            #with self.subTest(chunk_size=chunk_size):
+                parser = self.etree.XMLPullParser()
+                self.assert_event_tags(parser, [])
+                self._feed(parser, "<!-- comment -->\n", chunk_size)
+                self.assert_event_tags(parser, [])
+                self._feed(parser,
+                           "<root>\n  <element key='value'>text</element",
+                           chunk_size)
+                self.assert_event_tags(parser, [])
+                self._feed(parser, ">\n", chunk_size)
+                self.assert_event_tags(parser, [('end', 'element')])
+                self._feed(parser, "<element>text</element>tail\n", chunk_size)
+                self._feed(parser, "<empty-element/>\n", chunk_size)
+                self.assert_event_tags(parser, [
+                    ('end', 'element'),
+                    ('end', 'empty-element'),
+                    ])
+                self._feed(parser, "</root>\n", chunk_size)
+                self.assert_event_tags(parser, [('end', 'root')])
+                root = self._close_and_return_root(parser)
+                self.assertEqual(root.tag, 'root')
+
+    def test_feed_while_iterating(self):
+        # The event iterator is created before any data is fed and is
+        # then advanced step by step between the feed() calls.
+        parser = self.etree.XMLPullParser()
+        events = parser.read_events()
+        self._feed(parser, "<root>\n  <element key='value'>text</element>\n")
+        action, elem = next(events)
+        self.assertEqual((action, elem.tag), ('end', 'element'))
+
+        self._feed(parser, "</root>\n")
+        action, elem = next(events)
+        self.assertEqual((action, elem.tag), ('end', 'root'))
+
+        # after the 'end' event of the root the iterator must be exhausted
+        self.assertRaises(StopIteration, next, events)
+
+    def test_simple_xml_with_ns(self):
+        parser = self.etree.XMLPullParser()
+        self.assert_event_tags(parser, [])
+        self._feed(parser, "<!-- comment -->\n")
+        self.assert_event_tags(parser, [])
+        self._feed(parser, "<root xmlns='namespace'>\n")
+        self.assert_event_tags(parser, [])
+        self._feed(parser, "<element key='value'>text</element")
+        self.assert_event_tags(parser, [])
+        self._feed(parser, ">\n")
+        self.assert_event_tags(parser, [('end', '{namespace}element')])
+        self._feed(parser, "<element>text</element>tail\n")
+        self._feed(parser, "<empty-element/>\n")
+        self.assert_event_tags(parser, [
+            ('end', '{namespace}element'),
+            ('end', '{namespace}empty-element'),
+            ])
+        self._feed(parser, "</root>\n")
+        self.assert_event_tags(parser, [('end', '{namespace}root')])
+        root = self._close_and_return_root(parser)
+        self.assertEqual(root.tag, '{namespace}root')
+
+    def test_ns_events(self):
+        parser = self.etree.XMLPullParser(events=('start-ns', 'end-ns'))
+        self._feed(parser, "<!-- comment -->\n")
+        self._feed(parser, "<root xmlns='namespace'>\n")
+        self.assertEqual(
+            list(parser.read_events()),
+            [('start-ns', ('', 'namespace'))])
+        self._feed(parser, "<element key='value'>text</element")
+        self._feed(parser, ">\n")
+        self._feed(parser, "<element>text</element>tail\n")
+        self._feed(parser, "<empty-element/>\n")
+        self._feed(parser, "</root>\n")
+        self.assertEqual(list(parser.read_events()), [('end-ns', None)])
+        parser.close()
+
+    def test_events(self):
+        parser = self.etree.XMLPullParser(events=())
+        self._feed(parser, "<root/>\n")
+        self.assert_event_tags(parser, [])
+
+        parser = self.etree.XMLPullParser(events=('start', 'end'))
+        self._feed(parser, "<!-- comment -->\n")
+        self.assert_event_tags(parser, [])
+        self._feed(parser, "<root>\n")
+        self.assert_event_tags(parser, [('start', 'root')])
+        self._feed(parser, "<element key='value'>text</element")
+        self.assert_event_tags(parser, [('start', 'element')])
+        self._feed(parser, ">\n")
+        self.assert_event_tags(parser, [('end', 'element')])
+        self._feed(parser,
+                   "<element xmlns='foo'>text<empty-element/></element>tail\n")
+        self.assert_event_tags(parser, [
+            ('start', '{foo}element'),
+            ('start', '{foo}empty-element'),
+            ('end', '{foo}empty-element'),
+            ('end', '{foo}element'),
+            ])
+        self._feed(parser, "</root>")
+        root = self._close_and_return_root(parser)
+        self.assert_event_tags(parser, [('end', 'root')])
+        self.assertEqual(root.tag, 'root')
+
+        parser = self.etree.XMLPullParser(events=('start',))
+        self._feed(parser, "<!-- comment -->\n")
+        self.assert_event_tags(parser, [])
+        self._feed(parser, "<root>\n")
+        self.assert_event_tags(parser, [('start', 'root')])
+        self._feed(parser, "<element key='value'>text</element")
+        self.assert_event_tags(parser, [('start', 'element')])
+        self._feed(parser, ">\n")
+        self.assert_event_tags(parser, [])
+        self._feed(parser,
+                   "<element xmlns='foo'>text<empty-element/></element>tail\n")
+        self.assert_event_tags(parser, [
+            ('start', '{foo}element'),
+            ('start', '{foo}empty-element'),
+            ])
+        self._feed(parser, "</root>")
+        root = self._close_and_return_root(parser)
+        self.assertEqual(root.tag, 'root')
+
+    def test_events_sequence(self):
+        # Test that events can be some sequence that's not just a tuple or list
+        eventset = set(['end', 'start'])
+        parser = self.etree.XMLPullParser(events=eventset)
+        self._feed(parser, "<foo>bar</foo>")
+        self.assert_event_tags(parser, [('start', 'foo'), ('end', 'foo')])
+
+        class DummyIter:
+            def __init__(self):
+                self.events = iter(['start', 'end', 'start-ns'])
+            def __iter__(self):
+                return self
+            def __next__(self):
+                return next(self.events)
+            next = __next__
+
+        parser = self.etree.XMLPullParser(events=DummyIter())
+        self._feed(parser, "<foo>bar</foo>")
+        self.assert_event_tags(parser, [('start', 'foo'), ('end', 'foo')])
+
+    def test_unknown_event(self):
+        # an event name that the pull parser does not know must be
+        # rejected with a ValueError when the parser is created
+        self.assertRaises(
+            ValueError,
+            self.etree.XMLPullParser,
+            events=('start', 'end', 'bogus'))
+
+
+if etree:
+    class ETreeTestCase(_ETreeTestCaseBase):
+        etree = etree
+
+    class ETreePullTestCase(_XMLPullParserTest):
+        etree = etree
+
+
+if ElementTree:
+    class ElementTreeTestCase(_ETreeTestCaseBase):
+        etree = ElementTree
+
+        @classmethod
+        def setUpClass(cls):
+            import warnings
+            # ElementTree warns about getiterator() in recent Pythons
+            warnings.filterwarnings(
+                'ignore',
+                r'This method will be removed.*\.iter\(\).*instead',  # regex: raw
+                PendingDeprecationWarning)
+
+    filter_by_version(
+        ElementTreeTestCase,
+        ElementTreeTestCase.required_versions_ET, ET_VERSION)
+
+    if hasattr(ElementTree, 'XMLPullParser'):
+        class ElementTreePullTestCase(_XMLPullParserTest):
+            etree = ElementTree
+    else:
+        ElementTreePullTestCase = None
+
+
+if cElementTree:
+    class CElementTreeTestCase(_ETreeTestCaseBase):
+        etree = cElementTree
+
+    filter_by_version(
+        CElementTreeTestCase,
+        CElementTreeTestCase.required_versions_cET, CET_VERSION)
+
+
+def test_suite():
+    load = unittest.defaultTestLoader.loadTestsFromTestCase  # makeSuite() is deprecated
+    cases = []
+    if etree:
+        cases += [ETreeTestCase, ETreePullTestCase]
+    if ElementTree:
+        cases.append(ElementTreeTestCase)
+        if ElementTreePullTestCase:
+            cases.append(ElementTreePullTestCase)
+    if cElementTree:
+        cases.append(CElementTreeTestCase)
+    return unittest.TestSuite([load(case) for case in cases])
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_errors.py b/lib/lxml/tests/test_errors.py
new file mode 100644
index 00000000..fb6dfc43
--- /dev/null
+++ b/lib/lxml/tests/test_errors.py
@@ -0,0 +1,50 @@
+# -*- coding: utf-8 -*-
+import unittest, doctest
+
+# These tests check that error handling in the Pyrex code is
+# complete.
+# Where error handling is missing, the code is likely to crash
+# outright rather than fail a test.
+
+import sys, gc, os.path
+from lxml import etree
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import HelperTestCase
+
+class ErrorTestCase(HelperTestCase):
+    etree = etree
+
+    def test_bad_element(self):
+        # attrib argument of Element() should be a dictionary, so if
+        # we pass a string we should get an error.
+        self.assertRaises(TypeError, self.etree.Element, 'a', 'b')
+
+    def test_empty_parse(self):
+        self.assertRaises(etree.XMLSyntaxError, etree.fromstring, '')
+
+    def test_element_cyclic_gc_none(self):
+        # test if cyclic reference can crash etree
+        Element = self.etree.Element
+        gc.collect()
+        # baseline reference count of None, compared again after collection
+        count = sys.getrefcount(None)
+
+        l = [Element('name'), Element('name')]
+        l.append(l)  # the list now contains itself, forming a reference cycle
+
+        del l
+        gc.collect()
+        # the reference count of None must be the same as before
+        self.assertEqual(sys.getrefcount(None), count)
+
+def test_suite():
+    # unittest.makeSuite() is deprecated; load through the default loader
+    loader = unittest.defaultTestLoader
+    return unittest.TestSuite([loader.loadTestsFromTestCase(ErrorTestCase)])
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_etree.py b/lib/lxml/tests/test_etree.py
new file mode 100644
index 00000000..e9161618
--- /dev/null
+++ b/lib/lxml/tests/test_etree.py
@@ -0,0 +1,4163 @@
+# -*- coding: utf-8 -*-
+
+"""
+Tests specific to the extended etree API
+
+Tests that apply to the general ElementTree API should go into
+test_elementtree
+"""
+
+import os.path
+import unittest
+import copy
+import sys
+import re
+import gc
+import operator
+import tempfile
+import textwrap
+import zlib
+import gzip
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, StringIO, BytesIO, HelperTestCase
+from common_imports import fileInTestDir, fileUrlInTestDir, read_file, path2url
+from common_imports import SillyFileLike, LargeFileLikeUnicode, doctest, make_doctest
+from common_imports import canonicalize, sorted, _str, _bytes
+
+print("")
+print("TESTED VERSION: %s" % etree.__version__)
+print("    Python:           " + repr(sys.version_info))
+print("    lxml.etree:       " + repr(etree.LXML_VERSION))
+print("    libxml used:      " + repr(etree.LIBXML_VERSION))
+print("    libxml compiled:  " + repr(etree.LIBXML_COMPILED_VERSION))
+print("    libxslt used:     " + repr(etree.LIBXSLT_VERSION))
+print("    libxslt compiled: " + repr(etree.LIBXSLT_COMPILED_VERSION))
+print("")
+
+try:
+    _unicode = unicode
+except NameError:
+    # Python 3
+    _unicode = str
+
+class ETreeOnlyTestCase(HelperTestCase):
+    """Tests only for etree, not ElementTree"""
+    etree = etree
+
+    def test_version(self):
+        self.assertTrue(isinstance(etree.__version__, _unicode))
+        self.assertTrue(isinstance(etree.LXML_VERSION, tuple))
+        self.assertEqual(len(etree.LXML_VERSION), 4)
+        self.assertTrue(isinstance(etree.LXML_VERSION[0], int))
+        self.assertTrue(isinstance(etree.LXML_VERSION[1], int))
+        self.assertTrue(isinstance(etree.LXML_VERSION[2], int))
+        self.assertTrue(isinstance(etree.LXML_VERSION[3], int))
+        self.assertTrue(etree.__version__.startswith(
+            str(etree.LXML_VERSION[0])))
+
+    def test_c_api(self):
+        if hasattr(self.etree, '__pyx_capi__'):
+            # newer Pyrex compatible C-API
+            self.assertTrue(isinstance(self.etree.__pyx_capi__, dict))
+            self.assertTrue(len(self.etree.__pyx_capi__) > 0)
+        else:
+            # older C-API mechanism
+            self.assertTrue(hasattr(self.etree, '_import_c_api'))
+
+    def test_element_names(self):
+        Element = self.etree.Element
+        el = Element('name')
+        self.assertEqual(el.tag, 'name')
+        el = Element('{}name')
+        self.assertEqual(el.tag, 'name')
+
+    def test_element_name_empty(self):
+        Element = self.etree.Element
+        el = Element('name')
+        self.assertRaises(ValueError, Element, '{}')
+        self.assertRaises(ValueError, setattr, el, 'tag', '{}')
+
+        self.assertRaises(ValueError, Element, '{test}')
+        self.assertRaises(ValueError, setattr, el, 'tag', '{test}')
+
+    def test_element_name_colon(self):
+        Element = self.etree.Element
+        self.assertRaises(ValueError, Element, 'p:name')
+        self.assertRaises(ValueError, Element, '{test}p:name')
+
+        el = Element('name')
+        self.assertRaises(ValueError, setattr, el, 'tag', 'p:name')
+
+    def test_element_name_quote(self):
+        Element = self.etree.Element
+        self.assertRaises(ValueError, Element, "p'name")
+        self.assertRaises(ValueError, Element, 'p"name')
+
+        self.assertRaises(ValueError, Element, "{test}p'name")
+        self.assertRaises(ValueError, Element, '{test}p"name')
+
+        el = Element('name')
+        self.assertRaises(ValueError, setattr, el, 'tag', "p'name")
+        self.assertRaises(ValueError, setattr, el, 'tag', 'p"name')
+
+    def test_element_name_space(self):
+        Element = self.etree.Element
+        self.assertRaises(ValueError, Element, ' name ')
+        self.assertRaises(ValueError, Element, 'na me')
+        self.assertRaises(ValueError, Element, '{test} name')
+
+        el = Element('name')
+        self.assertRaises(ValueError, setattr, el, 'tag', ' name ')
+
+    def test_subelement_name_empty(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        el = Element('name')
+        self.assertRaises(ValueError, SubElement, el, '{}')
+        self.assertRaises(ValueError, SubElement, el, '{test}')
+
+    def test_subelement_name_colon(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        el = Element('name')
+        self.assertRaises(ValueError, SubElement, el, 'p:name')
+        self.assertRaises(ValueError, SubElement, el, '{test}p:name')
+
+    def test_subelement_name_quote(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        el = Element('name')
+        self.assertRaises(ValueError, SubElement, el, "p'name")
+        self.assertRaises(ValueError, SubElement, el, "{test}p'name")
+
+        self.assertRaises(ValueError, SubElement, el, 'p"name')
+        self.assertRaises(ValueError, SubElement, el, '{test}p"name')
+
+    def test_subelement_name_space(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        el = Element('name')
+        self.assertRaises(ValueError, SubElement, el, ' name ')
+        self.assertRaises(ValueError, SubElement, el, 'na me')
+        self.assertRaises(ValueError, SubElement, el, '{test} name')
+
+    def test_subelement_attribute_invalid(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        el = Element('name')
+        self.assertRaises(ValueError, SubElement, el, 'name', {'a b c' : 'abc'})
+        self.assertRaises(ValueError, SubElement, el, 'name', {'a' : 'a\0\n'})
+        self.assertEqual(0, len(el))
+
+    def test_qname_empty(self):
+        QName = self.etree.QName
+        self.assertRaises(ValueError, QName, '')
+        self.assertRaises(ValueError, QName, 'test', '')
+
+    def test_qname_colon(self):
+        QName = self.etree.QName
+        self.assertRaises(ValueError, QName, 'p:name')
+        self.assertRaises(ValueError, QName, 'test', 'p:name')
+
+    def test_qname_space(self):
+        QName = self.etree.QName
+        self.assertRaises(ValueError, QName, ' name ')
+        self.assertRaises(ValueError, QName, 'na me')
+        self.assertRaises(ValueError, QName, 'test', ' name')
+
+    def test_qname_namespace_localname(self):
+        # ET doesn't have namespace/localname properties on QNames
+        QName = self.etree.QName
+        namespace, localname = 'http://myns', 'a'
+        qname = QName(namespace, localname)
+        self.assertEqual(namespace, qname.namespace)
+        self.assertEqual(localname, qname.localname)
+
+    def test_qname_element(self):
+        # lxml.etree's QName() also accepts an Element and takes over its tag
+        QName = self.etree.QName
+        qname1 = QName('http://myns', 'a')
+        a = self.etree.Element(qname1, nsmap={'p' : 'http://myns'})
+
+        qname2 = QName(a)
+        self.assertEqual(a.tag, qname1.text)
+        self.assertEqual(qname1.text, qname2.text)
+        self.assertEqual(qname1, qname2)
+
+    def test_qname_text_resolve(self):
+        # ET doesn't resolve QNames as text values
+        etree = self.etree
+        qname = etree.QName('http://myns', 'a')
+        a = etree.Element(qname, nsmap={'p' : 'http://myns'})
+        a.text = qname
+
+        self.assertEqual("p:a", a.text)
+
+    def test_nsmap_prefix_invalid(self):
+        etree = self.etree
+        self.assertRaises(ValueError,
+                          etree.Element, "root", nsmap={'"' : 'testns'})
+        self.assertRaises(ValueError,
+                          etree.Element, "root", nsmap={'&' : 'testns'})
+        self.assertRaises(ValueError,
+                          etree.Element, "root", nsmap={'a:b' : 'testns'})
+
+    def test_attribute_has_key(self):
+        # ET in Py 3.x has no "attrib.has_key()" method
+        XML = self.etree.XML
+
+        root = XML(_bytes('<foo bar="Bar" xmlns:ns="http://ns.codespeak.net/test" ns:baz="Baz" />'))
+        self.assertEqual(
+            True, root.attrib.has_key('bar'))
+        self.assertEqual(
+            False, root.attrib.has_key('baz'))
+        self.assertEqual(
+            False, root.attrib.has_key('hah'))
+        self.assertEqual(
+            True,
+            root.attrib.has_key('{http://ns.codespeak.net/test}baz'))
+
+    def test_attribute_set(self):
+        Element = self.etree.Element
+        root = Element("root")
+        root.set("attr", "TEST")
+        self.assertEqual("TEST", root.get("attr"))
+
+    def test_attrib_and_keywords(self):
+        Element = self.etree.Element
+
+        root = Element("root")
+        root.set("attr", "TEST")
+        self.assertEqual("TEST", root.attrib["attr"])
+
+        root2 = Element("root2", root.attrib, attr2='TOAST')
+        self.assertEqual("TEST", root2.attrib["attr"])
+        self.assertEqual("TOAST", root2.attrib["attr2"])
+        self.assertEqual(None, root.attrib.get("attr2"))
+
+    def test_attrib_order(self):
+        Element = self.etree.Element
+
+        keys = ["attr%d" % i for i in range(10)]
+        values = ["TEST-%d" % i for i in range(10)]
+        items = list(zip(keys, values))
+
+        root = Element("root")
+        for key, value in items:
+            root.set(key, value)
+        self.assertEqual(keys, root.attrib.keys())
+        self.assertEqual(values, root.attrib.values())
+
+        root2 = Element("root2", root.attrib,
+                        attr_99='TOAST-1', attr_98='TOAST-2')
+        self.assertEqual(['attr_98', 'attr_99'] + keys,
+                         root2.attrib.keys())
+        self.assertEqual(['TOAST-2', 'TOAST-1'] + values,
+                         root2.attrib.values())
+
+        self.assertEqual(keys, root.attrib.keys())
+        self.assertEqual(values, root.attrib.values())
+
+    def test_attribute_set_invalid(self):
+        # ElementTree accepts arbitrary attribute values
+        # lxml.etree allows only strings
+        Element = self.etree.Element
+        root = Element("root")
+        self.assertRaises(TypeError, root.set, "newattr", 5)
+        self.assertRaises(TypeError, root.set, "newattr", None)
+
+    def test_strip_attributes(self):
+        XML = self.etree.XML
+        xml = _bytes('<test a="5" b="10" c="20"><x a="4" b="2"/></test>')
+
+        root = XML(xml)
+        self.etree.strip_attributes(root, 'a')
+        self.assertEqual(_bytes('<test b="10" c="20"><x b="2"></x></test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_attributes(root, 'b', 'c')
+        self.assertEqual(_bytes('<test a="5"><x a="4"></x></test>'),
+                          self._writeElement(root))
+
+    def test_strip_attributes_ns(self):
+        XML = self.etree.XML
+        xml = _bytes('<test xmlns:n="http://test/ns" a="6" b="10" c="20" n:a="5"><x a="4" n:b="2"/></test>')
+
+        root = XML(xml)
+        self.etree.strip_attributes(root, 'a')
+        self.assertEqual(
+            _bytes('<test xmlns:n="http://test/ns" b="10" c="20" n:a="5"><x n:b="2"></x></test>'),
+            self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_attributes(root, '{http://test/ns}a', 'c')
+        self.assertEqual(
+            _bytes('<test xmlns:n="http://test/ns" a="6" b="10"><x a="4" n:b="2"></x></test>'),
+            self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_attributes(root, '{http://test/ns}*')
+        self.assertEqual(
+            _bytes('<test xmlns:n="http://test/ns" a="6" b="10" c="20"><x a="4"></x></test>'),
+            self._writeElement(root))
+
+    def test_strip_elements(self):
+        XML = self.etree.XML
+        xml = _bytes('<test><a><b><c/></b></a><x><a><b/><c/></a></x></test>')
+
+        root = XML(xml)
+        self.etree.strip_elements(root, 'a')
+        self.assertEqual(_bytes('<test><x></x></test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_elements(root, 'b', 'c', 'X', 'Y', 'Z')
+        self.assertEqual(_bytes('<test><a></a><x><a></a></x></test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_elements(root, 'c')
+        self.assertEqual(_bytes('<test><a><b></b></a><x><a><b></b></a></x></test>'),
+                          self._writeElement(root))
+
+    def test_strip_elements_ns(self):
+        XML = self.etree.XML
+        xml = _bytes('<test>TEST<n:a xmlns:n="urn:a">A<b>B<c xmlns="urn:c"/>C</b>BT</n:a>AT<x>X<a>A<b xmlns="urn:a"/>BT<c xmlns="urn:x"/>CT</a>AT</x>XT</test>')
+
+        root = XML(xml)
+        self.etree.strip_elements(root, 'a')
+        self.assertEqual(_bytes('<test>TEST<n:a xmlns:n="urn:a">A<b>B<c xmlns="urn:c"></c>C</b>BT</n:a>AT<x>X</x>XT</test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_elements(root, '{urn:a}b', 'c')
+        self.assertEqual(_bytes('<test>TEST<n:a xmlns:n="urn:a">A<b>B<c xmlns="urn:c"></c>C</b>BT</n:a>AT<x>X<a>A<c xmlns="urn:x"></c>CT</a>AT</x>XT</test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_elements(root, '{urn:a}*', 'c')
+        self.assertEqual(_bytes('<test>TEST<x>X<a>A<c xmlns="urn:x"></c>CT</a>AT</x>XT</test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_elements(root, '{urn:a}*', 'c', with_tail=False)
+        self.assertEqual(_bytes('<test>TESTAT<x>X<a>ABT<c xmlns="urn:x"></c>CT</a>AT</x>XT</test>'),
+                          self._writeElement(root))
+
+    def test_strip_tags(self):
+        XML = self.etree.XML
+        xml = _bytes('<test>TEST<a>A<b>B<c/>CT</b>BT</a>AT<x>X<a>A<b/>BT<c/>CT</a>AT</x>XT</test>')
+
+        root = XML(xml)
+        self.etree.strip_tags(root, 'a')
+        self.assertEqual(_bytes('<test>TESTA<b>B<c></c>CT</b>BTAT<x>XA<b></b>BT<c></c>CTAT</x>XT</test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(root, 'b', 'c', 'X', 'Y', 'Z')
+        self.assertEqual(_bytes('<test>TEST<a>ABCTBT</a>AT<x>X<a>ABTCT</a>AT</x>XT</test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(root, 'c')
+        self.assertEqual(_bytes('<test>TEST<a>A<b>BCT</b>BT</a>AT<x>X<a>A<b></b>BTCT</a>AT</x>XT</test>'),
+                          self._writeElement(root))
+
+    def test_strip_tags_pi_comment(self):
+        XML = self.etree.XML
+        PI = self.etree.ProcessingInstruction
+        Comment = self.etree.Comment
+        xml = _bytes('<!--comment1-->\n<?PI1?>\n<test>TEST<!--comment2-->XT<?PI2?></test>\n<!--comment3-->\n<?PI1?>')
+
+        root = XML(xml)
+        self.etree.strip_tags(root, PI)
+        self.assertEqual(_bytes('<!--comment1-->\n<?PI1?>\n<test>TEST<!--comment2-->XT</test>\n<!--comment3-->\n<?PI1?>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(root, Comment)
+        self.assertEqual(_bytes('<!--comment1-->\n<?PI1?>\n<test>TESTXT<?PI2?></test>\n<!--comment3-->\n<?PI1?>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(root, PI, Comment)
+        self.assertEqual(_bytes('<!--comment1-->\n<?PI1?>\n<test>TESTXT</test>\n<!--comment3-->\n<?PI1?>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(root, Comment, PI)
+        self.assertEqual(_bytes('<!--comment1-->\n<?PI1?>\n<test>TESTXT</test>\n<!--comment3-->\n<?PI1?>'),
+                          self._writeElement(root))
+
+    def test_strip_tags_pi_comment_all(self):
+        XML = self.etree.XML
+        ElementTree = self.etree.ElementTree
+        PI = self.etree.ProcessingInstruction
+        Comment = self.etree.Comment
+        xml = _bytes('<!--comment1-->\n<?PI1?>\n<test>TEST<!--comment2-->XT<?PI2?></test>\n<!--comment3-->\n<?PI1?>')
+
+        root = XML(xml)
+        self.etree.strip_tags(ElementTree(root), PI)
+        self.assertEqual(_bytes('<!--comment1-->\n<test>TEST<!--comment2-->XT</test>\n<!--comment3-->'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(ElementTree(root), Comment)
+        self.assertEqual(_bytes('<?PI1?>\n<test>TESTXT<?PI2?></test>\n<?PI1?>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(ElementTree(root), PI, Comment)
+        self.assertEqual(_bytes('<test>TESTXT</test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(ElementTree(root), Comment, PI)
+        self.assertEqual(_bytes('<test>TESTXT</test>'),
+                          self._writeElement(root))
+
+    def test_strip_tags_doc_style(self):
+        XML = self.etree.XML
+        xml = _bytes('''
+        <div>
+            <div>
+                I like <strong>sheep</strong>.
+                <br/>
+                I like lots of <strong>sheep</strong>.
+                <br/>
+                Click <a href="http://www.sheep.com">here</a>
+                 for <a href="http://www.sheep.com">those</a> sheep.
+                <br/>
+            </div>
+        </div>
+        '''.strip())
+
+        root = XML(xml)
+        self.etree.strip_tags(root, 'a')
+        self.assertEqual(re.sub(_bytes('</?a[^>]*>'), _bytes(''), xml).replace(_bytes('<br/>'), _bytes('<br></br>')),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(root, 'a', 'br')
+        self.assertEqual(re.sub(_bytes('</?a[^>]*>'), _bytes(''),
+                                 re.sub(_bytes('<br[^>]*>'), _bytes(''), xml)),
+                          self._writeElement(root))
+
+    def test_strip_tags_ns(self):
+        XML = self.etree.XML
+        xml = _bytes('<test>TEST<n:a xmlns:n="urn:a">A<b>B<c xmlns="urn:c"/>CT</b>BT</n:a>AT<x>X<a>A<b xmlns="urn:a"/>BT<c xmlns="urn:x"/>CT</a>AT</x>XT</test>')
+
+        root = XML(xml)
+        self.etree.strip_tags(root, 'a')
+        self.assertEqual(_bytes('<test>TEST<n:a xmlns:n="urn:a">A<b>B<c xmlns="urn:c"></c>CT</b>BT</n:a>AT<x>XA<b xmlns="urn:a"></b>BT<c xmlns="urn:x"></c>CTAT</x>XT</test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(root, '{urn:a}b', 'c')
+        self.assertEqual(_bytes('<test>TEST<n:a xmlns:n="urn:a">A<b>B<c xmlns="urn:c"></c>CT</b>BT</n:a>AT<x>X<a>ABT<c xmlns="urn:x"></c>CT</a>AT</x>XT</test>'),
+                          self._writeElement(root))
+
+        root = XML(xml)
+        self.etree.strip_tags(root, '{urn:a}*', 'c')
+        self.assertEqual(_bytes('<test>TESTA<b>B<c xmlns="urn:c"></c>CT</b>BTAT<x>X<a>ABT<c xmlns="urn:x"></c>CT</a>AT</x>XT</test>'),
+                          self._writeElement(root))
+
+    def test_strip_tags_and_remove(self):
+        # previously crashed
+        HTML = self.etree.HTML
+        root = HTML(_bytes('<div><h1>title</h1> <b>foo</b> <p>boo</p></div>'))[0][0]
+        self.assertEqual(_bytes('<div><h1>title</h1> <b>foo</b> <p>boo</p></div>'),
+                          self.etree.tostring(root))
+        self.etree.strip_tags(root, 'b')
+        self.assertEqual(_bytes('<div><h1>title</h1> foo <p>boo</p></div>'),
+                          self.etree.tostring(root))
+        root.remove(root[0])
+        self.assertEqual(_bytes('<div><p>boo</p></div>'),
+                          self.etree.tostring(root))
+
+    def test_pi(self):
+        # lxml.etree separates target and text
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        ProcessingInstruction = self.etree.ProcessingInstruction
+
+        a = Element('a')
+        a.append(ProcessingInstruction('foo', 'some more text'))
+        self.assertEqual(a[0].target, 'foo')
+        self.assertEqual(a[0].text, 'some more text')
+
+    def test_pi_parse(self):
+        XML = self.etree.XML
+        root = XML(_bytes("<test><?mypi my test ?></test>"))
+        self.assertEqual(root[0].target, "mypi")
+        self.assertEqual(root[0].text, "my test ")
+
+    def test_pi_pseudo_attributes_get(self):
+        XML = self.etree.XML
+        root = XML(_bytes("<test><?mypi my='1' test=\" abc \" quotes=\"' '\" only names ?></test>"))
+        self.assertEqual(root[0].target, "mypi")
+        self.assertEqual(root[0].get('my'), "1")
+        self.assertEqual(root[0].get('test'), " abc ")
+        self.assertEqual(root[0].get('quotes'), "' '")
+        self.assertEqual(root[0].get('only'), None)
+        self.assertEqual(root[0].get('names'), None)
+        self.assertEqual(root[0].get('nope'), None)
+
+    def test_pi_pseudo_attributes_attrib(self):
+        XML = self.etree.XML
+        root = XML(_bytes("<test><?mypi my='1' test=\" abc \" quotes=\"' '\" only names ?></test>"))
+        self.assertEqual(root[0].target, "mypi")
+        self.assertEqual(root[0].attrib['my'], "1")
+        self.assertEqual(root[0].attrib['test'], " abc ")
+        self.assertEqual(root[0].attrib['quotes'], "' '")
+        self.assertRaises(KeyError, root[0].attrib.__getitem__, 'only')
+        self.assertRaises(KeyError, root[0].attrib.__getitem__, 'names')
+        self.assertRaises(KeyError, root[0].attrib.__getitem__, 'nope')
+
+    def test_deepcopy_pi(self):
+        # previously caused a crash
+        ProcessingInstruction = self.etree.ProcessingInstruction
+        
+        a = ProcessingInstruction("PI", "ONE")
+        b = copy.deepcopy(a)
+        b.text = "ANOTHER"
+
+        self.assertEqual('ONE',     a.text)
+        self.assertEqual('ANOTHER', b.text)
+
+    def test_deepcopy_elementtree_pi(self):
+        XML = self.etree.XML
+        tostring = self.etree.tostring
+        root = XML(_bytes("<?mypi my test ?><test/><!--comment -->"))
+        tree1 = self.etree.ElementTree(root)
+        self.assertEqual(_bytes("<?mypi my test ?><test/><!--comment -->"),
+                          tostring(tree1))
+
+        tree2 = copy.deepcopy(tree1)
+        self.assertEqual(_bytes("<?mypi my test ?><test/><!--comment -->"),
+                          tostring(tree2))
+
+        root2 = copy.deepcopy(tree1.getroot())
+        self.assertEqual(_bytes("<test/>"),
+                          tostring(root2))
+
+    def test_deepcopy_elementtree_dtd(self):
+        XML = self.etree.XML
+        tostring = self.etree.tostring
+        xml = _bytes('<!DOCTYPE test [\n<!ENTITY entity "tasty">\n]>\n<test/>')
+        root = XML(xml)
+        tree1 = self.etree.ElementTree(root)
+        self.assertEqual(xml, tostring(tree1))
+
+        tree2 = copy.deepcopy(tree1)
+        self.assertEqual(xml, tostring(tree2))
+
+        root2 = copy.deepcopy(tree1.getroot())
+        self.assertEqual(_bytes("<test/>"),
+                          tostring(root2))
+
+    def test_attribute_set(self):
+        # ElementTree accepts arbitrary attribute values
+        # lxml.etree allows only strings
+        Element = self.etree.Element
+
+        root = Element("root")
+        root.set("attr", "TEST")
+        self.assertEqual("TEST", root.get("attr"))
+        self.assertRaises(TypeError, root.set, "newattr", 5)
+
+    def test_parse_remove_comments(self):
+        fromstring = self.etree.fromstring
+        tostring = self.etree.tostring
+        XMLParser = self.etree.XMLParser
+
+        xml = _bytes('<a><!--A--><b><!-- B --><c/></b><!--C--></a>')
+        parser = XMLParser(remove_comments=True)
+        root = fromstring(xml, parser)
+        self.assertEqual(
+            _bytes('<a><b><c/></b></a>'),
+            tostring(root))
+
+    def test_parse_remove_pis(self):
+        parse = self.etree.parse
+        tostring = self.etree.tostring
+        XMLParser = self.etree.XMLParser
+
+        xml = _bytes('<?test?><a><?A?><b><?B?><c/></b><?C?></a><?tail?>')
+
+        f = BytesIO(xml)
+        tree = parse(f)
+        self.assertEqual(
+            xml,
+            tostring(tree))
+
+        parser = XMLParser(remove_pis=True)
+        tree = parse(f, parser)
+        self.assertEqual(
+            _bytes('<a><b><c/></b></a>'),
+            tostring(tree))
+
+    def test_parse_parser_type_error(self):
+        # ET raises IOError only
+        parse = self.etree.parse
+        self.assertRaises(TypeError, parse, 'notthere.xml', object())
+
+    def test_iterparse_tree_comments(self):
+        # ET removes comments
+        iterparse = self.etree.iterparse
+        tostring = self.etree.tostring
+
+        f = BytesIO('<a><!--A--><b><!-- B --><c/></b><!--C--></a>')
+        events = list(iterparse(f))
+        root = events[-1][1]
+        self.assertEqual(3, len(events))
+        self.assertEqual(
+            _bytes('<a><!--A--><b><!-- B --><c/></b><!--C--></a>'),
+            tostring(root))
+
+    def test_iterparse_comments(self):
+        # ET removes comments
+        iterparse = self.etree.iterparse
+        tostring = self.etree.tostring
+
+        def name(event, el):
+            if event == 'comment':
+                return el.text
+            else:
+                return el.tag
+
+        f = BytesIO('<a><!--A--><b><!-- B --><c/></b><!--C--></a>')
+        events = list(iterparse(f, events=('end', 'comment')))
+        root = events[-1][1]
+        self.assertEqual(6, len(events))
+        self.assertEqual(['A', ' B ', 'c', 'b', 'C', 'a'],
+                          [ name(*item) for item in events ])
+        self.assertEqual(
+            _bytes('<a><!--A--><b><!-- B --><c/></b><!--C--></a>'),
+            tostring(root))
+
+    def test_iterparse_pis(self):
+        # ET removes pis
+        iterparse = self.etree.iterparse
+        tostring = self.etree.tostring
+        ElementTree = self.etree.ElementTree
+
+        def name(event, el):
+            if event == 'pi':
+                return (el.target, el.text)
+            else:
+                return el.tag
+
+        f = BytesIO('<?pia a?><a><?pib b?><b><?pic c?><c/></b><?pid d?></a><?pie e?>')
+        events = list(iterparse(f, events=('end', 'pi')))
+        root = events[-2][1]
+        self.assertEqual(8, len(events))
+        self.assertEqual([('pia','a'), ('pib','b'), ('pic','c'), 'c', 'b',
+                           ('pid','d'), 'a', ('pie','e')],
+                          [ name(*item) for item in events ])
+        self.assertEqual(
+            _bytes('<?pia a?><a><?pib b?><b><?pic c?><c/></b><?pid d?></a><?pie e?>'),
+            tostring(ElementTree(root)))
+
+    def test_iterparse_remove_comments(self):
+        iterparse = self.etree.iterparse
+        tostring = self.etree.tostring
+
+        f = BytesIO('<a><!--A--><b><!-- B --><c/></b><!--C--></a>')
+        events = list(iterparse(f, remove_comments=True,
+                                events=('end', 'comment')))
+        root = events[-1][1]
+        self.assertEqual(3, len(events))
+        self.assertEqual(['c', 'b', 'a'],
+                          [ el.tag for (event, el) in events ])
+        self.assertEqual(
+            _bytes('<a><b><c/></b></a>'),
+            tostring(root))
+
+    def test_iterparse_broken(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<a><b><c/></a>')
+        # ET raises ExpatError, lxml raises XMLSyntaxError
+        self.assertRaises(self.etree.XMLSyntaxError, list, iterparse(f))
+
+    def test_iterparse_broken_recover(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<a><b><c/></a>')
+        it = iterparse(f, events=('start', 'end'), recover=True)
+        events = [(ev, el.tag) for ev, el in it]
+        root = it.root
+        self.assertTrue(root is not None)
+
+        self.assertEqual(1, events.count(('start', 'a')))
+        self.assertEqual(1, events.count(('end', 'a')))
+
+        self.assertEqual(1, events.count(('start', 'b')))
+        self.assertEqual(1, events.count(('end', 'b')))
+
+        self.assertEqual(1, events.count(('start', 'c')))
+        self.assertEqual(1, events.count(('end', 'c')))
+
+    def test_iterparse_broken_multi_recover(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<a><b><c/></d><b><c/></a></b>')
+        it = iterparse(f, events=('start', 'end'), recover=True)
+        events = [(ev, el.tag) for ev, el in it]
+        root = it.root
+        self.assertTrue(root is not None)
+
+        self.assertEqual(1, events.count(('start', 'a')))
+        self.assertEqual(1, events.count(('end', 'a')))
+
+        self.assertEqual(2, events.count(('start', 'b')))
+        self.assertEqual(2, events.count(('end', 'b')))
+
+        self.assertEqual(2, events.count(('start', 'c')))
+        self.assertEqual(2, events.count(('end', 'c')))
+
+    def test_iterparse_strip(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO("""
+               <a>  \n \n  <b> b test </b>  \n
+
+               \n\t <c> \n </c> </a>  \n """)
+        iterator = iterparse(f, remove_blank_text=True)
+        text = [ (element.text, element.tail)
+                 for event, element in iterator ]
+        self.assertEqual(
+            [(" b test ", None), (" \n ", None), (None, None)],
+            text)
+
+    def test_iterparse_tag(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<a><b><d/></b><c/></a>')
+
+        iterator = iterparse(f, tag="b", events=('start', 'end'))
+        events = list(iterator)
+        root = iterator.root
+        self.assertEqual(
+            [('start', root[0]), ('end', root[0])],
+            events)
+
+    def test_iterparse_tag_all(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<a><b><d/></b><c/></a>')
+
+        iterator = iterparse(f, tag="*", events=('start', 'end'))
+        events = list(iterator)
+        self.assertEqual(
+            8,
+            len(events))
+
+    def test_iterparse_tag_ns(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<a xmlns="urn:test:1"><b><d/></b><c/></a>')
+
+        iterator = iterparse(f, tag="{urn:test:1}b", events=('start', 'end'))
+        events = list(iterator)
+        root = iterator.root
+        self.assertEqual(
+            [('start', root[0]), ('end', root[0])],
+            events)
+
+    def test_iterparse_tag_ns_empty(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<a><b><d/></b><c/></a>')
+        iterator = iterparse(f, tag="{}b", events=('start', 'end'))
+        events = list(iterator)
+        root = iterator.root
+        self.assertEqual(
+            [('start', root[0]), ('end', root[0])],
+            events)
+
+        f = BytesIO('<a xmlns="urn:test:1"><b><d/></b><c/></a>')
+        iterator = iterparse(f, tag="{}b", events=('start', 'end'))
+        events = list(iterator)
+        root = iterator.root
+        self.assertEqual([], events)
+
+    def test_iterparse_tag_ns_all(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<a xmlns="urn:test:1"><b><d/></b><c/></a>')
+        iterator = iterparse(f, tag="{urn:test:1}*", events=('start', 'end'))
+        events = list(iterator)
+        self.assertEqual(8, len(events))
+
+    def test_iterparse_tag_ns_empty_all(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<a xmlns="urn:test:1"><b><d/></b><c/></a>')
+        iterator = iterparse(f, tag="{}*", events=('start', 'end'))
+        events = list(iterator)
+        self.assertEqual([], events)
+
+        f = BytesIO('<a><b><d/></b><c/></a>')
+        iterator = iterparse(f, tag="{}*", events=('start', 'end'))
+        events = list(iterator)
+        self.assertEqual(8, len(events))
+
+    def test_iterparse_encoding_error(self):
+        text = _str('Søk på nettet')
+        wrong_declaration = "<?xml version='1.0' encoding='UTF-8'?>"
+        xml_latin1 = (_str('%s<a>%s</a>') % (wrong_declaration, text)
+                      ).encode('iso-8859-1')
+
+        self.assertRaises(self.etree.ParseError,
+                          list, self.etree.iterparse(BytesIO(xml_latin1)))
+
+    def test_iterparse_encoding_8bit_override(self):
+        text = _str('Søk på nettet', encoding="UTF-8")
+        wrong_declaration = "<?xml version='1.0' encoding='UTF-8'?>"
+        xml_latin1 = (_str('%s<a>%s</a>') % (wrong_declaration, text)
+                      ).encode('iso-8859-1')
+
+        iterator = self.etree.iterparse(BytesIO(xml_latin1),
+                                        encoding="iso-8859-1")
+        self.assertEqual(1, len(list(iterator)))
+
+        a = iterator.root
+        self.assertEqual(a.text, text)
+
+    def test_iterparse_keep_cdata(self):
+        tostring = self.etree.tostring
+        f = BytesIO('<root><![CDATA[test]]></root>')
+        context = self.etree.iterparse(f, strip_cdata=False)
+        content = [ el.text for event,el in context ]
+
+        self.assertEqual(['test'], content)
+        self.assertEqual(_bytes('<root><![CDATA[test]]></root>'),
+                          tostring(context.root))
+
+    def test_parser_encoding_unknown(self):
+        self.assertRaises(
+            LookupError, self.etree.XMLParser, encoding="hopefully unknown")
+
+    def test_parser_encoding(self):
+        self.etree.XMLParser(encoding="ascii")
+        self.etree.XMLParser(encoding="utf-8")
+        self.etree.XMLParser(encoding="iso-8859-1")
+
+    def test_feed_parser_recover(self):
+        parser = self.etree.XMLParser(recover=True)
+
+        parser.feed('<?xml version=')
+        parser.feed('"1.0"?><ro')
+        parser.feed('ot><')
+        parser.feed('a test="works"')
+        parser.feed('><othertag/></root') # <a> not closed!
+        parser.feed('>')
+
+        root = parser.close()
+
+        self.assertEqual(root.tag, "root")
+        self.assertEqual(len(root), 1)
+        self.assertEqual(root[0].tag, "a")
+        self.assertEqual(root[0].get("test"), "works")
+        self.assertEqual(len(root[0]), 1)
+        self.assertEqual(root[0][0].tag, "othertag")
+        # FIXME: would be nice to get some errors logged ...
+        #self.assertTrue(len(parser.error_log) > 0, "error log is empty")
+
+    def test_elementtree_parser_target_type_error(self):
+        assertEqual = self.assertEqual
+        assertFalse  = self.assertFalse
+
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start")
+                assertFalse(attrib)
+                assertEqual("TAG", tag)
+            def end(self, tag):
+                events.append("end")
+                assertEqual("TAG", tag)
+            def close(self):
+                return "DONE" # no Element!
+
+        parser = self.etree.XMLParser(target=Target())
+        tree = self.etree.ElementTree()
+
+        self.assertRaises(TypeError,
+                          tree.parse, BytesIO("<TAG/>"), parser=parser)
+        self.assertEqual(["start", "end"], events)
+
+    def test_parser_target_feed_exception(self):
+        # ET doesn't call .close() on errors; this test expects the target's close() to run
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start-" + tag)
+            def end(self, tag):
+                events.append("end-" + tag)
+                if tag == 'a':
+                    raise ValueError("dead and gone")
+            def data(self, data):
+                events.append("data-" + data)
+            def close(self):
+                events.append("close")
+                return "DONE"
+
+        parser = self.etree.XMLParser(target=Target())
+
+        try:
+            parser.feed(_bytes('<root>A<a>ca</a>B</root>'))
+            done = parser.close()
+            self.fail("error expected, but parsing succeeded")
+        except ValueError:
+            done = 'value error received as expected'
+
+        self.assertEqual(["start-root", "data-A", "start-a",
+                           "data-ca", "end-a", "close"],
+                          events)
+
+    def test_parser_target_fromstring_exception(self):
+        # ET doesn't call .close() on errors; this test expects the target's close() to run
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start-" + tag)
+            def end(self, tag):
+                events.append("end-" + tag)
+                if tag == 'a':
+                    raise ValueError("dead and gone")
+            def data(self, data):
+                events.append("data-" + data)
+            def close(self):
+                events.append("close")
+                return "DONE"
+
+        parser = self.etree.XMLParser(target=Target())
+
+        try:
+            done = self.etree.fromstring(_bytes('<root>A<a>ca</a>B</root>'),
+                                         parser=parser)
+            self.fail("error expected, but parsing succeeded")
+        except ValueError:
+            done = 'value error received as expected'
+
+        self.assertEqual(["start-root", "data-A", "start-a",
+                           "data-ca", "end-a", "close"],
+                          events)
+
+    def test_parser_target_comment(self):
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start-" + tag)
+            def end(self, tag):
+                events.append("end-" + tag)
+            def data(self, data):
+                events.append("data-" + data)
+            def comment(self, text):
+                events.append("comment-" + text)
+            def close(self):
+                return "DONE"
+
+        parser = self.etree.XMLParser(target=Target())
+
+        parser.feed(_bytes('<!--a--><root>A<!--b--><sub/><!--c-->B</root><!--d-->'))
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual(["comment-a", "start-root", "data-A", "comment-b",
+                           "start-sub", "end-sub", "comment-c", "data-B",
+                           "end-root", "comment-d"],
+                          events)
+
+    def test_parser_target_pi(self):
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start-" + tag)
+            def end(self, tag):
+                events.append("end-" + tag)
+            def data(self, data):
+                events.append("data-" + data)
+            def pi(self, target, data):
+                events.append("pi-" + target + "-" + data)
+            def close(self):
+                return "DONE"
+
+        parser = self.etree.XMLParser(target=Target())
+
+        parser.feed(_bytes('<?test a?><root>A<?test b?>B</root><?test c?>'))
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual(["pi-test-a", "start-root", "data-A", "pi-test-b",
+                           "data-B", "end-root", "pi-test-c"],
+                          events)
+
+    def test_parser_target_cdata(self):
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start-" + tag)
+            def end(self, tag):
+                events.append("end-" + tag)
+            def data(self, data):
+                events.append("data-" + data)
+            def close(self):
+                return "DONE"
+
+        parser = self.etree.XMLParser(target=Target(),
+                                      strip_cdata=False)
+
+        parser.feed(_bytes('<root>A<a><![CDATA[ca]]></a>B</root>'))
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual(["start-root", "data-A", "start-a",
+                           "data-ca", "end-a", "data-B", "end-root"],
+                          events)
+
+    def test_parser_target_recover(self):
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append("start-" + tag)
+            def end(self, tag):
+                events.append("end-" + tag)
+            def data(self, data):
+                events.append("data-" + data)
+            def close(self):
+                events.append("close")
+                return "DONE"
+
+        parser = self.etree.XMLParser(target=Target(),
+                                      recover=True)
+
+        parser.feed(_bytes('<root>A<a>ca</a>B</not-root>'))
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual(["start-root", "data-A", "start-a",
+                           "data-ca", "end-a", "data-B",
+                           "end-root", "close"],
+                          events)
+
+    def test_iterwalk_tag(self):
+        iterwalk = self.etree.iterwalk
+        root = self.etree.XML(_bytes('<a><b><d/></b><c/></a>'))
+
+        iterator = iterwalk(root, tag="b", events=('start', 'end'))
+        events = list(iterator)
+        self.assertEqual(
+            [('start', root[0]), ('end', root[0])],
+            events)
+
+    def test_iterwalk_tag_all(self):
+        iterwalk = self.etree.iterwalk
+        root = self.etree.XML(_bytes('<a><b><d/></b><c/></a>'))
+
+        iterator = iterwalk(root, tag="*", events=('start', 'end'))
+        events = list(iterator)
+        self.assertEqual(
+            8,
+            len(events))
+
+    def test_iterwalk(self):
+        iterwalk = self.etree.iterwalk
+        root = self.etree.XML(_bytes('<a><b></b><c/></a>'))
+
+        events = list(iterwalk(root))
+        self.assertEqual(
+            [('end', root[0]), ('end', root[1]), ('end', root)],
+            events)
+
+    def test_iterwalk_start(self):
+        iterwalk = self.etree.iterwalk
+        root = self.etree.XML(_bytes('<a><b></b><c/></a>'))
+
+        iterator = iterwalk(root, events=('start',))
+        events = list(iterator)
+        self.assertEqual(
+            [('start', root), ('start', root[0]), ('start', root[1])],
+            events)
+
+    def test_iterwalk_start_end(self):
+        iterwalk = self.etree.iterwalk
+        root = self.etree.XML(_bytes('<a><b></b><c/></a>'))
+
+        iterator = iterwalk(root, events=('start','end'))
+        events = list(iterator)
+        self.assertEqual(
+            [('start', root), ('start', root[0]), ('end', root[0]),
+             ('start', root[1]), ('end', root[1]), ('end', root)],
+            events)
+
+    def test_iterwalk_clear(self):
+        iterwalk = self.etree.iterwalk
+        root = self.etree.XML(_bytes('<a><b></b><c/></a>'))
+
+        iterator = iterwalk(root)
+        for event, elem in iterator:
+            elem.clear()
+
+        self.assertEqual(0,
+                          len(root))
+
+    def test_iterwalk_attrib_ns(self):
+        iterwalk = self.etree.iterwalk
+        root = self.etree.XML(_bytes('<a xmlns="ns1"><b><c xmlns="ns2"/></b></a>'))
+
+        attr_name = '{testns}bla'
+        events = []
+        iterator = iterwalk(root, events=('start','end','start-ns','end-ns'))
+        for event, elem in iterator:
+            events.append(event)
+            if event == 'start':
+                if elem.tag != '{ns1}a':
+                    elem.set(attr_name, 'value')
+
+        self.assertEqual(
+            ['start-ns', 'start', 'start', 'start-ns', 'start',
+             'end', 'end-ns', 'end', 'end', 'end-ns'],
+            events)
+
+        self.assertEqual(
+            None,
+            root.get(attr_name))
+        self.assertEqual(
+            'value',
+            root[0].get(attr_name))
+
+    def test_iterwalk_getiterator(self):
+        iterwalk = self.etree.iterwalk
+        root = self.etree.XML(_bytes('<a><b><d/></b><c/></a>'))
+
+        counts = []
+        for event, elem in iterwalk(root):
+            counts.append(len(list(elem.getiterator())))
+        self.assertEqual(
+            [1,2,1,4],
+            counts)
+
+    def test_resolve_string_dtd(self):
+        parse = self.etree.parse
+        parser = self.etree.XMLParser(dtd_validation=True)
+        assertEqual = self.assertEqual
+        test_url = _str("__nosuch.dtd")
+
+        class MyResolver(self.etree.Resolver):
+            def resolve(self, url, id, context):
+                assertEqual(url, test_url)
+                return self.resolve_string(
+                    _str('''<!ENTITY myentity "%s">
+                        <!ELEMENT doc ANY>''') % url, context)
+
+        parser.resolvers.add(MyResolver())
+
+        xml = _str('<!DOCTYPE doc SYSTEM "%s"><doc>&myentity;</doc>') % test_url
+        tree = parse(StringIO(xml), parser)
+        root = tree.getroot()
+        self.assertEqual(root.text, test_url)
+
+    def test_resolve_bytes_dtd(self):
+        parse = self.etree.parse
+        parser = self.etree.XMLParser(dtd_validation=True)
+        assertEqual = self.assertEqual
+        test_url = _str("__nosuch.dtd")
+
+        class MyResolver(self.etree.Resolver):
+            def resolve(self, url, id, context):
+                assertEqual(url, test_url)
+                return self.resolve_string(
+                    (_str('''<!ENTITY myentity "%s">
+                             <!ELEMENT doc ANY>''') % url).encode('utf-8'),
+                    context)
+
+        parser.resolvers.add(MyResolver())
+
+        xml = _str('<!DOCTYPE doc SYSTEM "%s"><doc>&myentity;</doc>') % test_url
+        tree = parse(StringIO(xml), parser)
+        root = tree.getroot()
+        self.assertEqual(root.text, test_url)
+
+    def test_resolve_filelike_dtd(self):
+        parse = self.etree.parse
+        parser = self.etree.XMLParser(dtd_validation=True)
+        assertEqual = self.assertEqual
+        test_url = _str("__nosuch.dtd")
+
+        class MyResolver(self.etree.Resolver):
+            def resolve(self, url, id, context):
+                assertEqual(url, test_url)
+                return self.resolve_file(
+                    SillyFileLike(
+                        _str('''<!ENTITY myentity "%s">
+                        <!ELEMENT doc ANY>''') % url), context)
+
+        parser.resolvers.add(MyResolver())
+
+        xml = _str('<!DOCTYPE doc SYSTEM "%s"><doc>&myentity;</doc>') % test_url
+        tree = parse(StringIO(xml), parser)
+        root = tree.getroot()
+        self.assertEqual(root.text, test_url)
+
+    def test_resolve_filename_dtd(self):
+        parse = self.etree.parse
+        parser = self.etree.XMLParser(attribute_defaults=True)
+        assertEqual = self.assertEqual
+        test_url = _str("__nosuch.dtd")
+
+        class MyResolver(self.etree.Resolver):
+            def resolve(self, url, id, context):
+                assertEqual(url, test_url)
+                return self.resolve_filename(
+                    fileInTestDir('test.dtd'), context)
+
+        parser.resolvers.add(MyResolver())
+
+        xml = _str('<!DOCTYPE a SYSTEM "%s"><a><b/></a>') % test_url
+        tree = parse(StringIO(xml), parser)
+        root = tree.getroot()
+        self.assertEqual(
+            root.attrib,    {'default': 'valueA'})
+        self.assertEqual(
+            root[0].attrib, {'default': 'valueB'})
+
+    def test_resolve_filename_dtd_relative(self):
+        parse = self.etree.parse
+        parser = self.etree.XMLParser(attribute_defaults=True)
+        assertEqual = self.assertEqual
+        test_url = _str("__nosuch.dtd")
+
+        class MyResolver(self.etree.Resolver):
+            def resolve(self, url, id, context):
+                assertEqual(url, fileUrlInTestDir(test_url))
+                return self.resolve_filename(
+                    fileUrlInTestDir('test.dtd'), context)
+
+        parser.resolvers.add(MyResolver())
+
+        xml = _str('<!DOCTYPE a SYSTEM "%s"><a><b/></a>') % test_url
+        tree = parse(StringIO(xml), parser,
+                     base_url=fileUrlInTestDir('__test.xml'))
+        root = tree.getroot()
+        self.assertEqual(
+            root.attrib,    {'default': 'valueA'})
+        self.assertEqual(
+            root[0].attrib, {'default': 'valueB'})
+
+    def test_resolve_file_dtd(self):
+        parse = self.etree.parse
+        parser = self.etree.XMLParser(attribute_defaults=True)
+        assertEqual = self.assertEqual
+        test_url = _str("__nosuch.dtd")
+
+        class MyResolver(self.etree.Resolver):
+            def resolve(self, url, id, context):
+                assertEqual(url, test_url)
+                return self.resolve_file(
+                    open(fileInTestDir('test.dtd'), 'rb'), context)
+
+        parser.resolvers.add(MyResolver())
+
+        xml = _str('<!DOCTYPE a SYSTEM "%s"><a><b/></a>') % test_url
+        tree = parse(StringIO(xml), parser)
+        root = tree.getroot()
+        self.assertEqual(
+            root.attrib,    {'default': 'valueA'})
+        self.assertEqual(
+            root[0].attrib, {'default': 'valueB'})
+
+    def test_resolve_empty(self):
+        parse = self.etree.parse
+        parser = self.etree.XMLParser(load_dtd=True)
+        assertEqual = self.assertEqual
+        test_url = _str("__nosuch.dtd")
+
+        class check(object):
+            resolved = False
+
+        class MyResolver(self.etree.Resolver):
+            def resolve(self, url, id, context):
+                assertEqual(url, test_url)
+                check.resolved = True
+                return self.resolve_empty(context)
+
+        parser.resolvers.add(MyResolver())
+
+        xml = _str('<!DOCTYPE doc SYSTEM "%s"><doc>&myentity;</doc>') % test_url
+        self.assertRaises(etree.XMLSyntaxError, parse, StringIO(xml), parser)
+        self.assertTrue(check.resolved)
+
+    def test_resolve_error(self):
+        parse = self.etree.parse
+        parser = self.etree.XMLParser(dtd_validation=True)
+
+        class _LocalException(Exception):
+            pass
+
+        class MyResolver(self.etree.Resolver):
+            def resolve(self, url, id, context):
+                raise _LocalException
+
+        parser.resolvers.add(MyResolver())
+
+        xml = '<!DOCTYPE doc SYSTEM "test"><doc>&myentity;</doc>'
+        self.assertRaises(_LocalException, parse, BytesIO(xml), parser)
+
+    if etree.LIBXML_VERSION > (2,6,20):
+        def test_entity_parse(self):
+            parse = self.etree.parse
+            tostring = self.etree.tostring
+            parser = self.etree.XMLParser(resolve_entities=False)
+            Entity = self.etree.Entity
+
+            xml = _bytes('<!DOCTYPE doc SYSTEM "test"><doc>&myentity;</doc>')
+            tree = parse(BytesIO(xml), parser)
+            root = tree.getroot()
+            self.assertEqual(root[0].tag, Entity)
+            self.assertEqual(root[0].text, "&myentity;")
+            self.assertEqual(root[0].tail, None)
+            self.assertEqual(root[0].name, "myentity")
+
+            self.assertEqual(_bytes('<doc>&myentity;</doc>'),
+                              tostring(root))
+
+        def test_entity_restructure(self):
+            xml = _bytes('''<!DOCTYPE root [ <!ENTITY nbsp "&#160;"> ]>
+                <root>
+                  <child1/>
+                  <child2/>
+                  <child3>&nbsp;</child3>
+                </root>''')
+
+            parser = self.etree.XMLParser(resolve_entities=False)
+            root = etree.fromstring(xml, parser)
+            self.assertEqual([ el.tag for el in root ],
+                              ['child1', 'child2', 'child3'])
+
+            root[0] = root[-1]
+            self.assertEqual([ el.tag for el in root ],
+                              ['child3', 'child2'])
+            self.assertEqual(root[0][0].text, '&nbsp;')
+            self.assertEqual(root[0][0].name, 'nbsp')
+
+    def test_entity_append(self):
+        Entity = self.etree.Entity
+        Element = self.etree.Element
+        tostring = self.etree.tostring
+
+        root = Element("root")
+        root.append( Entity("test") )
+
+        self.assertEqual(root[0].tag, Entity)
+        self.assertEqual(root[0].text, "&test;")
+        self.assertEqual(root[0].tail, None)
+        self.assertEqual(root[0].name, "test")
+
+        self.assertEqual(_bytes('<root>&test;</root>'),
+                          tostring(root))
+
+    def test_entity_values(self):
+        Entity = self.etree.Entity
+        self.assertEqual(Entity("test").text, '&test;')
+        self.assertEqual(Entity("#17683").text, '&#17683;')
+        self.assertEqual(Entity("#x1768").text, '&#x1768;')
+        self.assertEqual(Entity("#x98AF").text, '&#x98AF;')
+
+    def test_entity_error(self):
+        Entity = self.etree.Entity
+        self.assertRaises(ValueError, Entity, 'a b c')
+        self.assertRaises(ValueError, Entity, 'a,b')
+        self.assertRaises(ValueError, Entity, 'a\0b')
+        self.assertRaises(ValueError, Entity, '#abc')
+        self.assertRaises(ValueError, Entity, '#xxyz')
+
+    def test_cdata(self):
+        CDATA = self.etree.CDATA
+        Element = self.etree.Element
+        tostring = self.etree.tostring
+
+        root = Element("root")
+        root.text = CDATA('test')
+
+        self.assertEqual('test',
+                          root.text)
+        self.assertEqual(_bytes('<root><![CDATA[test]]></root>'),
+                          tostring(root))
+
+    def test_cdata_type(self):
+        CDATA = self.etree.CDATA
+        Element = self.etree.Element
+        root = Element("root")
+
+        root.text = CDATA("test")
+        self.assertEqual('test', root.text)
+
+        root.text = CDATA(_str("test"))
+        self.assertEqual('test', root.text)
+
+        self.assertRaises(TypeError, CDATA, 1)
+
+    def test_cdata_errors(self):
+        CDATA = self.etree.CDATA
+        Element = self.etree.Element
+
+        root = Element("root")
+        cdata = CDATA('test')
+        
+        self.assertRaises(TypeError,
+                          setattr, root, 'tail', cdata)
+        self.assertRaises(TypeError,
+                          root.set, 'attr', cdata)
+        self.assertRaises(TypeError,
+                          operator.setitem, root.attrib, 'attr', cdata)
+
+    def test_cdata_parser(self):
+        tostring = self.etree.tostring
+        parser = self.etree.XMLParser(strip_cdata=False)
+        root = self.etree.XML(_bytes('<root><![CDATA[test]]></root>'), parser)
+
+        self.assertEqual('test', root.text)
+        self.assertEqual(_bytes('<root><![CDATA[test]]></root>'),
+                          tostring(root))
+
+    def test_cdata_xpath(self):
+        tostring = self.etree.tostring
+        parser = self.etree.XMLParser(strip_cdata=False)
+        root = self.etree.XML(_bytes('<root><![CDATA[test]]></root>'), parser)
+        self.assertEqual(_bytes('<root><![CDATA[test]]></root>'),
+                          tostring(root))
+
+        self.assertEqual(['test'], root.xpath('//text()'))
+
+    # raises TypeError in lxml.etree, AssertionError in ElementTree
+    def test_setitem_assert(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        a = Element('a')
+        b = SubElement(a, 'b')
+        
+        self.assertRaises(TypeError,
+                          a.__setitem__, 0, 'foo')
+
+    def test_append_error(self):
+        Element = self.etree.Element
+        root = Element('root')
+        # raises AssertionError in ElementTree
+        self.assertRaises(TypeError, root.append, None)
+        self.assertRaises(TypeError, root.extend, [None])
+        self.assertRaises(TypeError, root.extend, [Element('one'), None])
+        self.assertEqual('one', root[0].tag)
+
+    def test_append_recursive_error(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        root = Element('root')
+        self.assertRaises(ValueError, root.append, root)
+        child = SubElement(root, 'child')
+        self.assertRaises(ValueError, child.append, root)
+        child2 = SubElement(child, 'child2')
+        self.assertRaises(ValueError, child2.append, root)
+        self.assertRaises(ValueError, child2.append, child)
+        self.assertEqual('child2', root[0][0].tag)
+
+    def test_addnext(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        root = Element('root')
+        SubElement(root, 'a')
+        SubElement(root, 'b')
+
+        self.assertEqual(['a', 'b'],
+                          [c.tag for c in root])
+        root[1].addnext(root[0])
+        self.assertEqual(['b', 'a'],
+                          [c.tag for c in root])
+
+    def test_addprevious(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        root = Element('root')
+        SubElement(root, 'a')
+        SubElement(root, 'b')
+
+        self.assertEqual(['a', 'b'],
+                          [c.tag for c in root])
+        root[0].addprevious(root[1])
+        self.assertEqual(['b', 'a'],
+                          [c.tag for c in root])
+
+    def test_addprevious_noops(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        root = Element('root')
+        a = SubElement(root, 'a')
+        b = SubElement(root, 'b')
+        a.addprevious(a)
+        self.assertEqual('a', root[0].tag)
+        self.assertEqual('b', root[1].tag)
+        b.addprevious(b)
+        self.assertEqual('a', root[0].tag)
+        self.assertEqual('b', root[1].tag)
+        b.addprevious(a)
+        self.assertEqual('a', root[0].tag)
+        self.assertEqual('b', root[1].tag)
+
+    def test_addnext_noops(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        root = Element('root')
+        a = SubElement(root, 'a')
+        b = SubElement(root, 'b')
+        a.addnext(a)
+        self.assertEqual('a', root[0].tag)
+        self.assertEqual('b', root[1].tag)
+        b.addnext(b)
+        self.assertEqual('a', root[0].tag)
+        self.assertEqual('b', root[1].tag)
+        a.addnext(b)
+        self.assertEqual('a', root[0].tag)
+        self.assertEqual('b', root[1].tag)
+
+    def test_addnext_root(self):
+        Element = self.etree.Element
+        a = Element('a')
+        b = Element('b')
+        self.assertRaises(TypeError, a.addnext, b)
+
+    def test_addprevious_pi(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        PI = self.etree.PI
+        root = Element('root')
+        SubElement(root, 'a')
+        pi = PI('TARGET', 'TEXT')
+        pi.tail = "TAIL"
+
+        self.assertEqual(_bytes('<root><a></a></root>'),
+                          self._writeElement(root))
+        root[0].addprevious(pi)
+        self.assertEqual(_bytes('<root><?TARGET TEXT?>TAIL<a></a></root>'),
+                          self._writeElement(root))
+
+    def test_addprevious_root_pi(self):
+        Element = self.etree.Element
+        PI = self.etree.PI
+        root = Element('root')
+        pi = PI('TARGET', 'TEXT')
+        pi.tail = "TAIL"
+
+        self.assertEqual(_bytes('<root></root>'),
+                          self._writeElement(root))
+        root.addprevious(pi)
+        self.assertEqual(_bytes('<?TARGET TEXT?>\n<root></root>'),
+                          self._writeElement(root))
+
+    def test_addnext_pi(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        PI = self.etree.PI
+        root = Element('root')
+        SubElement(root, 'a')
+        pi = PI('TARGET', 'TEXT')
+        pi.tail = "TAIL"
+
+        self.assertEqual(_bytes('<root><a></a></root>'),
+                          self._writeElement(root))
+        root[0].addnext(pi)
+        self.assertEqual(_bytes('<root><a></a><?TARGET TEXT?>TAIL</root>'),
+                          self._writeElement(root))
+
+    def test_addnext_root_pi(self):
+        Element = self.etree.Element
+        PI = self.etree.PI
+        root = Element('root')
+        pi = PI('TARGET', 'TEXT')
+        pi.tail = "TAIL"
+
+        self.assertEqual(_bytes('<root></root>'),
+                          self._writeElement(root))
+        root.addnext(pi)
+        self.assertEqual(_bytes('<root></root>\n<?TARGET TEXT?>'),
+                          self._writeElement(root))
+
+    def test_addnext_comment(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        Comment = self.etree.Comment
+        root = Element('root')
+        SubElement(root, 'a')
+        comment = Comment('TEXT ')
+        comment.tail = "TAIL"
+
+        self.assertEqual(_bytes('<root><a></a></root>'),
+                          self._writeElement(root))
+        root[0].addnext(comment)
+        self.assertEqual(_bytes('<root><a></a><!--TEXT -->TAIL</root>'),
+                          self._writeElement(root))
+
+    def test_addnext_root_comment(self):
+        Element = self.etree.Element
+        Comment = self.etree.Comment
+        root = Element('root')
+        comment = Comment('TEXT ')
+        comment.tail = "TAIL"
+
+        self.assertEqual(_bytes('<root></root>'),
+                          self._writeElement(root))
+        root.addnext(comment)
+        self.assertEqual(_bytes('<root></root>\n<!--TEXT -->'),
+                          self._writeElement(root))
+
+    def test_addprevious_comment(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        Comment = self.etree.Comment
+        root = Element('root')
+        SubElement(root, 'a')
+        comment = Comment('TEXT ')
+        comment.tail = "TAIL"
+
+        self.assertEqual(_bytes('<root><a></a></root>'),
+                          self._writeElement(root))
+        root[0].addprevious(comment)
+        self.assertEqual(_bytes('<root><!--TEXT -->TAIL<a></a></root>'),
+                          self._writeElement(root))
+
+    def test_addprevious_root_comment(self):
+        Element = self.etree.Element
+        Comment = self.etree.Comment
+        root = Element('root')
+        comment = Comment('TEXT ')
+        comment.tail = "TAIL"
+
+        self.assertEqual(_bytes('<root></root>'),
+                          self._writeElement(root))
+        root.addprevious(comment)
+        self.assertEqual(_bytes('<!--TEXT -->\n<root></root>'),
+                          self._writeElement(root))
+
+    # ET's Elements have items() and keys(), but not values()
+    def test_attribute_values(self):
+        XML = self.etree.XML
+        
+        root = XML(_bytes('<doc alpha="Alpha" beta="Beta" gamma="Gamma"/>'))
+        values = root.values()
+        values.sort()
+        self.assertEqual(['Alpha', 'Beta', 'Gamma'], values)
+
+    # gives error in ElementTree
+    def test_comment_empty(self):
+        Element = self.etree.Element
+        Comment = self.etree.Comment
+
+        a = Element('a')
+        a.append(Comment())
+        self.assertEqual(
+            _bytes('<a><!----></a>'),
+            self._writeElement(a))
+
+    # ElementTree ignores comments
+    def test_comment_parse_empty(self):
+        ElementTree = self.etree.ElementTree
+        tostring = self.etree.tostring
+
+        xml = _bytes('<a><b/><!----><c/></a>')
+        f = BytesIO(xml)
+        doc = ElementTree(file=f)
+        a = doc.getroot()
+        self.assertEqual(
+            '',
+            a[1].text)
+        self.assertEqual(
+            xml,
+            tostring(a))
+
+    # ElementTree ignores comments
+    def test_comment_no_proxy_yet(self):
+        # Reads the text of a comment straight from a freshly parsed tree,
+        # without touching the comment node beforehand.
+        # The document literal goes through _bytes() so that BytesIO is
+        # always handed a byte string, as test_comment_parse_empty does.
+        ElementTree = self.etree.ElementTree
+
+        f = BytesIO(_bytes('<a><b></b><!-- hoi --><c></c></a>'))
+        doc = ElementTree(file=f)
+        a = doc.getroot()
+        self.assertEqual(' hoi ', a[1].text)
+
+    # does not raise an exception in ElementTree
+    def test_comment_immutable(self):
+        # A comment accepts neither child elements nor attributes; each
+        # attempt must raise TypeError.
+        etree = self.etree
+        comment = etree.Comment()
+        child = etree.Element('myel')
+
+        self.assertRaises(TypeError, comment.append, child)
+        self.assertRaises(TypeError, comment.insert, 0, child)
+        self.assertRaises(TypeError, comment.set, "myattr", "test")
+
+    def test_comment_immutable_attrib(self):
+        # The attrib mapping of a comment is empty: lookups find nothing,
+        # every view is empty, and item access raises KeyError.
+        c = self.etree.Comment()
+        self.assertEqual(0, len(c.attrib))
+
+        # membership tests, through each available route
+        self.assertFalse(c.attrib.__contains__('nope'))
+        self.assertFalse('nope' in c.attrib)
+        self.assertFalse('nope' in c.attrib.keys())
+        self.assertFalse('nope' in c.attrib.values())
+        self.assertFalse(('nope', 'huhu') in c.attrib.items())
+
+        # iteration, directly and through each view method
+        self.assertEqual([], list(c.attrib))
+        for view in ('keys', 'items', 'values',
+                     'iterkeys', 'iteritems', 'itervalues'):
+            self.assertEqual([], list(getattr(c.attrib, view)()))
+
+        # pop() honours a default but raises without one
+        self.assertEqual('HUHU', c.attrib.pop('nope', 'HUHU'))
+        self.assertRaises(KeyError, c.attrib.pop, 'nope')
+
+        for key in ('only', 'names', 'nope'):
+            self.assertRaises(KeyError, c.attrib.__getitem__, key)
+        self.assertRaises(KeyError, c.attrib.__setitem__, 'nope', 'yep')
+        self.assertRaises(KeyError, c.attrib.__delitem__, 'nope')
+
+    # test passing 'None' to dump()
+    def test_dump_none(self):
+        # dump() must reject None with a TypeError.
+        dump = self.etree.dump
+        self.assertRaises(TypeError, dump, None)
+
+    def test_prefix(self):
+        # .prefix is None for an element outside any namespace and the
+        # declared prefix for an element in a prefixed namespace.
+        # The document literal goes through _bytes() so that BytesIO is
+        # always handed a byte string, as test_comment_parse_empty does.
+        ElementTree = self.etree.ElementTree
+
+        f = BytesIO(
+            _bytes('<a xmlns:foo="http://www.infrae.com/ns/1"><foo:b/></a>'))
+        doc = ElementTree(file=f)
+        a = doc.getroot()
+        self.assertEqual(None, a.prefix)
+        self.assertEqual('foo', a[0].prefix)
+
+    def test_prefix_default_ns(self):
+        # Elements that live in a default (unprefixed) namespace report
+        # None as their prefix, both the root and its child.
+        # The document literal goes through _bytes() so that BytesIO is
+        # always handed a byte string, as test_comment_parse_empty does.
+        ElementTree = self.etree.ElementTree
+
+        f = BytesIO(_bytes('<a xmlns="http://www.infrae.com/ns/1"><b/></a>'))
+        doc = ElementTree(file=f)
+        a = doc.getroot()
+        self.assertEqual(None, a.prefix)
+        self.assertEqual(None, a[0].prefix)
+
+    def test_getparent(self):
+        # getparent() is None for the root and the containing element for
+        # every node below it.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+
+        self.assertEqual(None, a.getparent())
+        self.assertEqual(a, b.getparent())
+        self.assertEqual(b.getparent(), c.getparent())
+        self.assertEqual(b, d.getparent())
+
+    def test_iterchildren(self):
+        # iterchildren() yields the child elements in document order.
+        root = self.etree.XML(
+            _bytes('<doc><one/><two>Two</two>Hm<three/></doc>'))
+        tags = [child.tag for child in root.iterchildren()]
+        self.assertEqual(['one', 'two', 'three'], tags)
+
+    def test_iterchildren_reversed(self):
+        # reversed=True yields the child elements last to first.
+        root = self.etree.XML(
+            _bytes('<doc><one/><two>Two</two>Hm<three/></doc>'))
+        tags = [child.tag for child in root.iterchildren(reversed=True)]
+        self.assertEqual(['three', 'two', 'one'], tags)
+
+    def test_iterchildren_tag(self):
+        # The tag keyword restricts iteration to children with that tag.
+        root = self.etree.XML(
+            _bytes('<doc><one/><two>Two</two>Hm<two>Bla</two></doc>'))
+        texts = [child.text for child in root.iterchildren(tag='two')]
+        self.assertEqual(['Two', 'Bla'], texts)
+
+    def test_iterchildren_tag_posarg(self):
+        # The tag filter may also be given as a positional argument.
+        root = self.etree.XML(
+            _bytes('<doc><one/><two>Two</two>Hm<two>Bla</two></doc>'))
+        texts = [child.text for child in root.iterchildren('two')]
+        self.assertEqual(['Two', 'Bla'], texts)
+
+    def test_iterchildren_tag_reversed(self):
+        # Tag filtering combined with reversed iteration order.
+        root = self.etree.XML(
+            _bytes('<doc><one/><two>Two</two>Hm<two>Bla</two></doc>'))
+        texts = [child.text
+                 for child in root.iterchildren(reversed=True, tag='two')]
+        self.assertEqual(['Bla', 'Two'], texts)
+
+    def test_iterchildren_tag_multiple(self):
+        # A list of tags selects the children matching any of them.
+        root = self.etree.XML(
+            _bytes('<doc><one/><two>Two</two>Hm<two>Bla</two><three/></doc>'))
+        texts = [child.text
+                 for child in root.iterchildren(tag=['two', 'three'])]
+        self.assertEqual(['Two', 'Bla', None], texts)
+
+    def test_iterchildren_tag_multiple_posarg(self):
+        # Several tags may be passed as separate positional arguments.
+        root = self.etree.XML(
+            _bytes('<doc><one/><two>Two</two>Hm<two>Bla</two><three/></doc>'))
+        texts = [child.text for child in root.iterchildren('two', 'three')]
+        self.assertEqual(['Two', 'Bla', None], texts)
+
+    def test_iterchildren_tag_multiple_reversed(self):
+        # Multiple tag filters combined with reversed iteration order.
+        root = self.etree.XML(
+            _bytes('<doc><one/><two>Two</two>Hm<two>Bla</two><three/></doc>'))
+        texts = [
+            child.text
+            for child in root.iterchildren(reversed=True, tag=['two', 'three'])
+        ]
+        self.assertEqual([None, 'Bla', 'Two'], texts)
+
+    def test_iterancestors(self):
+        # iterancestors() walks from the parent up to the root; the root
+        # itself has no ancestors.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+
+        self.assertEqual([], list(a.iterancestors()))
+        self.assertEqual([a], list(b.iterancestors()))
+        self.assertEqual([a], list(c.iterancestors()))
+        self.assertEqual([b, a], list(d.iterancestors()))
+
+    def test_iterancestors_tag(self):
+        # A tag filter works both positionally and as keyword; '*' matches
+        # every ancestor.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+
+        for tag, expected in (('a', [a]), ('*', [b, a])):
+            self.assertEqual(expected, list(d.iterancestors(tag)))
+            self.assertEqual(expected, list(d.iterancestors(tag=tag)))
+
+    def test_iterancestors_tag_multiple(self):
+        # Several tags select the ancestors matching any of them, whether
+        # given as a tuple via tag= or as separate positional arguments.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+
+        cases = (
+            ([b, a], ('a', 'b')),
+            ([], ('w', 'x', 'y', 'z')),
+            ([], ('d', 'x')),       # 'd' is the start node, not an ancestor
+            ([b, a], ('b', '*')),
+            ([b], ('b', 'c')),      # 'c' is a sibling of b, not an ancestor
+        )
+        for expected, tags in cases:
+            self.assertEqual(expected, list(d.iterancestors(tag=tags)))
+            self.assertEqual(expected, list(d.iterancestors(*tags)))
+
+    def test_iterdescendants(self):
+        # iterdescendants() yields everything below the element in
+        # document order and nothing for a leaf.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+
+        self.assertEqual([b, d, c, e], list(a.iterdescendants()))
+        self.assertEqual([], list(d.iterdescendants()))
+
+    def test_iterdescendants_tag(self):
+        # A tag filter never matches the start element itself, only nodes
+        # below it.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+
+        self.assertEqual([], list(a.iterdescendants('a')))
+        self.assertEqual([], list(a.iterdescendants(tag='a')))
+
+        # add a nested element that carries the same tag as the root
+        a2 = etree.SubElement(e, 'a')
+        self.assertEqual([a2], list(a.iterdescendants('a')))
+
+        self.assertEqual([a2], list(c.iterdescendants('a')))
+        self.assertEqual([a2], list(c.iterdescendants(tag='a')))
+
+    def test_iterdescendants_tag_multiple(self):
+        # Several tags select the descendants matching any of them, whether
+        # given as a tuple via tag= or as separate positional arguments.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+
+        self.assertEqual(
+            [b, e], list(a.iterdescendants(tag=('a', 'b', 'e'))))
+        self.assertEqual(
+            [b, e], list(a.iterdescendants('a', 'b', 'e')))
+
+        # add a nested element that carries the same tag as the root
+        a2 = etree.SubElement(e, 'a')
+        cases = (
+            (a, [b, a2], ('a', 'b')),
+            (c, [], ('x', 'y', 'z')),
+            (a, [b, d, c, e, a2], ('x', 'y', 'z', '*')),
+        )
+        for start, expected, tags in cases:
+            self.assertEqual(expected, list(start.iterdescendants(tag=tags)))
+            self.assertEqual(expected, list(start.iterdescendants(*tags)))
+
+    def test_getroottree(self):
+        # getroottree() called on any node leads back to the same root.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+
+        self.assertEqual(a, a.getroottree().getroot())
+        self.assertEqual(a, b.getroottree().getroot())
+        self.assertEqual(a, d.getroottree().getroot())
+
+    def test_getnext(self):
+        # getnext() returns the following sibling, or None when there is
+        # none (root, last child).
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+
+        self.assertEqual(None, a.getnext())
+        self.assertEqual(c, b.getnext())
+        self.assertEqual(None, c.getnext())
+
+    def test_getprevious(self):
+        # getprevious() returns the preceding sibling, or None when there
+        # is none (root, first child).
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+
+        self.assertEqual(None, a.getprevious())
+        self.assertEqual(b, c.getprevious())
+        self.assertEqual(None, b.getprevious())
+
+    def test_itersiblings(self):
+        # itersiblings() yields following siblings by default and
+        # preceding ones with preceding=True.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+
+        self.assertEqual([], list(a.itersiblings()))
+        self.assertEqual([c], list(b.itersiblings()))
+        self.assertEqual([], list(c.itersiblings()))
+        self.assertEqual([b], list(c.itersiblings(preceding=True)))
+        self.assertEqual([], list(b.itersiblings(preceding=True)))
+
+    def test_itersiblings_tag(self):
+        # Tag filtering on sibling iteration, in both directions.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+
+        self.assertEqual([], list(a.itersiblings(tag='XXX')))
+        self.assertEqual([c], list(b.itersiblings(tag='c')))
+        self.assertEqual([c], list(b.itersiblings(tag='*')))
+        self.assertEqual([b], list(c.itersiblings(preceding=True, tag='b')))
+        self.assertEqual([], list(c.itersiblings(preceding=True, tag='c')))
+
+    def test_itersiblings_tag_multiple(self):
+        # A tuple of tags selects the siblings matching any of them;
+        # preceding siblings come back nearest first.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(a, 'e')
+
+        self.assertEqual([], list(a.itersiblings(tag=('XXX', 'YYY'))))
+        self.assertEqual([c, e], list(b.itersiblings(tag=('c', 'd', 'e'))))
+        self.assertEqual(
+            [b],
+            list(c.itersiblings(preceding=True, tag=('b', 'b', 'c', 'd'))))
+        self.assertEqual(
+            [c, b],
+            list(e.itersiblings(preceding=True, tag=('c', '*'))))
+
+    def test_parseid(self):
+        # parseid() returns the parsed tree together with a dict that maps
+        # ID values (DTD-declared ID attributes and xml:id) to elements.
+        etree = self.etree
+        xml_text = _bytes('''
+        <!DOCTYPE document [
+        <!ELEMENT document (h1,p)*>
+        <!ELEMENT h1 (#PCDATA)>
+        <!ATTLIST h1 myid ID #REQUIRED>
+        <!ELEMENT p  (#PCDATA)>
+        <!ATTLIST p  someid ID #REQUIRED>
+        ]>
+        <document>
+          <h1 myid="chapter1">...</h1>
+          <p id="note1" class="note">...</p>
+          <p>Regular paragraph.</p>
+          <p xml:id="xmlid">XML:ID paragraph.</p>
+          <p someid="warn1" class="warning">...</p>
+        </document>
+        ''')
+
+        tree, dic = etree.parseid(BytesIO(xml_text))
+        root = tree.getroot()
+        root2 = etree.XML(xml_text)
+        # the tree from parseid() must equal a plain parse of the same input
+        self.assertEqual(self._writeElement(root), self._writeElement(root2))
+
+        expected = {"chapter1": root[0], "xmlid": root[3], "warn1": root[4]}
+        for id_value in ("chapter1", "warn1", "xmlid"):
+            self.assertTrue(id_value in dic)
+        self._checkIDDict(dic, expected)
+
+    def test_XMLDTDID(self):
+        # XMLDTDID() parses from a string and returns the root element
+        # together with a dict that maps ID values to elements.
+        etree = self.etree
+        xml_text = _bytes('''
+        <!DOCTYPE document [
+        <!ELEMENT document (h1,p)*>
+        <!ELEMENT h1 (#PCDATA)>
+        <!ATTLIST h1 myid ID #REQUIRED>
+        <!ELEMENT p  (#PCDATA)>
+        <!ATTLIST p  someid ID #REQUIRED>
+        ]>
+        <document>
+          <h1 myid="chapter1">...</h1>
+          <p id="note1" class="note">...</p>
+          <p>Regular paragraph.</p>
+          <p xml:id="xmlid">XML:ID paragraph.</p>
+          <p someid="warn1" class="warning">...</p>
+        </document>
+        ''')
+
+        root, dic = etree.XMLDTDID(xml_text)
+        root2 = etree.XML(xml_text)
+        # the root from XMLDTDID() must equal a plain parse of the same input
+        self.assertEqual(self._writeElement(root), self._writeElement(root2))
+
+        expected = {"chapter1": root[0], "xmlid": root[3], "warn1": root[4]}
+        for id_value in ("chapter1", "warn1", "xmlid"):
+            self.assertTrue(id_value in dic)
+        self._checkIDDict(dic, expected)
+
+    def test_XMLDTDID_empty(self):
+        # Without a DTD (and without xml:id) the returned ID dict is empty.
+        etree = self.etree
+        xml_text = _bytes('''
+        <document>
+          <h1 myid="chapter1">...</h1>
+          <p id="note1" class="note">...</p>
+          <p>Regular paragraph.</p>
+          <p someid="warn1" class="warning">...</p>
+        </document>
+        ''')
+
+        root, dic = etree.XMLDTDID(xml_text)
+        root2 = etree.XML(xml_text)
+        self.assertEqual(self._writeElement(root), self._writeElement(root2))
+        self._checkIDDict(dic, {})
+
+    def _checkIDDict(self, dic, expected):
+        # Compare an ID dict against a plain dict of expected entries by
+        # length, items and keys.  The iter*() variants and the values are
+        # only compared when running on Python 2.
+        is_py2 = sys.version_info < (3,)
+
+        self.assertEqual(len(dic), len(expected))
+        self.assertEqual(sorted(dic.items()), sorted(expected.items()))
+        if is_py2:
+            self.assertEqual(
+                sorted(dic.iteritems()), sorted(expected.iteritems()))
+        self.assertEqual(sorted(dic.keys()), sorted(expected.keys()))
+        if is_py2:
+            self.assertEqual(
+                sorted(dic.iterkeys()), sorted(expected.iterkeys()))
+            self.assertEqual(
+                sorted(dic.values()), sorted(expected.values()))
+            self.assertEqual(
+                sorted(dic.itervalues()), sorted(expected.itervalues()))
+
+    def test_namespaces(self):
+        # A prefix supplied through nsmap is used for the element's
+        # prefix and in its serialisation.
+        nsmap = {'foo': 'http://ns.infrae.com/foo'}
+        elem = self.etree.Element('{http://ns.infrae.com/foo}bar', nsmap=nsmap)
+        self.assertEqual('foo', elem.prefix)
+        self.assertEqual(
+            _bytes('<foo:bar xmlns:foo="http://ns.infrae.com/foo"></foo:bar>'),
+            self._writeElement(elem))
+        
+    def test_namespaces_default(self):
+        # Mapping None to a namespace makes it the default namespace: the
+        # element has no prefix but keeps its qualified tag.
+        nsmap = {None: 'http://ns.infrae.com/foo'}
+        elem = self.etree.Element('{http://ns.infrae.com/foo}bar', nsmap=nsmap)
+        self.assertEqual(None, elem.prefix)
+        self.assertEqual('{http://ns.infrae.com/foo}bar', elem.tag)
+        self.assertEqual(
+            _bytes('<bar xmlns="http://ns.infrae.com/foo"></bar>'),
+            self._writeElement(elem))
+
+    def test_namespaces_default_and_attr(self):
+        # An attribute in a prefixed namespace is serialised with that
+        # prefix while the element itself uses the default namespace.
+        nsmap = {
+            None: 'http://ns.infrae.com/foo',
+            'hoi': 'http://ns.infrae.com/hoi',
+        }
+        elem = self.etree.Element('{http://ns.infrae.com/foo}bar', nsmap=nsmap)
+        elem.set('{http://ns.infrae.com/hoi}test', 'value')
+        self.assertEqual(
+            _bytes('<bar xmlns="http://ns.infrae.com/foo" xmlns:hoi="http://ns.infrae.com/hoi" hoi:test="value"></bar>'),
+            self._writeElement(elem))
+
+    def test_attribute_keeps_namespace_prefix_on_merge(self):
+        # After appending to a parent that declares the same namespace as
+        # its default, the element drops its prefix but the attribute
+        # keeps the prefixed declaration.
+        etree = self.etree
+        ns_attr = '{http://test/ns}attr'
+
+        root = etree.Element(
+            '{http://test/ns}root', nsmap={None: 'http://test/ns'})
+        sub = etree.Element(
+            '{http://test/ns}sub', nsmap={'test': 'http://test/ns'})
+
+        sub.attrib[ns_attr] = 'value'
+        self.assertEqual(sub.attrib[ns_attr], 'value')
+        self.assertEqual(
+            _bytes('<test:sub xmlns:test="http://test/ns" test:attr="value"/>'),
+            etree.tostring(sub))
+
+        root.append(sub)
+        self.assertEqual(
+            _bytes('<root xmlns="http://test/ns">'
+                   '<sub xmlns:test="http://test/ns" test:attr="value"/>'
+                   '</root>'),
+            etree.tostring(root))
+
+    def test_attribute_keeps_namespace_prefix_on_merge_with_nons(self):
+        # Appending to a parent without any namespace leaves the prefixed
+        # element and attribute serialisation unchanged.
+        etree = self.etree
+        ns_attr = '{http://test/ns}attr'
+
+        root = etree.Element('root')
+        sub = etree.Element(
+            '{http://test/ns}sub', nsmap={'test': 'http://test/ns'})
+
+        sub.attrib[ns_attr] = 'value'
+        self.assertEqual(sub.attrib[ns_attr], 'value')
+        self.assertEqual(
+            _bytes('<test:sub xmlns:test="http://test/ns" test:attr="value"/>'),
+            etree.tostring(sub))
+
+        root.append(sub)
+        self.assertEqual(
+            _bytes('<root>'
+                   '<test:sub xmlns:test="http://test/ns" test:attr="value"/>'
+                   '</root>'),
+            etree.tostring(root))
+
+    def test_attribute_gets_namespace_prefix_on_merge_with_nons(self):
+        # An attribute in the element's default namespace is serialised
+        # with a generated prefix (ns0), before and after the element is
+        # appended to a parent without namespaces.
+        etree = self.etree
+        ns_attr = '{http://test/ns}attr'
+
+        root = etree.Element('root')
+        sub = etree.Element(
+            '{http://test/ns}sub', nsmap={None: 'http://test/ns'})
+
+        sub.attrib[ns_attr] = 'value'
+        self.assertEqual(sub.attrib[ns_attr], 'value')
+        self.assertEqual(
+            _bytes('<sub xmlns="http://test/ns" '
+                   'xmlns:ns0="http://test/ns" ns0:attr="value"/>'),
+            etree.tostring(sub))
+
+        root.append(sub)
+        self.assertEqual(
+            _bytes('<root>'
+                   '<sub xmlns="http://test/ns"'
+                   ' xmlns:ns0="http://test/ns" ns0:attr="value"/>'
+                   '</root>'),
+            etree.tostring(root))
+
+    def test_attribute_gets_namespace_prefix_on_merge(self):
+        # Standalone, the attribute gets a generated prefix (ns0); once
+        # appended to a parent that declares a prefix for the namespace,
+        # element and attribute are serialised with the parent's prefix.
+        etree = self.etree
+        ns_attr = '{http://test/ns}attr'
+
+        root = etree.Element(
+            '{http://test/ns}root',
+            nsmap={'test': 'http://test/ns', None: 'http://test/ns'})
+        sub = etree.Element(
+            '{http://test/ns}sub', nsmap={None: 'http://test/ns'})
+
+        sub.attrib[ns_attr] = 'value'
+        self.assertEqual(sub.attrib[ns_attr], 'value')
+        self.assertEqual(
+            _bytes('<sub xmlns="http://test/ns" '
+                   'xmlns:ns0="http://test/ns" ns0:attr="value"/>'),
+            etree.tostring(sub))
+
+        root.append(sub)
+        self.assertEqual(
+            _bytes('<test:root xmlns:test="http://test/ns" xmlns="http://test/ns">'
+                   '<test:sub test:attr="value"/>'
+                   '</test:root>'),
+            etree.tostring(root))
+
+    def test_namespaces_elementtree(self):
+        # A subelement added after the root was wrapped in an ElementTree
+        # reuses the prefix declared in the root's nsmap.
+        etree = self.etree
+        nsmap = {
+            None: 'http://ns.infrae.com/foo',
+            'hoi': 'http://ns.infrae.com/hoi',
+        }
+        e = etree.Element('{http://ns.infrae.com/foo}z', nsmap=nsmap)
+        tree = etree.ElementTree(element=e)
+        etree.SubElement(e, '{http://ns.infrae.com/hoi}x')
+        self.assertEqual(
+            _bytes('<z xmlns="http://ns.infrae.com/foo" xmlns:hoi="http://ns.infrae.com/hoi"><hoi:x></hoi:x></z>'),
+            self._writeElement(e))
+
+    def test_namespaces_default_copy_element(self):
+        # Two elements sharing one default namespace stay unprefixed and
+        # keep their qualified tags after one is appended to the other.
+        etree = self.etree
+        qualified_tag = '{http://ns.infrae.com/foo}bar'
+        nsmap = {None: 'http://ns.infrae.com/foo'}
+        e1 = etree.Element(qualified_tag, nsmap=nsmap)
+        e2 = etree.Element(qualified_tag, nsmap=nsmap)
+
+        e1.append(e2)
+
+        self.assertEqual(None, e1.prefix)
+        self.assertEqual(None, e1[0].prefix)
+        self.assertEqual('{http://ns.infrae.com/foo}bar', e1.tag)
+        self.assertEqual('{http://ns.infrae.com/foo}bar', e1[0].tag)
+
+    def test_namespaces_copy_element(self):
+        # An element whose namespace differs from the default namespace of
+        # its nsmap ends up with a prefix; both tags stay unchanged.
+        etree = self.etree
+        nsmap = {None: 'http://ns.infrae.com/BAR'}
+        e1 = etree.Element('{http://ns.infrae.com/BAR}bar', nsmap=nsmap)
+        e2 = etree.Element('{http://ns.infrae.com/foo}bar', nsmap=nsmap)
+
+        e1.append(e2)
+
+        self.assertEqual(None, e1.prefix)
+        self.assertNotEqual(None, e2.prefix)
+        self.assertEqual('{http://ns.infrae.com/BAR}bar', e1.tag)
+        self.assertEqual('{http://ns.infrae.com/foo}bar', e2.tag)
+
+    def test_namespaces_reuse_after_move(self):
+        # An element moved into another document keeps its namespace and
+        # reuses the matching declaration of its new parent.
+        etree = self.etree
+        ns_href = "http://a.b.c"
+        one = etree.fromstring(
+            _bytes('<foo><bar xmlns:ns="%s"><ns:baz/></bar></foo>' % ns_href))
+        baz = one[0][0]
+
+        two = etree.fromstring(_bytes('<root xmlns:ns="%s"/>' % ns_href))
+        two.append(baz)
+        del one # make sure the source document is deallocated
+
+        self.assertEqual('{%s}baz' % ns_href, baz.tag)
+        self.assertEqual(
+            _bytes('<root xmlns:ns="%s"><ns:baz/></root>' % ns_href),
+            etree.tostring(two))
+
+    def test_namespace_cleanup(self):
+        # cleanup_namespaces() removes the xmlns:x and xmlns:b
+        # declarations, which no element in the tree uses, and keeps the
+        # remaining ones.
+        etree = self.etree
+        xml = _bytes('<foo xmlns="F" xmlns:x="x"><bar xmlns:ns="NS" xmlns:b="b" xmlns="B"><ns:baz/></bar></foo>')
+        root = etree.fromstring(xml)
+        self.assertEqual(xml, etree.tostring(root))
+
+        etree.cleanup_namespaces(root)
+        self.assertEqual(
+            _bytes('<foo xmlns="F"><bar xmlns:ns="NS" xmlns="B"><ns:baz/></bar></foo>'),
+            etree.tostring(root))
+
+    def test_element_nsmap(self):
+        # .nsmap reports the mapping the element was created with.
+        nsmap = {
+            None: 'http://ns.infrae.com/foo',
+            'hoi': 'http://ns.infrae.com/hoi',
+        }
+        elem = self.etree.Element('{http://ns.infrae.com/foo}bar', nsmap=nsmap)
+        self.assertEqual(nsmap, elem.nsmap)
+
+    def test_subelement_nsmap(self):
+        # A subelement's nsmap is its parent's mapping updated with its
+        # own declarations; the parent's nsmap stays as it was.
+        etree = self.etree
+
+        parent_map = {
+            None: 'http://ns.infrae.com/foo',
+            'hoi': 'http://ns.infrae.com/hoi',
+        }
+        parent = etree.Element(
+            '{http://ns.infrae.com/foo}bar', nsmap=parent_map)
+
+        child_map = {
+            None: 'http://ns.infrae.com/honk',
+            'top': 'http://ns.infrae.com/top',
+        }
+        child = etree.SubElement(
+            parent, '{http://ns.infrae.com/honk}bar', nsmap=child_map)
+
+        merged = parent_map.copy()
+        merged.update(child_map)
+        self.assertEqual(parent_map, parent.nsmap)
+        self.assertEqual(merged, child.nsmap)
+
+    def test_html_prefix_nsmap(self):
+        # An HTML element written with an undeclared prefix reports that
+        # prefix in nsmap, mapped to None.
+        html_root = self.etree.HTML(
+            '<hha:page-description>aa</hha:page-description>')
+        el = html_root.find('.//page-description')
+        self.assertEqual({'hha': None}, el.nsmap)
+
+    def test_getiterator_filter_multiple(self):
+        # Several positional tag filters select the nodes matching any of
+        # them, the start element included, in document order.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+        f = etree.SubElement(c, 'f')
+
+        self.assertEqual([a, b], list(a.getiterator('a', 'b')))
+        self.assertEqual([], list(a.getiterator('x', 'y')))
+        self.assertEqual([a, f], list(a.getiterator('f', 'a')))
+        self.assertEqual([c, e, f], list(c.getiterator('c', '*', 'a')))
+        # empty tuples as filters match nothing
+        self.assertEqual([], list(a.getiterator((), ())))
+
+    def test_getiterator_filter_multiple_tuple(self):
+        # The tag filters may also be passed as one tuple argument.
+        etree = self.etree
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        c = etree.SubElement(a, 'c')
+        d = etree.SubElement(b, 'd')
+        e = etree.SubElement(c, 'e')
+        f = etree.SubElement(c, 'f')
+
+        self.assertEqual([a, b], list(a.getiterator(('a', 'b'))))
+        self.assertEqual([], list(a.getiterator(('x', 'y'))))
+        self.assertEqual([a, f], list(a.getiterator(('f', 'a'))))
+        self.assertEqual([c, e, f], list(c.getiterator(('c', '*', 'a'))))
+        # an empty tuple matches nothing
+        self.assertEqual([], list(a.getiterator(())))
+
+    def test_getiterator_filter_namespace(self):
+        # Tag filters are namespace-aware: '{ns}name' matches exactly,
+        # '{ns}*' matches every name in ns, and a bare name or '{}name'
+        # matches only elements without a namespace.
+        etree = self.etree
+        a = etree.Element('{a}a')
+        b = etree.SubElement(a, '{a}b')
+        c = etree.SubElement(a, '{a}c')
+        d = etree.SubElement(b, '{b}d')
+        e = etree.SubElement(c, '{a}e')
+        f = etree.SubElement(c, '{b}f')
+        g = etree.SubElement(c, 'g')
+
+        self.assertEqual([a], list(a.getiterator('{a}a')))
+        self.assertEqual([], list(a.getiterator('{b}a')))
+        self.assertEqual([], list(a.getiterator('a')))
+        self.assertEqual([a, b, d, c, e, f, g], list(a.getiterator('*')))
+        self.assertEqual([f], list(c.getiterator('{b}*')))
+        self.assertEqual([d, f], list(a.getiterator('{b}*')))
+        self.assertEqual([g], list(a.getiterator('g')))
+        self.assertEqual([g], list(a.getiterator('{}g')))
+        self.assertEqual([g], list(a.getiterator('{}*')))
+
+    def test_getiterator_filter_local_name(self):
+        # '{*}name' matches a local name in any namespace or in none;
+        # '{*}*' matches every element.
+        etree = self.etree
+        a = etree.Element('{a}a')
+        b = etree.SubElement(a, '{nsA}b')
+        c = etree.SubElement(b, '{nsB}b')
+        d = etree.SubElement(a, 'b')
+        e = etree.SubElement(a, '{nsA}e')
+        f = etree.SubElement(e, '{nsB}e')
+        g = etree.SubElement(e, 'e')
+
+        self.assertEqual([b, c, d], list(a.getiterator('{*}b')))
+        self.assertEqual([e, f, g], list(a.getiterator('{*}e')))
+        self.assertEqual([a, b, c, d, e, f, g], list(a.getiterator('{*}*')))
+
+    def test_getiterator_filter_entities(self):
+        # Passing the Entity factory as filter yields only entity
+        # references, in document order.
+        etree = self.etree
+        Entity = etree.Entity
+
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        entity_b = Entity("TEST-b")
+        b.append(entity_b)
+
+        self.assertEqual([entity_b], list(a.getiterator(Entity)))
+
+        entity_a = Entity("TEST-a")
+        a.append(entity_a)
+
+        self.assertEqual([entity_b, entity_a], list(a.getiterator(Entity)))
+        self.assertEqual([entity_b], list(b.getiterator(Entity)))
+
+    def test_getiterator_filter_element(self):
+        # Passing the Element factory as filter yields only elements; the
+        # comment and the processing instruction are skipped.
+        etree = self.etree
+        Element = etree.Element
+
+        a = Element('a')
+        b = etree.SubElement(a, 'b')
+        a.append(etree.Comment("test"))
+        a.append(etree.PI("pi", "content"))
+        c = etree.SubElement(a, 'c')
+
+        self.assertEqual([a, b, c], list(a.getiterator(Element)))
+
+    def test_getiterator_filter_all_comment_pi(self):
+        # ElementTree iterates over everything here
+        # The '*' filter yields only the elements; the comment and the
+        # processing instruction are not part of the result.
+        etree = self.etree
+
+        a = etree.Element('a')
+        b = etree.SubElement(a, 'b')
+        a.append(etree.Comment("test"))
+        a.append(etree.PI("pi", "content"))
+        c = etree.SubElement(a, 'c')
+
+        self.assertEqual([a, b, c], list(a.getiterator('*')))
+
+    def test_elementtree_find_qname(self):
+        # find() on a tree accepts a QName and returns the matching
+        # direct child of the root.
+        etree = self.etree
+        root = etree.XML(_bytes('<a><b><c/></b><b/><c><b/></c></a>'))
+        tree = etree.ElementTree(root)
+        self.assertEqual(tree.find(etree.QName("c")), tree.getroot()[2])
+
+    def test_elementtree_findall_qname(self):
+        XML = self.etree.XML
+        ElementTree = self.etree.ElementTree
+        QName = self.etree.QName
+        tree = ElementTree(XML(_bytes('<a><b><c/></b><b/><c><b/></c></a>')))
+        self.assertEqual(len(list(tree.findall(QName("c")))), 1)
+
+    def test_elementtree_findall_ns_qname(self):
+        XML = self.etree.XML
+        ElementTree = self.etree.ElementTree
+        QName = self.etree.QName
+        tree = ElementTree(XML(
+                _bytes('<a xmlns:x="X" xmlns:y="Y"><x:b><c/></x:b><b/><c><x:b/><b/></c><b/></a>')))
+        self.assertEqual(len(list(tree.findall(QName("b")))), 2)
+        self.assertEqual(len(list(tree.findall(QName("X", "b")))), 1)
+
+    def test_findall_ns(self):
+        XML = self.etree.XML
+        root = XML(_bytes('<a xmlns:x="X" xmlns:y="Y"><x:b><c/></x:b><b/><c><x:b/><b/></c><b/></a>'))
+        self.assertEqual(len(root.findall(".//{X}b")), 2)
+        self.assertEqual(len(root.findall(".//{X}*")), 2)
+        self.assertEqual(len(root.findall(".//b")), 3)
+
+    def test_findall_different_nsmaps(self):
+        XML = self.etree.XML
+        root = XML(_bytes('<a xmlns:x="X" xmlns:y="Y"><x:b><c/></x:b><b/><c><x:b/><b/></c><y:b/></a>'))
+        nsmap = {'xx': 'X'}
+        self.assertEqual(len(root.findall(".//xx:b", namespaces=nsmap)), 2)
+        self.assertEqual(len(root.findall(".//xx:*", namespaces=nsmap)), 2)
+        self.assertEqual(len(root.findall(".//b", namespaces=nsmap)), 2)
+        nsmap = {'xx': 'Y'}
+        self.assertEqual(len(root.findall(".//xx:b", namespaces=nsmap)), 1)
+        self.assertEqual(len(root.findall(".//xx:*", namespaces=nsmap)), 1)
+        self.assertEqual(len(root.findall(".//b", namespaces=nsmap)), 2)
+
+    def test_findall_different_nsmaps(self):
+        XML = self.etree.XML
+        root = XML(_bytes('<a xmlns:x="X" xmlns:y="Y"><x:b><c/></x:b><b/><c><x:b/><b/></c><y:b/></a>'))
+        nsmap = {'xx': 'X'}
+        self.assertEqual(len(root.findall(".//xx:b", namespaces=nsmap)), 2)
+        self.assertEqual(len(root.findall(".//xx:*", namespaces=nsmap)), 2)
+        self.assertEqual(len(root.findall(".//b", namespaces=nsmap)), 2)
+        nsmap = {'xx': 'Y'}
+        self.assertEqual(len(root.findall(".//xx:b", namespaces=nsmap)), 1)
+        self.assertEqual(len(root.findall(".//xx:*", namespaces=nsmap)), 1)
+        self.assertEqual(len(root.findall(".//b", namespaces=nsmap)), 2)
+
+    def test_findall_syntax_error(self):
+        XML = self.etree.XML
+        root = XML(_bytes('<a><b><c/></b><b/><c><b/><b/></c><b/></a>'))
+        self.assertRaises(SyntaxError, root.findall, '')
+        self.assertRaises(SyntaxError, root.findall, '//')  # absolute path on Element
+        self.assertRaises(SyntaxError, root.findall, './//')
+
+    def test_index(self):
+        etree = self.etree
+        e = etree.Element('foo')
+        for i in range(10):
+            etree.SubElement(e, 'a%s' % i)
+        for i in range(10):
+            self.assertEqual(
+                i,
+                e.index(e[i]))
+        self.assertEqual(
+            3, e.index(e[3], 3))
+        self.assertRaises(
+            ValueError, e.index, e[3], 4)
+        self.assertRaises(
+            ValueError, e.index, e[3], 0, 2)
+        self.assertRaises(
+            ValueError, e.index, e[8], 0, -3)
+        self.assertRaises(
+            ValueError, e.index, e[8], -5, -3)
+        self.assertEqual(
+            8, e.index(e[8], 0, -1))
+        self.assertEqual(
+            8, e.index(e[8], -12, -1))
+        self.assertEqual(
+            0, e.index(e[0], -12, -1))
+
+    def test_replace(self):
+        etree = self.etree
+        e = etree.Element('foo')
+        for i in range(10):
+            el = etree.SubElement(e, 'a%s' % i)
+            el.text = "text%d" % i
+            el.tail = "tail%d" % i
+
+        child0 = e[0]
+        child1 = e[1]
+        child2 = e[2]
+
+        e.replace(e[0], e[1])
+        self.assertEqual(
+            9, len(e))
+        self.assertEqual(
+            child1, e[0])
+        self.assertEqual(
+            child1.text, "text1")
+        self.assertEqual(
+            child1.tail, "tail1")
+        self.assertEqual(
+            child0.tail, "tail0")
+        self.assertEqual(
+            child2, e[1])
+
+        e.replace(e[-1], e[0])
+        self.assertEqual(
+            child1, e[-1])
+        self.assertEqual(
+            child1.text, "text1")
+        self.assertEqual(
+            child1.tail, "tail1")
+        self.assertEqual(
+            child2, e[0])
+
+    def test_replace_new(self):
+        etree = self.etree
+        e = etree.Element('foo')
+        for i in range(10):
+            etree.SubElement(e, 'a%s' % i)
+
+        new_element = etree.Element("test")
+        new_element.text = "TESTTEXT"
+        new_element.tail = "TESTTAIL"
+        child1 = e[1]
+        e.replace(e[0], new_element)
+        self.assertEqual(
+            new_element, e[0])
+        self.assertEqual(
+            "TESTTEXT",
+            e[0].text)
+        self.assertEqual(
+            "TESTTAIL",
+            e[0].tail)
+        self.assertEqual(
+            child1, e[1])
+
+    def test_setslice_all_empty_reversed(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        a = Element('a')
+
+        e = Element('e')
+        f = Element('f')
+        g = Element('g')
+
+        s = [e, f, g]
+        a[::-1] = s
+        self.assertEqual(
+            [g, f, e],
+            list(a))
+
+    def test_setslice_step(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        d = SubElement(a, 'd')
+        e = SubElement(a, 'e')
+
+        x = Element('x')
+        y = Element('y')
+
+        a[1::2] = [x, y]
+        self.assertEqual(
+            [b, x, d, y],
+            list(a))
+
+    def test_setslice_step_negative(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        d = SubElement(a, 'd')
+        e = SubElement(a, 'e')
+
+        x = Element('x')
+        y = Element('y')
+
+        a[1::-1] = [x, y]
+        self.assertEqual(
+            [y, x, d, e],
+            list(a))
+
+    def test_setslice_step_negative2(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        d = SubElement(a, 'd')
+        e = SubElement(a, 'e')
+
+        x = Element('x')
+        y = Element('y')
+
+        a[::-2] = [x, y]
+        self.assertEqual(
+            [b, y, d, x],
+            list(a))
+
+    def test_setslice_step_overrun(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        try:
+            slice
+        except NameError:
+            print("slice() not found")
+            return
+
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        d = SubElement(a, 'd')
+        e = SubElement(a, 'e')
+
+        x = Element('x')
+        y = Element('y')
+        z = Element('z')
+
+        self.assertRaises(
+            ValueError,
+            operator.setitem, a, slice(1,None,2), [x, y, z])
+
+        self.assertEqual(
+            [b, c, d, e],
+            list(a))
+
+    def test_sourceline_XML(self):
+        XML = self.etree.XML
+        root = XML(_bytes('''<?xml version="1.0"?>
+        <root><test>
+
+        <bla/></test>
+        </root>
+        '''))
+
+        self.assertEqual(
+            [2, 2, 4],
+            [ el.sourceline for el in root.getiterator() ])
+
+    def test_large_sourceline_XML(self):
+        XML = self.etree.XML
+        root = XML(_bytes(
+            '<?xml version="1.0"?>\n'
+            '<root>' + '\n' * 65536 +
+            '<p>' + '\n' * 65536 + '</p>\n' +
+            '<br/>\n'
+            '</root>'))
+
+        if self.etree.LIBXML_VERSION >= (2, 9):
+            expected = [2, 131074, 131076]
+        else:
+            expected = [2, 65535, 65535]
+
+        self.assertEqual(expected, [el.sourceline for el in root.iter()])
+
+    def test_sourceline_parse(self):
+        parse = self.etree.parse
+        tree = parse(fileInTestDir('include/test_xinclude.xml'))
+
+        self.assertEqual(
+            [1, 2, 3],
+            [ el.sourceline for el in tree.getiterator() ])
+
+    def test_sourceline_iterparse_end(self):
+        iterparse = self.etree.iterparse
+        lines = [ el.sourceline for (event, el) in 
+                  iterparse(fileInTestDir('include/test_xinclude.xml')) ]
+
+        self.assertEqual(
+            [2, 3, 1],
+            lines)
+
+    def test_sourceline_iterparse_start(self):
+        iterparse = self.etree.iterparse
+        lines = [ el.sourceline for (event, el) in 
+                  iterparse(fileInTestDir('include/test_xinclude.xml'),
+                            events=("start",)) ]
+
+        self.assertEqual(
+            [1, 2, 3],
+            lines)
+
+    def test_sourceline_element(self):
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        el = Element("test")
+        self.assertEqual(None, el.sourceline)
+
+        child = SubElement(el, "test")
+        self.assertEqual(None, el.sourceline)
+        self.assertEqual(None, child.sourceline)
+
+    def test_XML_base_url_docinfo(self):
+        etree = self.etree
+        root = etree.XML(_bytes("<root/>"), base_url="http://no/such/url")
+        docinfo = root.getroottree().docinfo
+        self.assertEqual(docinfo.URL, "http://no/such/url")
+
+    def test_XML_set_base_url_docinfo(self):
+        etree = self.etree
+        root = etree.XML(_bytes("<root/>"), base_url="http://no/such/url")
+        docinfo = root.getroottree().docinfo
+        self.assertEqual(docinfo.URL, "http://no/such/url")
+        docinfo.URL = "https://secret/url"
+        self.assertEqual(docinfo.URL, "https://secret/url")
+
+    def test_parse_stringio_base_url(self):
+        etree = self.etree
+        tree = etree.parse(BytesIO("<root/>"), base_url="http://no/such/url")
+        docinfo = tree.docinfo
+        self.assertEqual(docinfo.URL, "http://no/such/url")
+
+    def test_parse_base_url_docinfo(self):
+        etree = self.etree
+        tree = etree.parse(fileInTestDir('include/test_xinclude.xml'),
+                           base_url="http://no/such/url")
+        docinfo = tree.docinfo
+        self.assertEqual(docinfo.URL, "http://no/such/url")
+
+    def test_HTML_base_url_docinfo(self):
+        etree = self.etree
+        root = etree.HTML(_bytes("<html/>"), base_url="http://no/such/url")
+        docinfo = root.getroottree().docinfo
+        self.assertEqual(docinfo.URL, "http://no/such/url")
+
+    def test_docinfo_public(self):
+        etree = self.etree
+        xml_header = '<?xml version="1.0" encoding="ascii"?>'
+        pub_id = "-//W3C//DTD XHTML 1.0 Transitional//EN"
+        sys_id = "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"
+        doctype_string = '<!DOCTYPE html PUBLIC "%s" "%s">' % (pub_id, sys_id)
+
+        xml = _bytes(xml_header + doctype_string + '<html><body></body></html>')
+
+        tree = etree.parse(BytesIO(xml))
+        docinfo = tree.docinfo
+        self.assertEqual(docinfo.encoding,    "ascii")
+        self.assertEqual(docinfo.xml_version, "1.0")
+        self.assertEqual(docinfo.public_id,   pub_id)
+        self.assertEqual(docinfo.system_url,  sys_id)
+        self.assertEqual(docinfo.root_name,   'html')
+        self.assertEqual(docinfo.doctype, doctype_string)
+
+    def test_docinfo_system(self):
+        etree = self.etree
+        xml_header = '<?xml version="1.0" encoding="UTF-8"?>'
+        sys_id = "some.dtd"
+        doctype_string = '<!DOCTYPE html SYSTEM "%s">' % sys_id
+        xml = _bytes(xml_header + doctype_string + '<html><body></body></html>')
+
+        tree = etree.parse(BytesIO(xml))
+        docinfo = tree.docinfo
+        self.assertEqual(docinfo.encoding,    "UTF-8")
+        self.assertEqual(docinfo.xml_version, "1.0")
+        self.assertEqual(docinfo.public_id,   None)
+        self.assertEqual(docinfo.system_url,  sys_id)
+        self.assertEqual(docinfo.root_name,   'html')
+        self.assertEqual(docinfo.doctype, doctype_string)
+
+    def test_docinfo_empty(self):
+        etree = self.etree
+        xml = _bytes('<html><body></body></html>')
+        tree = etree.parse(BytesIO(xml))
+        docinfo = tree.docinfo
+        self.assertEqual(docinfo.encoding,    "UTF-8")
+        self.assertEqual(docinfo.xml_version, "1.0")
+        self.assertEqual(docinfo.public_id,   None)
+        self.assertEqual(docinfo.system_url,  None)
+        self.assertEqual(docinfo.root_name,   'html')
+        self.assertEqual(docinfo.doctype, '')
+
+    def test_docinfo_name_only(self):
+        etree = self.etree
+        xml = _bytes('<!DOCTYPE root><root></root>')
+        tree = etree.parse(BytesIO(xml))
+        docinfo = tree.docinfo
+        self.assertEqual(docinfo.encoding,    "UTF-8")
+        self.assertEqual(docinfo.xml_version, "1.0")
+        self.assertEqual(docinfo.public_id,   None)
+        self.assertEqual(docinfo.system_url,  None)
+        self.assertEqual(docinfo.root_name,   'root')
+        self.assertEqual(docinfo.doctype, '<!DOCTYPE root>')
+
+    def test_doctype_name_only_roundtrip(self):
+        etree = self.etree
+        xml = _bytes('<!DOCTYPE root>\n<root/>')
+        tree = etree.parse(BytesIO(xml))
+        self.assertEqual(xml, etree.tostring(tree))
+
+    def test_doctype_output_override(self):
+        etree = self.etree
+        pub_id = "-//W3C//DTD XHTML 1.0 Transitional//EN"
+        sys_id = "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"
+        doctype_string = _bytes('<!DOCTYPE html PUBLIC "%s" "%s">' % (pub_id, sys_id))
+
+        xml = _bytes('<!DOCTYPE root>\n<root/>')
+        tree = etree.parse(BytesIO(xml))
+        self.assertEqual(xml.replace(_bytes('<!DOCTYPE root>'), doctype_string),
+                          etree.tostring(tree, doctype=doctype_string))
+
+    def test_xml_base(self):
+        etree = self.etree
+        root = etree.XML(_bytes("<root/>"), base_url="http://no/such/url")
+        self.assertEqual(root.base, "http://no/such/url")
+        self.assertEqual(
+            root.get('{http://www.w3.org/XML/1998/namespace}base'), None)
+        root.base = "https://secret/url"
+        self.assertEqual(root.base, "https://secret/url")
+        self.assertEqual(
+            root.get('{http://www.w3.org/XML/1998/namespace}base'),
+            "https://secret/url")
+
+    def test_xml_base_attribute(self):
+        etree = self.etree
+        root = etree.XML(_bytes("<root/>"), base_url="http://no/such/url")
+        self.assertEqual(root.base, "http://no/such/url")
+        self.assertEqual(
+            root.get('{http://www.w3.org/XML/1998/namespace}base'), None)
+        root.set('{http://www.w3.org/XML/1998/namespace}base',
+                 "https://secret/url")
+        self.assertEqual(root.base, "https://secret/url")
+        self.assertEqual(
+            root.get('{http://www.w3.org/XML/1998/namespace}base'),
+            "https://secret/url")
+
+    def test_html_base(self):
+        etree = self.etree
+        root = etree.HTML(_bytes("<html><body></body></html>"),
+                          base_url="http://no/such/url")
+        self.assertEqual(root.base, "http://no/such/url")
+
+    def test_html_base_tag(self):
+        etree = self.etree
+        root = etree.HTML(_bytes('<html><head><base href="http://no/such/url"></head></html>'))
+        self.assertEqual(root.base, "http://no/such/url")
+
+    def test_parse_fileobject_unicode(self):
+        # parse from a file object that returns unicode strings
+        f = LargeFileLikeUnicode()
+        tree = self.etree.parse(f)
+        root = tree.getroot()
+        self.assertTrue(root.tag.endswith('root'))
+
+    def test_dtd_io(self):
+        # check that DTDs that go in also go back out
+        xml = _bytes('''\
+        <!DOCTYPE test SYSTEM "test.dtd" [
+          <!ENTITY entity "tasty">
+          <!ELEMENT test (a)>
+          <!ELEMENT a (#PCDATA)>
+        ]>
+        <test><a>test-test</a></test>\
+        ''')
+        tree = self.etree.parse(BytesIO(xml))
+        self.assertEqual(self.etree.tostring(tree).replace(_bytes(" "), _bytes("")),
+                         xml.replace(_bytes(" "), _bytes("")))
+
+    def test_byte_zero(self):
+        Element = self.etree.Element
+
+        a = Element('a')
+        self.assertRaises(ValueError, setattr, a, "text", 'ha\0ho')
+        self.assertRaises(ValueError, setattr, a, "tail", 'ha\0ho')
+
+        self.assertRaises(ValueError, Element, 'ha\0ho')
+
+    def test_unicode_byte_zero(self):
+        Element = self.etree.Element
+
+        a = Element('a')
+        self.assertRaises(ValueError, setattr, a, "text",
+                          _str('ha\0ho'))
+        self.assertRaises(ValueError, setattr, a, "tail",
+                          _str('ha\0ho'))
+
+        self.assertRaises(ValueError, Element,
+                          _str('ha\0ho'))
+
+    def test_byte_invalid(self):
+        Element = self.etree.Element
+
+        a = Element('a')
+        self.assertRaises(ValueError, setattr, a, "text", 'ha\x07ho')
+        self.assertRaises(ValueError, setattr, a, "text", 'ha\x02ho')
+
+        self.assertRaises(ValueError, setattr, a, "tail", 'ha\x07ho')
+        self.assertRaises(ValueError, setattr, a, "tail", 'ha\x02ho')
+
+        self.assertRaises(ValueError, Element, 'ha\x07ho')
+        self.assertRaises(ValueError, Element, 'ha\x02ho')
+
+    def test_unicode_byte_invalid(self):
+        Element = self.etree.Element
+
+        a = Element('a')
+        self.assertRaises(ValueError, setattr, a, "text",
+                          _str('ha\x07ho'))
+        self.assertRaises(ValueError, setattr, a, "text",
+                          _str('ha\x02ho'))
+
+        self.assertRaises(ValueError, setattr, a, "tail",
+                          _str('ha\x07ho'))
+        self.assertRaises(ValueError, setattr, a, "tail",
+                          _str('ha\x02ho'))
+
+        self.assertRaises(ValueError, Element,
+                          _str('ha\x07ho'))
+        self.assertRaises(ValueError, Element,
+                          _str('ha\x02ho'))
+
+    def test_unicode_byte_invalid_sequence(self):
+        Element = self.etree.Element
+
+        a = Element('a')
+        self.assertRaises(ValueError, setattr, a, "text",
+                          _str('ha\u1234\x07ho'))
+        self.assertRaises(ValueError, setattr, a, "text",
+                          _str('ha\u1234\x02ho'))
+
+        self.assertRaises(ValueError, setattr, a, "tail",
+                          _str('ha\u1234\x07ho'))
+        self.assertRaises(ValueError, setattr, a, "tail",
+                          _str('ha\u1234\x02ho'))
+
+        self.assertRaises(ValueError, Element,
+                          _str('ha\u1234\x07ho'))
+        self.assertRaises(ValueError, Element,
+                          _str('ha\u1234\x02ho'))
+
+    def test_encoding_tostring_utf16(self):
+        # ElementTree fails to serialize this
+        tostring = self.etree.tostring
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+
+        result = tostring(a, encoding='UTF-16')
+        self.assertEqual(_bytes('<a><b></b><c></c></a>'),
+                          canonicalize(result))
+
+    def test_tostring_none(self):
+        # ElementTree raises an AssertionError here
+        tostring = self.etree.tostring
+        self.assertRaises(TypeError, self.etree.tostring, None)
+
+    def test_tostring_pretty(self):
+        tostring = self.etree.tostring
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+
+        result = tostring(a)
+        self.assertEqual(result, _bytes("<a><b/><c/></a>"))
+
+        result = tostring(a, pretty_print=False)
+        self.assertEqual(result, _bytes("<a><b/><c/></a>"))
+
+        result = tostring(a, pretty_print=True)
+        self.assertEqual(result, _bytes("<a>\n  <b/>\n  <c/>\n</a>\n"))
+
+    def test_tostring_with_tail(self):
+        tostring = self.etree.tostring
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        a = Element('a')
+        a.tail = "aTAIL"
+        b = SubElement(a, 'b')
+        b.tail = "bTAIL"
+        c = SubElement(a, 'c')
+
+        result = tostring(a)
+        self.assertEqual(result, _bytes("<a><b/>bTAIL<c/></a>aTAIL"))
+
+        result = tostring(a, with_tail=False)
+        self.assertEqual(result, _bytes("<a><b/>bTAIL<c/></a>"))
+
+        result = tostring(a, with_tail=True)
+        self.assertEqual(result, _bytes("<a><b/>bTAIL<c/></a>aTAIL"))
+
+    def test_tostring_method_html_with_tail(self):
+        tostring = self.etree.tostring
+        html = self.etree.fromstring(
+            '<html><body>'
+            '<div><p>Some text<i>\r\n</i></p></div>\r\n'
+            '</body></html>',
+            parser=self.etree.HTMLParser())
+        self.assertEqual(html.tag, 'html')
+        div = html.find('.//div')
+        self.assertEqual(div.tail, '\r\n')
+        result = tostring(div, method='html')
+        self.assertEqual(
+            result,
+            _bytes("<div><p>Some text<i>\r\n</i></p></div>\r\n"))
+        result = tostring(div, method='html', with_tail=True)
+        self.assertEqual(
+            result,
+            _bytes("<div><p>Some text<i>\r\n</i></p></div>\r\n"))
+        result = tostring(div, method='html', with_tail=False)
+        self.assertEqual(
+            result,
+            _bytes("<div><p>Some text<i>\r\n</i></p></div>"))
+
+    def test_standalone(self):
+        tostring = self.etree.tostring
+        XML = self.etree.XML
+        ElementTree = self.etree.ElementTree
+        Element = self.etree.Element
+
+        tree = Element("root").getroottree()
+        self.assertEqual(None, tree.docinfo.standalone)
+
+        tree = XML(_bytes("<root/>")).getroottree()
+        self.assertEqual(None, tree.docinfo.standalone)
+
+        tree = XML(_bytes(
+            "<?xml version='1.0' encoding='ASCII' standalone='yes'?>\n<root/>"
+            )).getroottree()
+        self.assertEqual(True, tree.docinfo.standalone)
+
+        tree = XML(_bytes(
+            "<?xml version='1.0' encoding='ASCII' standalone='no'?>\n<root/>"
+            )).getroottree()
+        self.assertEqual(False, tree.docinfo.standalone)
+
+    def test_tostring_standalone(self):
+        tostring = self.etree.tostring
+        XML = self.etree.XML
+        ElementTree = self.etree.ElementTree
+
+        root = XML(_bytes("<root/>"))
+
+        tree = ElementTree(root)
+        self.assertEqual(None, tree.docinfo.standalone)
+
+        result = tostring(root, xml_declaration=True, encoding="ASCII")
+        self.assertEqual(result, _bytes(
+            "<?xml version='1.0' encoding='ASCII'?>\n<root/>"))
+
+        result = tostring(root, xml_declaration=True, encoding="ASCII",
+                          standalone=True)
+        self.assertEqual(result, _bytes(
+            "<?xml version='1.0' encoding='ASCII' standalone='yes'?>\n<root/>"))
+
+        tree = ElementTree(XML(result))
+        self.assertEqual(True, tree.docinfo.standalone)
+
+        result = tostring(root, xml_declaration=True, encoding="ASCII",
+                          standalone=False)
+        self.assertEqual(result, _bytes(
+            "<?xml version='1.0' encoding='ASCII' standalone='no'?>\n<root/>"))
+
+        tree = ElementTree(XML(result))
+        self.assertEqual(False, tree.docinfo.standalone)
+
+    def test_tostring_standalone_in_out(self):
+        tostring = self.etree.tostring
+        XML = self.etree.XML
+        ElementTree = self.etree.ElementTree
+
+        root = XML(_bytes(
+            "<?xml version='1.0' encoding='UTF-8' standalone='yes'?>\n<root/>"))
+
+        tree = ElementTree(root)
+        self.assertEqual(True, tree.docinfo.standalone)
+
+        result = tostring(root, xml_declaration=True, encoding="ASCII")
+        self.assertEqual(result, _bytes(
+            "<?xml version='1.0' encoding='ASCII'?>\n<root/>"))
+
+        result = tostring(root, xml_declaration=True, encoding="ASCII",
+                          standalone=True)
+        self.assertEqual(result, _bytes(
+            "<?xml version='1.0' encoding='ASCII' standalone='yes'?>\n<root/>"))
+
+    def test_tostring_method_text_encoding(self):
+        tostring = self.etree.tostring
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        a.text = "A"
+        a.tail = "tail"
+        b = SubElement(a, 'b')
+        b.text = "B"
+        b.tail = _str("Søk på nettet")
+        c = SubElement(a, 'c')
+        c.text = "C"
+
+        result = tostring(a, method="text", encoding="UTF-16")
+
+        self.assertEqual(_str('ABSøk på nettetCtail').encode("UTF-16"),
+                          result)
+
+    def test_tostring_method_text_unicode(self):
+        tostring = self.etree.tostring
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        a.text = _str('Søk på nettetA')
+        a.tail = "tail"
+        b = SubElement(a, 'b')
+        b.text = "B"
+        b.tail = _str('Søk på nettetB')
+        c = SubElement(a, 'c')
+        c.text = "C"
+        
+        self.assertRaises(UnicodeEncodeError,
+                          tostring, a, method="text")
+        
+        self.assertEqual(
+            _str('Søk på nettetABSøk på nettetBCtail').encode('utf-8'),
+            tostring(a, encoding="UTF-8", method="text"))
+
+    def test_tounicode(self):
+        tounicode = self.etree.tounicode
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        
+        self.assertTrue(isinstance(tounicode(a), _unicode))
+        self.assertEqual(_bytes('<a><b></b><c></c></a>'),
+                          canonicalize(tounicode(a)))
+
+    def test_tounicode_element(self):
+        tounicode = self.etree.tounicode
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        d = SubElement(c, 'd')
+        self.assertTrue(isinstance(tounicode(b), _unicode))
+        self.assertTrue(isinstance(tounicode(c), _unicode))
+        self.assertEqual(_bytes('<b></b>'),
+                          canonicalize(tounicode(b)))
+        self.assertEqual(_bytes('<c><d></d></c>'),
+                          canonicalize(tounicode(c)))
+
+    def test_tounicode_none(self):
+        tounicode = self.etree.tounicode
+        self.assertRaises(TypeError, self.etree.tounicode, None)
+
+    def test_tounicode_element_tail(self):
+        tounicode = self.etree.tounicode
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        d = SubElement(c, 'd')
+        b.tail = 'Foo'
+
+        self.assertTrue(isinstance(tounicode(b), _unicode))
+        self.assertTrue(tounicode(b) == '<b/>Foo' or
+                     tounicode(b) == '<b />Foo')
+
+    def test_tounicode_pretty(self):
+        tounicode = self.etree.tounicode
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+
+        result = tounicode(a)
+        self.assertEqual(result, "<a><b/><c/></a>")
+
+        result = tounicode(a, pretty_print=False)
+        self.assertEqual(result, "<a><b/><c/></a>")
+
+        result = tounicode(a, pretty_print=True)
+        self.assertEqual(result, "<a>\n  <b/>\n  <c/>\n</a>\n")
+
+    def test_tostring_unicode(self):
+        tostring = self.etree.tostring
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        
+        self.assertTrue(isinstance(tostring(a, encoding=_unicode), _unicode))
+        self.assertEqual(_bytes('<a><b></b><c></c></a>'),
+                          canonicalize(tostring(a, encoding=_unicode)))
+
+    def test_tostring_unicode_element(self):
+        tostring = self.etree.tostring
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        d = SubElement(c, 'd')
+        self.assertTrue(isinstance(tostring(b, encoding=_unicode), _unicode))
+        self.assertTrue(isinstance(tostring(c, encoding=_unicode), _unicode))
+        self.assertEqual(_bytes('<b></b>'),
+                          canonicalize(tostring(b, encoding=_unicode)))
+        self.assertEqual(_bytes('<c><d></d></c>'),
+                          canonicalize(tostring(c, encoding=_unicode)))
+
+    def test_tostring_unicode_none(self):
+        tostring = self.etree.tostring
+        self.assertRaises(TypeError, self.etree.tostring,
+                          None, encoding=_unicode)
+
+    def test_tostring_unicode_element_tail(self):
+        tostring = self.etree.tostring
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+        d = SubElement(c, 'd')
+        b.tail = 'Foo'
+
+        self.assertTrue(isinstance(tostring(b, encoding=_unicode), _unicode))
+        self.assertTrue(tostring(b, encoding=_unicode) == '<b/>Foo' or
+                     tostring(b, encoding=_unicode) == '<b />Foo')
+
+    def test_tostring_unicode_pretty(self):
+        tostring = self.etree.tostring
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+
+        a = Element('a')
+        b = SubElement(a, 'b')
+        c = SubElement(a, 'c')
+
+        result = tostring(a, encoding=_unicode)
+        self.assertEqual(result, "<a><b/><c/></a>")
+
+        result = tostring(a, encoding=_unicode, pretty_print=False)
+        self.assertEqual(result, "<a><b/><c/></a>")
+
+        result = tostring(a, encoding=_unicode, pretty_print=True)
+        self.assertEqual(result, "<a>\n  <b/>\n  <c/>\n</a>\n")
+
+    def test_pypy_proxy_collect(self):
+        root = etree.Element('parent')
+        etree.SubElement(root, 'child')
+
+        self.assertEqual(len(root), 1)
+        self.assertEqual(root[0].tag, 'child')
+
+        # in PyPy, GC used to kill the Python proxy instance without cleanup
+        gc.collect()
+        self.assertEqual(len(root), 1)
+        self.assertEqual(root[0].tag, 'child')
+
+    def test_element_refcycle(self):
+        class SubEl(etree.ElementBase):
+            pass
+
+        el1 = SubEl()
+        el2 = SubEl()
+        self.assertEqual('SubEl', el1.tag)
+        self.assertEqual('SubEl', el2.tag)
+        el1.other = el2
+        el2.other = el1
+
+        del el1, el2
+        gc.collect()
+        # not really testing anything here, but it shouldn't crash
+
+    # helper methods
+
+    def _writeElement(self, element, encoding='us-ascii', compression=0):
+        """Write out element for comparison.
+        """
+        ElementTree = self.etree.ElementTree
+        f = BytesIO()
+        tree = ElementTree(element=element)
+        tree.write(f, encoding=encoding, compression=compression)
+        data = f.getvalue()
+        if compression:
+            data = zlib.decompress(data)
+        return canonicalize(data)
+
+
+class _XIncludeTestCase(HelperTestCase):
+    def test_xinclude_text(self):
+        filename = fileInTestDir('test_broken.xml')
+        root = etree.XML(_bytes('''\
+        <doc xmlns:xi="http://www.w3.org/2001/XInclude">
+          <xi:include href="%s" parse="text"/>
+        </doc>
+        ''' % path2url(filename)))
+        old_text = root.text
+        content = read_file(filename)
+        old_tail = root[0].tail
+
+        self.include( etree.ElementTree(root) )
+        self.assertEqual(old_text + content + old_tail,
+                          root.text)
+
+    def test_xinclude(self):
+        tree = etree.parse(fileInTestDir('include/test_xinclude.xml'))
+        self.assertNotEqual(
+            'a',
+            tree.getroot()[1].tag)
+        # process xincludes
+        self.include( tree )
+        # check whether we find it replaced with included data
+        self.assertEqual(
+            'a',
+            tree.getroot()[1].tag)
+
+    def test_xinclude_resolver(self):
+        class res(etree.Resolver):
+            include_text = read_file(fileInTestDir('test.xml'))
+            called = {}
+            def resolve(self, url, id, context):
+                if url.endswith(".dtd"):
+                    self.called["dtd"] = True
+                    return self.resolve_filename(
+                        fileInTestDir('test.dtd'), context)
+                elif url.endswith("test_xinclude.xml"):
+                    self.called["input"] = True
+                    return None # delegate to default resolver
+                else:
+                    self.called["include"] = True
+                    return self.resolve_string(self.include_text, context)
+
+        res_instance = res()
+        parser = etree.XMLParser(load_dtd = True)
+        parser.resolvers.add(res_instance)
+
+        tree = etree.parse(fileInTestDir('include/test_xinclude.xml'),
+                           parser = parser)
+
+        self.include(tree)
+
+        called = list(res_instance.called.items())
+        called.sort()
+        self.assertEqual(
+            [("dtd", True), ("include", True), ("input", True)],
+            called)
+
+    def test_xinclude_resolver_recursive(self):
+        data = textwrap.dedent('''
+        <doc xmlns:xi="http://www.w3.org/2001/XInclude">
+        <foo/>
+        <xi:include href="./test.xml" />
+        </doc>
+        ''')
+
+        class Resolver(etree.Resolver):
+            called = {}
+
+            def resolve(self, url, id, context):
+                if url.endswith("test_xinclude.xml"):
+                    assert not self.called.get("input")
+                    self.called["input"] = True
+                    return None  # delegate to default resolver
+                elif url.endswith('/test5.xml'):
+                    assert not self.called.get("DONE")
+                    self.called["DONE"] = True
+                    return self.resolve_string('<DONE/>', context)
+                else:
+                    _, filename = url.rsplit('/', 1)
+                    assert not self.called.get(filename)
+                    self.called[filename] = True
+                    next_data = data.replace(
+                        'test.xml', 'test%d.xml' % len(self.called))
+                    return self.resolve_string(next_data, context)
+
+        res_instance = Resolver()
+        parser = etree.XMLParser(load_dtd=True)
+        parser.resolvers.add(res_instance)
+
+        tree = etree.parse(fileInTestDir('include/test_xinclude.xml'),
+                           parser=parser)
+
+        self.include(tree)
+
+        called = list(res_instance.called.items())
+        called.sort()
+        self.assertEqual(
+            [("DONE", True), ("input", True), ("test.xml", True),
+             ("test2.xml", True), ("test3.xml", True), ("test4.xml", True)],
+            called)
+
+
+class ETreeXIncludeTestCase(_XIncludeTestCase):
+    def include(self, tree):
+        tree.xinclude()
+
+
+class ElementIncludeTestCase(_XIncludeTestCase):
+    from lxml import ElementInclude
+    def include(self, tree):
+        self.ElementInclude.include(tree.getroot())
+
+
+class ETreeC14NTestCase(HelperTestCase):
+    def test_c14n(self):
+        tree = self.parse(_bytes('<a><b/></a>'))
+        f = BytesIO()
+        tree.write_c14n(f)
+        s = f.getvalue()
+        self.assertEqual(_bytes('<a><b></b></a>'),
+                          s)
+
+    def test_c14n_gzip(self):
+        tree = self.parse(_bytes('<a>'+'<b/>'*200+'</a>'))
+        f = BytesIO()
+        tree.write_c14n(f, compression=9)
+        gzfile = gzip.GzipFile(fileobj=BytesIO(f.getvalue()))
+        try:
+            s = gzfile.read()
+        finally:
+            gzfile.close()
+        self.assertEqual(_bytes('<a>'+'<b></b>'*200+'</a>'),
+                          s)
+
+    def test_c14n_file(self):
+        tree = self.parse(_bytes('<a><b/></a>'))
+        handle, filename = tempfile.mkstemp()
+        try:
+            tree.write_c14n(filename)
+            data = read_file(filename, 'rb')
+        finally:
+            os.close(handle)
+            os.remove(filename)
+        self.assertEqual(_bytes('<a><b></b></a>'),
+                          data)
+
+    def test_c14n_file_gzip(self):
+        tree = self.parse(_bytes('<a>'+'<b/>'*200+'</a>'))
+        handle, filename = tempfile.mkstemp()
+        try:
+            tree.write_c14n(filename, compression=9)
+            f = gzip.open(filename, 'rb')
+            try:
+                data = f.read()
+            finally:
+                f.close()
+        finally:
+            os.close(handle)
+            os.remove(filename)
+        self.assertEqual(_bytes('<a>'+'<b></b>'*200+'</a>'),
+                          data)
+
+    def test_c14n_with_comments(self):
+        tree = self.parse(_bytes('<!--hi--><a><!--ho--><b/></a><!--hu-->'))
+        f = BytesIO()
+        tree.write_c14n(f)
+        s = f.getvalue()
+        self.assertEqual(_bytes('<!--hi-->\n<a><!--ho--><b></b></a>\n<!--hu-->'),
+                          s)
+        f = BytesIO()
+        tree.write_c14n(f, with_comments=True)
+        s = f.getvalue()
+        self.assertEqual(_bytes('<!--hi-->\n<a><!--ho--><b></b></a>\n<!--hu-->'),
+                          s)
+        f = BytesIO()
+        tree.write_c14n(f, with_comments=False)
+        s = f.getvalue()
+        self.assertEqual(_bytes('<a><b></b></a>'),
+                          s)
+
+    def test_c14n_tostring_with_comments(self):
+        tree = self.parse(_bytes('<!--hi--><a><!--ho--><b/></a><!--hu-->'))
+        s = etree.tostring(tree, method='c14n')
+        self.assertEqual(_bytes('<!--hi-->\n<a><!--ho--><b></b></a>\n<!--hu-->'),
+                          s)
+        s = etree.tostring(tree, method='c14n', with_comments=True)
+        self.assertEqual(_bytes('<!--hi-->\n<a><!--ho--><b></b></a>\n<!--hu-->'),
+                          s)
+        s = etree.tostring(tree, method='c14n', with_comments=False)
+        self.assertEqual(_bytes('<a><b></b></a>'),
+                          s)
+
+    def test_c14n_element_tostring_with_comments(self):
+        tree = self.parse(_bytes('<!--hi--><a><!--ho--><b/></a><!--hu-->'))
+        s = etree.tostring(tree.getroot(), method='c14n')
+        self.assertEqual(_bytes('<a><!--ho--><b></b></a>'),
+                          s)
+        s = etree.tostring(tree.getroot(), method='c14n', with_comments=True)
+        self.assertEqual(_bytes('<a><!--ho--><b></b></a>'),
+                          s)
+        s = etree.tostring(tree.getroot(), method='c14n', with_comments=False)
+        self.assertEqual(_bytes('<a><b></b></a>'),
+                          s)
+
+    def test_c14n_exclusive(self):
+        tree = self.parse(_bytes(
+                '<a xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b/></a>'))
+        f = BytesIO()
+        tree.write_c14n(f)
+        s = f.getvalue()
+        self.assertEqual(_bytes('<a xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b></z:b></a>'),
+                          s)
+        f = BytesIO()
+        tree.write_c14n(f, exclusive=False)
+        s = f.getvalue()
+        self.assertEqual(_bytes('<a xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b></z:b></a>'),
+                          s)
+        f = BytesIO()
+        tree.write_c14n(f, exclusive=True)
+        s = f.getvalue()
+        self.assertEqual(_bytes('<a xmlns="http://abc"><z:b xmlns:z="http://cde"></z:b></a>'),
+                          s)
+
+        f = BytesIO()
+        tree.write_c14n(f, exclusive=True, inclusive_ns_prefixes=['z'])
+        s = f.getvalue()
+        self.assertEqual(_bytes('<a xmlns="http://abc" xmlns:z="http://cde"><z:b></z:b></a>'),
+                          s)
+
+    def test_c14n_tostring_exclusive(self):
+        tree = self.parse(_bytes(
+                '<a xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b/></a>'))
+        s = etree.tostring(tree, method='c14n')
+        self.assertEqual(_bytes('<a xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b></z:b></a>'),
+                          s)
+        s = etree.tostring(tree, method='c14n', exclusive=False)
+        self.assertEqual(_bytes('<a xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b></z:b></a>'),
+                          s)
+        s = etree.tostring(tree, method='c14n', exclusive=True)
+        self.assertEqual(_bytes('<a xmlns="http://abc"><z:b xmlns:z="http://cde"></z:b></a>'),
+                          s)
+
+        s = etree.tostring(tree, method='c14n', exclusive=True, inclusive_ns_prefixes=['y'])
+        self.assertEqual(_bytes('<a xmlns="http://abc" xmlns:y="http://bcd"><z:b xmlns:z="http://cde"></z:b></a>'),
+                          s)
+
+    def test_c14n_element_tostring_exclusive(self):
+        tree = self.parse(_bytes(
+                '<a xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b/></a>'))
+        s = etree.tostring(tree.getroot(), method='c14n')
+        self.assertEqual(_bytes('<a xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b></z:b></a>'),
+                          s)
+        s = etree.tostring(tree.getroot(), method='c14n', exclusive=False)
+        self.assertEqual(_bytes('<a xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b></z:b></a>'),
+                          s)
+        s = etree.tostring(tree.getroot(), method='c14n', exclusive=True)
+        self.assertEqual(_bytes('<a xmlns="http://abc"><z:b xmlns:z="http://cde"></z:b></a>'),
+                          s)
+
+        s = etree.tostring(tree.getroot()[0], method='c14n', exclusive=False)
+        self.assertEqual(_bytes('<z:b xmlns="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"></z:b>'),
+                          s)
+        s = etree.tostring(tree.getroot()[0], method='c14n', exclusive=True)
+        self.assertEqual(_bytes('<z:b xmlns:z="http://cde"></z:b>'),
+                          s)
+
+        s = etree.tostring(tree.getroot()[0], method='c14n', exclusive=True, inclusive_ns_prefixes=['y'])
+        self.assertEqual(_bytes('<z:b xmlns:y="http://bcd" xmlns:z="http://cde"></z:b>'),
+                          s)
+
+    def test_c14n_tostring_inclusive_ns_prefixes(self):
+        """ Regression test to fix memory allocation issues (use 3+ inclusive NS spaces)"""
+        tree = self.parse(_bytes(
+                '<a xmlns:x="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b/></a>'))
+
+        s = etree.tostring(tree, method='c14n', exclusive=True, inclusive_ns_prefixes=['x', 'y', 'z'])
+        self.assertEqual(_bytes('<a xmlns:x="http://abc" xmlns:y="http://bcd" xmlns:z="http://cde"><z:b></z:b></a>'),
+                          s)
+
+
+class ETreeWriteTestCase(HelperTestCase):
+    def test_write(self):
+        tree = self.parse(_bytes('<a><b/></a>'))
+        f = BytesIO()
+        tree.write(f)
+        s = f.getvalue()
+        self.assertEqual(_bytes('<a><b/></a>'),
+                          s)
+
+    def test_write_gzip(self):
+        tree = self.parse(_bytes('<a>'+'<b/>'*200+'</a>'))
+        f = BytesIO()
+        tree.write(f, compression=9)
+        gzfile = gzip.GzipFile(fileobj=BytesIO(f.getvalue()))
+        try:
+            s = gzfile.read()
+        finally:
+            gzfile.close()
+        self.assertEqual(_bytes('<a>'+'<b/>'*200+'</a>'),
+                          s)
+
+    def test_write_gzip_level(self):
+        tree = self.parse(_bytes('<a>'+'<b/>'*200+'</a>'))
+        f = BytesIO()
+        tree.write(f, compression=0)
+        s0 = f.getvalue()
+
+        f = BytesIO()
+        tree.write(f)
+        self.assertEqual(f.getvalue(), s0)
+
+        f = BytesIO()
+        tree.write(f, compression=1)
+        s = f.getvalue()
+        self.assertTrue(len(s) <= len(s0))
+        gzfile = gzip.GzipFile(fileobj=BytesIO(s))
+        try:
+            s1 = gzfile.read()
+        finally:
+            gzfile.close()
+
+        f = BytesIO()
+        tree.write(f, compression=9)
+        s = f.getvalue()
+        self.assertTrue(len(s) <= len(s0))
+        gzfile = gzip.GzipFile(fileobj=BytesIO(s))
+        try:
+            s9 = gzfile.read()
+        finally:
+            gzfile.close()
+
+        self.assertEqual(_bytes('<a>'+'<b/>'*200+'</a>'),
+                          s0)
+        self.assertEqual(_bytes('<a>'+'<b/>'*200+'</a>'),
+                          s1)
+        self.assertEqual(_bytes('<a>'+'<b/>'*200+'</a>'),
+                          s9)
+
+    def test_write_file(self):
+        tree = self.parse(_bytes('<a><b/></a>'))
+        handle, filename = tempfile.mkstemp()
+        try:
+            tree.write(filename)
+            data = read_file(filename, 'rb')
+        finally:
+            os.close(handle)
+            os.remove(filename)
+        self.assertEqual(_bytes('<a><b/></a>'),
+                          data)
+
+    def test_write_file_gzip(self):
+        tree = self.parse(_bytes('<a>'+'<b/>'*200+'</a>'))
+        handle, filename = tempfile.mkstemp()
+        try:
+            tree.write(filename, compression=9)
+            f = gzip.open(filename, 'rb')
+            try:
+                data = f.read()
+            finally:
+                f.close()
+        finally:
+            os.close(handle)
+            os.remove(filename)
+        self.assertEqual(_bytes('<a>'+'<b/>'*200+'</a>'),
+                          data)
+
+    def test_write_file_gzip_parse(self):
+        tree = self.parse(_bytes('<a>'+'<b/>'*200+'</a>'))
+        handle, filename = tempfile.mkstemp()
+        try:
+            tree.write(filename, compression=9)
+            data = etree.tostring(etree.parse(filename))
+        finally:
+            os.close(handle)
+            os.remove(filename)
+        self.assertEqual(_bytes('<a>'+'<b/>'*200+'</a>'),
+                          data)
+
+    def test_write_file_gzipfile_parse(self):
+        tree = self.parse(_bytes('<a>'+'<b/>'*200+'</a>'))
+        handle, filename = tempfile.mkstemp()
+        try:
+            tree.write(filename, compression=9)
+            gzfile = gzip.GzipFile(filename)
+            data = etree.tostring(etree.parse(gzfile))
+            gzfile.close()  # release the file so that it can be removed below
+        finally:
+            os.close(handle)
+            os.remove(filename)
+        self.assertEqual(_bytes('<a>'+'<b/>'*200+'</a>'), data)
+
+class ETreeErrorLogTest(HelperTestCase):
+    etree = etree
+
+    def test_parse_error_logging(self):
+        parse = self.etree.parse
+        f = BytesIO('<a><b></c></b></a>')
+        self.etree.clear_error_log()
+        try:
+            parse(f)
+            self.fail("parsing mismatched tags did not raise SyntaxError")
+        except SyntaxError:
+            e = sys.exc_info()[1]
+            logs = e.error_log  # log entries attached to the raised error
+        f.close()
+        self.assertTrue([ log for log in logs
+                       if 'mismatch' in log.message ])
+        self.assertTrue([ log for log in logs
+                       if 'PARSER'   in log.domain_name])
+        self.assertTrue([ log for log in logs
+                       if 'ERR_TAG_NAME_MISMATCH' in log.type_name ])
+        self.assertTrue([ log for log in logs
+                       if 1 == log.line ])
+        self.assertTrue([ log for log in logs
+                       if 15 == log.column ])
+
+    def _test_python_error_logging(self):
+        """This can't really be tested as long as there isn't a way to
+        reset the logging setup ...
+        """
+        parse = self.etree.parse
+
+        messages = []
+        class Logger(self.etree.PyErrorLog):
+            def log(self, entry, message, *args):
+                messages.append(message)
+
+        self.etree.use_global_python_log(Logger())
+        f = BytesIO('<a><b></c></b></a>')
+        try:
+            parse(f)
+        except SyntaxError:
+            pass
+        f.close()
+
+        self.assertTrue([ message for message in messages
+                       if 'mismatch' in message ])
+        self.assertTrue([ message for message in messages
+                       if ':PARSER:'   in message])
+        self.assertTrue([ message for message in messages
+                       if ':ERR_TAG_NAME_MISMATCH:' in message ])
+        self.assertTrue([ message for message in messages
+                       if ':1:15:' in message ])
+
+
+class XMLPullParserTest(unittest.TestCase):
+    etree = etree
+
+    def assert_event_tags(self, events, expected):
+        self.assertEqual([(action, elem.tag) for action, elem in events],
+                         expected)
+
+    def test_pull_from_simple_target(self):
+        class Target(object):
+            def start(self, tag, attrib):
+                return 'start(%s)' % tag
+            def end(self, tag):
+                return 'end(%s)' % tag
+            def close(self):
+                return 'close()'
+
+        parser = self.etree.XMLPullParser(target=Target())
+        events = parser.read_events()
+
+        parser.feed('<root><element>')
+        self.assertFalse(list(events))
+        self.assertFalse(list(events))
+        parser.feed('</element><child>')
+        self.assertEqual([('end', 'end(element)')], list(events))
+        parser.feed('</child>')
+        self.assertEqual([('end', 'end(child)')], list(events))
+        parser.feed('</root>')
+        self.assertEqual([('end', 'end(root)')], list(events))
+        self.assertFalse(list(events))
+        self.assertEqual('close()', parser.close())
+
+    def test_pull_from_simple_target_start_end(self):
+        class Target(object):
+            def start(self, tag, attrib):
+                return 'start(%s)' % tag
+            def end(self, tag):
+                return 'end(%s)' % tag
+            def close(self):
+                return 'close()'
+
+        parser = self.etree.XMLPullParser(
+            ['start', 'end'], target=Target())
+        events = parser.read_events()
+
+        parser.feed('<root><element>')
+        self.assertEqual(
+            [('start', 'start(root)'), ('start', 'start(element)')],
+            list(events))
+        self.assertFalse(list(events))
+        parser.feed('</element><child>')
+        self.assertEqual(
+            [('end', 'end(element)'), ('start', 'start(child)')],
+            list(events))
+        parser.feed('</child>')
+        self.assertEqual(
+            [('end', 'end(child)')],
+            list(events))
+        parser.feed('</root>')
+        self.assertEqual(
+            [('end', 'end(root)')],
+            list(events))
+        self.assertFalse(list(events))
+        self.assertEqual('close()', parser.close())
+
+    def test_pull_from_tree_builder(self):
+        parser = self.etree.XMLPullParser(
+            ['start', 'end'], target=etree.TreeBuilder())
+        events = parser.read_events()
+
+        parser.feed('<root><element>')
+        self.assert_event_tags(
+            events, [('start', 'root'), ('start', 'element')])
+        self.assertFalse(list(events))
+        parser.feed('</element><child>')
+        self.assert_event_tags(
+            events, [('end', 'element'), ('start', 'child')])
+        parser.feed('</child>')
+        self.assert_event_tags(
+            events, [('end', 'child')])
+        parser.feed('</root>')
+        self.assert_event_tags(
+            events, [('end', 'root')])
+        self.assertFalse(list(events))
+        root = parser.close()
+        self.assertEqual('root', root.tag)
+
+    def test_pull_from_tree_builder_subclass(self):
+        class Target(etree.TreeBuilder):
+            def end(self, tag):
+                el = super(Target, self).end(tag)
+                el.tag += '-huhu'
+                return el
+
+        parser = self.etree.XMLPullParser(
+            ['start', 'end'], target=Target())
+        events = parser.read_events()
+
+        parser.feed('<root><element>')
+        self.assert_event_tags(
+            events, [('start', 'root'), ('start', 'element')])
+        self.assertFalse(list(events))
+        parser.feed('</element><child>')
+        self.assert_event_tags(
+            events, [('end', 'element-huhu'), ('start', 'child')])
+        parser.feed('</child>')
+        self.assert_event_tags(
+            events, [('end', 'child-huhu')])
+        parser.feed('</root>')
+        self.assert_event_tags(
+            events, [('end', 'root-huhu')])
+        self.assertFalse(list(events))
+        root = parser.close()
+        self.assertEqual('root-huhu', root.tag)
+
+
+def test_suite():
+    """Build the suite of all test cases and doctests for this module."""
+    # unittest.makeSuite() is deprecated (removed in Python 3.13), so ask
+    # the default loader for each test case class directly.
+    load_case = unittest.defaultTestLoader.loadTestsFromTestCase
+    suite = unittest.TestSuite()
+    for test_case in (ETreeOnlyTestCase,
+                      ETreeXIncludeTestCase,
+                      ElementIncludeTestCase,
+                      ETreeC14NTestCase,
+                      ETreeWriteTestCase,
+                      ETreeErrorLogTest,
+                      XMLPullParserTest):
+        suite.addTests([load_case(test_case)])
+    suite.addTests(doctest.DocTestSuite(etree))
+    doc_files = ['tutorial.txt']
+    if sys.version_info >= (2,6):
+        # now requires the 'with' statement
+        doc_files.append('api.txt')
+    doc_files.extend(['FAQ.txt', 'parsing.txt', 'resolvers.txt'])
+    for doc_file in doc_files:
+        suite.addTests([make_doctest('../../../doc/' + doc_file)])
+    return suite
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_htmlparser.py b/lib/lxml/tests/test_htmlparser.py
new file mode 100644
index 00000000..4f60c0b9
--- /dev/null
+++ b/lib/lxml/tests/test_htmlparser.py
@@ -0,0 +1,516 @@
+# -*- coding: utf-8 -*-
+
+"""
+HTML parser test cases for etree
+"""
+
+import unittest
+import tempfile, os, os.path, sys
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, StringIO, BytesIO, fileInTestDir, _bytes, _str
+from common_imports import SillyFileLike, HelperTestCase, write_to_file, next
+
+try:
+    unicode
+except NameError:
+    unicode = str
+
+class HtmlParserTestCase(HelperTestCase):
+    """HTML parser test cases
+    """
+    etree = etree
+
+    html_str = _bytes("<html><head><title>test</title></head><body><h1>page title</h1></body></html>")
+    html_str_pretty = _bytes("""\
+<html>
+<head><title>test</title></head>
+<body><h1>page title</h1></body>
+</html>
+""")
+    broken_html_str = _bytes("<html><head><title>test"
+                             "<body><h1>page title</h3></p></html>")
+    uhtml_str = _bytes(
+        "<html><head><title>test Ã¡</title></head>"
+        "<body><h1>page Ã¡ title</h1></body></html>").decode('utf8')
+
+    def tearDown(self):
+        super(HtmlParserTestCase, self).tearDown()
+        self.etree.set_default_parser()
+
+    def test_module_HTML(self):
+        element = self.etree.HTML(self.html_str)
+        self.assertEqual(self.etree.tostring(element, method="html"),
+                         self.html_str)
+
+    def test_module_HTML_unicode(self):
+        element = self.etree.HTML(self.uhtml_str)
+        self.assertEqual(
+            self.etree.tostring(element, method="html", encoding='unicode'),
+            self.uhtml_str)
+        self.assertEqual(element.findtext('.//h1'),
+                         _bytes("page Ã¡ title").decode('utf8'))
+
+    def test_wide_unicode_xml(self):
+        if sys.maxunicode < 1114111:
+            return  # skip test
+        element = self.etree.HTML(_bytes(
+            '<html><body><p>\\U00026007</p></body></html>'
+        ).decode('unicode_escape'))
+        p_text = element.findtext('.//p')
+        self.assertEqual(1, len(p_text))
+        self.assertEqual(_bytes('\\U00026007').decode('unicode_escape'),
+                         p_text)
+
+    def test_module_HTML_pretty_print(self):
+        element = self.etree.HTML(self.html_str)
+        self.assertEqual(self.etree.tostring(element, method="html", pretty_print=True),
+                         self.html_str_pretty)
+
+    def test_module_parse_html_error(self):
+        parser = self.etree.HTMLParser(recover=False)
+        parse = self.etree.parse
+        f = BytesIO("<html></body>")
+        self.assertRaises(self.etree.XMLSyntaxError,
+                          parse, f, parser)
+
+    def test_html_element_name_empty(self):
+        parser = self.etree.HTMLParser()
+        Element = parser.makeelement
+
+        el = Element('name')
+        self.assertRaises(ValueError, Element, '{}')
+        self.assertRaises(ValueError, setattr, el, 'tag', '{}')
+
+        self.assertRaises(ValueError, Element, '{test}')
+        self.assertRaises(ValueError, setattr, el, 'tag', '{test}')
+
+    def test_html_element_name_colon(self):
+        parser = self.etree.HTMLParser()
+        Element = parser.makeelement
+
+        pname = Element('p:name')
+        self.assertEqual(pname.tag, 'p:name')
+
+        pname = Element('{test}p:name')
+        self.assertEqual(pname.tag, '{test}p:name')
+
+        pname = Element('name')
+        pname.tag = 'p:name'
+        self.assertEqual(pname.tag, 'p:name')
+
+    def test_html_element_name_quote(self):
+        parser = self.etree.HTMLParser()
+        Element = parser.makeelement
+
+        self.assertRaises(ValueError, Element, 'p"name')
+        self.assertRaises(ValueError, Element, "na'me")
+        self.assertRaises(ValueError, Element, '{test}"name')
+        self.assertRaises(ValueError, Element, "{test}name'")
+
+        el = Element('name')
+        self.assertRaises(ValueError, setattr, el, 'tag', "pname'")
+        self.assertRaises(ValueError, setattr, el, 'tag', '"pname')
+        self.assertEqual(el.tag, "name")
+
+    def test_html_element_name_space(self):
+        parser = self.etree.HTMLParser()
+        Element = parser.makeelement
+
+        self.assertRaises(ValueError, Element, ' name ')
+        self.assertRaises(ValueError, Element, 'na me')
+        self.assertRaises(ValueError, Element, '{test} name')
+
+        el = Element('name')
+        self.assertRaises(ValueError, setattr, el, 'tag', ' name ')
+        self.assertEqual(el.tag, "name")
+
+    def test_html_subelement_name_empty(self):
+        parser = self.etree.HTMLParser()
+        Element = parser.makeelement
+
+        SubElement = self.etree.SubElement
+
+        el = Element('name')
+        self.assertRaises(ValueError, SubElement, el, '{}')
+        self.assertRaises(ValueError, SubElement, el, '{test}')
+
+    def test_html_subelement_name_colon(self):
+        parser = self.etree.HTMLParser()
+        Element = parser.makeelement
+        SubElement = self.etree.SubElement
+
+        el = Element('name')
+        pname = SubElement(el, 'p:name')
+        self.assertEqual(pname.tag, 'p:name')
+
+        pname = SubElement(el, '{test}p:name')
+        self.assertEqual(pname.tag, '{test}p:name')
+
+    def test_html_subelement_name_quote(self):
+        parser = self.etree.HTMLParser()
+        Element = parser.makeelement
+        SubElement = self.etree.SubElement
+
+        el = Element('name')
+        self.assertRaises(ValueError, SubElement, el, "name'")
+        self.assertRaises(ValueError, SubElement, el, 'na"me')
+        self.assertRaises(ValueError, SubElement, el, "{test}na'me")
+        self.assertRaises(ValueError, SubElement, el, '{test}"name')
+
+    def test_html_subelement_name_space(self):
+        parser = self.etree.HTMLParser()
+        Element = parser.makeelement
+        SubElement = self.etree.SubElement
+
+        el = Element('name')
+        self.assertRaises(ValueError, SubElement, el, ' name ')
+        self.assertRaises(ValueError, SubElement, el, 'na me')
+        self.assertRaises(ValueError, SubElement, el, '{test} name')
+
+    def test_module_parse_html_norecover(self):
+        parser = self.etree.HTMLParser(recover=False)
+        parse = self.etree.parse
+        f = BytesIO(self.broken_html_str)
+        self.assertRaises(self.etree.XMLSyntaxError,
+                          parse, f, parser)
+
+    def test_parse_encoding_8bit_explicit(self):
+        text = _str('Søk på nettet')
+        html_latin1 = (_str('<p>%s</p>') % text).encode('iso-8859-1')
+
+        tree = self.etree.parse(
+            BytesIO(html_latin1),
+            self.etree.HTMLParser(encoding="iso-8859-1"))
+        p = tree.find("//p")
+        self.assertEqual(p.text, text)
+
+    def test_parse_encoding_8bit_override(self):
+        text = _str('Søk på nettet')
+        wrong_head = _str('''
+        <head>
+          <meta http-equiv="Content-Type"
+                content="text/html; charset=UTF-8" />
+        </head>''')
+        html_latin1 = (_str('<html>%s<body><p>%s</p></body></html>') % (wrong_head,
+                                                                        text)
+                      ).encode('iso-8859-1')
+
+        self.assertRaises(self.etree.ParseError,
+                          self.etree.parse,
+                          BytesIO(html_latin1))
+
+        tree = self.etree.parse(
+            BytesIO(html_latin1),
+            self.etree.HTMLParser(encoding="iso-8859-1"))
+        p = tree.find("//p")
+        self.assertEqual(p.text, text)
+
+    def test_module_HTML_broken(self):
+        element = self.etree.HTML(self.broken_html_str)
+        self.assertEqual(self.etree.tostring(element, method="html"),
+                         self.html_str)
+
+    def test_module_HTML_cdata(self):
+        # libxml2 generates CDATA nodes for <script>/<style> content by default
+        html = _bytes('<html><head><style>foo</style></head></html>')
+        element = self.etree.HTML(html)
+        self.assertEqual(element[0][0].text, "foo")
+
+    def test_module_HTML_access(self):
+        element = self.etree.HTML(self.html_str)
+        self.assertEqual(element[0][0].tag, 'title')
+
+    def test_module_parse_html(self):
+        handle, filename = tempfile.mkstemp(suffix=".html")  # not racy mktemp()
+        try:
+            os.close(handle)  # the file is reopened by name below
+            write_to_file(filename, self.html_str, 'wb')
+            f = open(filename, 'rb')
+            tree = self.etree.parse(f, self.etree.HTMLParser())
+            f.close()
+            self.assertEqual(self.etree.tostring(tree.getroot(), method="html"),
+                             self.html_str)
+        finally:
+            os.remove(filename)
+
+    def test_module_parse_html_filelike(self):
+        parser = self.etree.HTMLParser()
+        f = SillyFileLike(self.html_str)
+        tree = self.etree.parse(f, parser)
+        html = self.etree.tostring(tree.getroot(),
+                                   method="html", encoding='UTF-8')
+        self.assertEqual(html, self.html_str)
+
+##     def test_module_parse_html_filelike_unicode(self):
+##         parser = self.etree.HTMLParser()
+##         f = SillyFileLike(self.uhtml_str)
+##         tree = self.etree.parse(f, parser)
+##         html = self.etree.tostring(tree.getroot(), encoding='UTF-8')
+##         self.assertEqual(unicode(html, 'UTF-8'), self.uhtml_str)
+
+    def test_html_file_error(self):
+        parser = self.etree.HTMLParser()
+        parse = self.etree.parse
+        self.assertRaises(IOError,
+                          parse, "__some_hopefully_nonexisting_file__.html",
+                          parser)
+
+    def test_default_parser_HTML_broken(self):
+        self.assertRaises(self.etree.XMLSyntaxError,
+                          self.etree.parse, BytesIO(self.broken_html_str))
+
+        self.etree.set_default_parser( self.etree.HTMLParser() )
+        try:  # always restore the default parser, even if the check below fails
+            tree = self.etree.parse(BytesIO(self.broken_html_str))
+            self.assertEqual(self.etree.tostring(tree.getroot(), method="html"),
+                             self.html_str)
+        finally:
+            self.etree.set_default_parser()
+
+        self.assertRaises(self.etree.XMLSyntaxError,
+                          self.etree.parse, BytesIO(self.broken_html_str))
+
+    def test_html_iterparse(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO(
+            '<html><head><title>TITLE</title><body><p>P</p></body></html>')
+
+        iterator = iterparse(f, html=True)
+        self.assertEqual(None, iterator.root)
+
+        events = list(iterator)
+        root = iterator.root
+        self.assertTrue(root is not None)
+        self.assertEqual(
+            [('end', root[0][0]), ('end', root[0]), ('end', root[1][0]),
+             ('end', root[1]), ('end', root)],
+            events)
+
+    def test_html_iterparse_stop_short(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO(
+            '<html><head><title>TITLE</title><body><p>P</p></body></html>')
+
+        iterator = iterparse(f, html=True)
+        self.assertEqual(None, iterator.root)
+
+        event, element = next(iterator)
+        self.assertEqual('end', event)
+        self.assertEqual('title', element.tag)
+        self.assertEqual(None, iterator.root)
+        del element
+
+        event, element = next(iterator)
+        self.assertEqual('end', event)
+        self.assertEqual('head', element.tag)
+        self.assertEqual(None, iterator.root)
+        del element
+        del iterator
+
+    def test_html_iterparse_broken(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<head><title>TEST></head><p>P<br></div>')
+
+        iterator = iterparse(f, html=True)
+        self.assertEqual(None, iterator.root)
+
+        events = list(iterator)
+        root = iterator.root
+        self.assertTrue(root is not None)
+        self.assertEqual('html', root.tag)
+        self.assertEqual('head', root[0].tag)
+        self.assertEqual('body', root[1].tag)
+        self.assertEqual('p', root[1][0].tag)
+        self.assertEqual('br', root[1][0][0].tag)
+        self.assertEqual(
+            [('end', root[0][0]), ('end', root[0]), ('end', root[1][0][0]),
+             ('end', root[1][0]), ('end', root[1]), ('end', root)],
+            events)
+
+    def test_html_iterparse_broken_no_recover(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO('<p>P<br></div>')
+        iterator = iterparse(f, html=True, recover=False)
+        self.assertRaises(self.etree.XMLSyntaxError, list, iterator)
+
+    def test_html_iterparse_file(self):
+        iterparse = self.etree.iterparse
+        iterator = iterparse(fileInTestDir("shakespeare.html"),
+                             html=True)
+
+        self.assertEqual(None, iterator.root)
+        events = list(iterator)
+        root = iterator.root
+        self.assertTrue(root is not None)
+        self.assertEqual(249, len(events))
+        self.assertFalse(
+            [event for (event, element) in events if event != 'end'])
+
+    def test_html_iterparse_start(self):
+        iterparse = self.etree.iterparse
+        f = BytesIO(
+            '<html><head><title>TITLE</title><body><p>P</p></body></html>')
+
+        iterator = iterparse(f, html=True, events=('start',))
+        self.assertEqual(None, iterator.root)  # root is not set before iteration
+
+        events = list(iterator)
+        root = iterator.root
+        self.assertTrue(root is not None)  # identity check, as in the sibling iterparse tests
+        self.assertEqual(
+            [('start', root), ('start', root[0]), ('start', root[0][0]),
+                ('start', root[1]), ('start', root[1][0])],
+            events)
+
+    def test_html_feed_parser(self):
+        parser = self.etree.HTMLParser()
+        parser.feed("<html><body></")
+        parser.feed("body></html>")
+        root = parser.close()
+
+        self.assertEqual('html', root.tag)
+        # test that we find all names in the parser dict
+        self.assertEqual([root], list(root.iter('html')))
+        self.assertEqual([root[0]], list(root.iter('body')))
+
+    def test_html_feed_parser_chunky(self):
+        parser = self.etree.HTMLParser()
+        parser.feed("<htm")
+        parser.feed("l><body")
+        parser.feed("><")
+        parser.feed("p><")
+        parser.feed("strong")
+        parser.feed(">some ")
+        parser.feed("text</strong></p><")
+        parser.feed("/body></html>")
+        root = parser.close()
+
+        self.assertEqual('html', root.tag)
+        # test that we find all names in the parser dict
+        self.assertEqual([root], list(root.iter('html')))
+        self.assertEqual([root[0]], list(root.iter('body')))
+        self.assertEqual([root[0][0]], list(root.iter('p')))
+        self.assertEqual([root[0][0][0]], list(root.iter('strong')))
+
+    def test_html_feed_parser_more_tags(self):
+        parser = self.etree.HTMLParser()
+        parser.feed('<html><head>')
+        parser.feed('<title>TITLE</title><body><p>P</p></body><')
+        parser.feed("/html>")
+        root = parser.close()
+
+        self.assertEqual('html', root.tag)
+        # test that we find all names in the parser dict
+        self.assertEqual([root], list(root.iter('html')))
+        self.assertEqual([root[0]], list(root.iter('head')))
+        self.assertEqual([root[0][0]], list(root.iter('title')))
+        self.assertEqual([root[1]], list(root.iter('body')))
+        self.assertEqual([root[1][0]], list(root.iter('p')))
+
+    def test_html_parser_target_tag(self):
+        assertFalse  = self.assertFalse
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append(("start", tag))
+                assertFalse(attrib)
+            def end(self, tag):
+                events.append(("end", tag))
+            def close(self):
+                return "DONE"
+
+        parser = self.etree.HTMLParser(target=Target())
+
+        parser.feed("<html><body></body></html>")
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual([
+            ("start", "html"), ("start", "body"),
+            ("end", "body"), ("end", "html")], events)
+
+    def test_html_parser_target_doctype_empty(self):
+        assertFalse  = self.assertFalse
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append(("start", tag))
+                assertFalse(attrib)
+            def end(self, tag):
+                events.append(("end", tag))
+            def doctype(self, *args):
+                events.append(("doctype", args))
+            def close(self):
+                return "DONE"
+
+        parser = self.etree.HTMLParser(target=Target())
+        parser.feed("<!DOCTYPE><html><body></body></html>")
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual([
+            ("doctype", (None, None, None)),
+            ("start", "html"), ("start", "body"),
+            ("end", "body"), ("end", "html")], events)
+
+    def test_html_parser_target_doctype_html(self):
+        assertFalse  = self.assertFalse
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append(("start", tag))
+                assertFalse(attrib)
+            def end(self, tag):
+                events.append(("end", tag))
+            def doctype(self, *args):
+                events.append(("doctype", args))
+            def close(self):
+                return "DONE"
+
+        parser = self.etree.HTMLParser(target=Target())
+        parser.feed("<!DOCTYPE html><html><body></body></html>")
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual([
+            ("doctype", ("html", None, None)),
+            ("start", "html"), ("start", "body"),
+            ("end", "body"), ("end", "html")], events)
+
+    def test_html_parser_target_doctype_html_full(self):
+        assertFalse  = self.assertFalse
+        events = []
+        class Target(object):
+            def start(self, tag, attrib):
+                events.append(("start", tag))
+                assertFalse(attrib)
+            def end(self, tag):
+                events.append(("end", tag))
+            def doctype(self, *args):
+                events.append(("doctype", args))
+            def close(self):
+                return "DONE"
+
+        parser = self.etree.HTMLParser(target=Target())
+        parser.feed('<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01//EN" "sys.dtd">'
+                    '<html><body></body></html>')
+        done = parser.close()
+
+        self.assertEqual("DONE", done)
+        self.assertEqual([
+            ("doctype", ("html", "-//W3C//DTD HTML 4.01//EN", "sys.dtd")),
+            ("start", "html"), ("start", "body"),
+            ("end", "body"), ("end", "html")], events)
+
+
+def test_suite():
+    load = unittest.defaultTestLoader.loadTestsFromTestCase  # makeSuite() is gone in 3.13
+    suite = unittest.TestSuite([load(HtmlParserTestCase)])
+    return suite
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_http_io.py b/lib/lxml/tests/test_http_io.py
new file mode 100644
index 00000000..2e62626e
--- /dev/null
+++ b/lib/lxml/tests/test_http_io.py
@@ -0,0 +1,131 @@
+# -*- coding: utf-8 -*-
+
+"""
+Web IO test cases that need Python 2.5+ (wsgiref)
+"""
+
+from __future__ import with_statement
+
+import unittest
+import textwrap
+import os
+import sys
+import gzip
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir)  # needed for Py3
+
+from .common_imports import (
+    etree, HelperTestCase, BytesIO, _bytes)
+from .dummy_http_server import webserver, HTTPRequestCollector
+
+
+class HttpIOTestCase(HelperTestCase):
+    etree = etree
+
+    def _parse_from_http(self, data, code=200, headers=None, parser=None):
+        handler = HTTPRequestCollector(data, code, headers)
+        with webserver(handler) as host_url:
+            tree = self.etree.parse(host_url + 'TEST', parser=parser)
+        self.assertEqual([('/TEST', [])], handler.requests)
+        return tree
+
+    def test_http_client(self):
+        tree = self._parse_from_http(_bytes('<root><a/></root>'))
+        self.assertEqual('root', tree.getroot().tag)
+        self.assertEqual('a', tree.getroot()[0].tag)
+
+    def test_http_client_404(self):
+        # A 404 response has to surface as an IOError from etree.parse();
+        # assertRaises fails the test by itself if nothing is raised.
+        self.assertRaises(
+            IOError,
+            self._parse_from_http,
+            _bytes('<root/>'), code=404)
+
+    def test_http_client_gzip(self):
+        f = BytesIO()
+        gz = gzip.GzipFile(fileobj=f, mode='w', filename='test.xml')
+        gz.write(_bytes('<root><a/></root>'))
+        gz.close()
+        data = f.getvalue()
+        del f, gz
+
+        headers = [('Content-Encoding', 'gzip')]
+        tree = self._parse_from_http(data, headers=headers)
+        self.assertEqual('root', tree.getroot().tag)
+        self.assertEqual('a', tree.getroot()[0].tag)
+
+    def test_parser_input_mix(self):
+        data = _bytes('<root><a/></root>')
+        handler = HTTPRequestCollector(data)
+
+        with webserver(handler) as host_url:
+            tree = self.etree.parse(host_url)
+            root = tree.getroot()
+            self.assertEqual('a', root[0].tag)
+
+            root = self.etree.fromstring(data)
+            self.assertEqual('a', root[0].tag)
+
+            tree = self.etree.parse(host_url)
+            root = tree.getroot()
+            self.assertEqual('a', root[0].tag)
+
+            root = self.etree.fromstring(data)
+            self.assertEqual('a', root[0].tag)
+
+        root = self.etree.fromstring(data)
+        self.assertEqual('a', root[0].tag)
+
+    def test_network_dtd(self):
+        data = [_bytes(textwrap.dedent(s)) for s in [
+            # XML file
+            '''\
+            <?xml version="1.0"?>
+            <!DOCTYPE root SYSTEM "./file.dtd">
+            <root>&myentity;</root>
+            ''',
+            # DTD
+            '<!ENTITY myentity "DEFINED">',
+        ]]
+
+        responses = []
+        def handler(environ, start_response):
+            start_response('200 OK', [])
+            return [responses.pop()]
+
+        with webserver(handler) as host_url:
+            # DTD network loading enabled
+            responses = data[::-1]
+            tree = self.etree.parse(
+                host_url + 'dir/test.xml',
+                parser=self.etree.XMLParser(
+                    load_dtd=True, no_network=False))
+            self.assertFalse(responses)  # all read
+            root = tree.getroot()
+            self.assertEqual('DEFINED', root.text)
+
+            # DTD network loading disabled
+            responses = data[::-1]
+            try:
+                self.etree.parse(
+                    host_url + 'dir/test.xml',
+                    parser=self.etree.XMLParser(
+                        load_dtd=True, no_network=True))
+            except self.etree.XMLSyntaxError:
+                self.assertTrue("myentity" in str(sys.exc_info()[1]))
+            else:
+                self.assertTrue(False)
+            self.assertEqual(1, len(responses))  # DTD not read
+
+
+def test_suite():
+    load = unittest.defaultTestLoader.loadTestsFromTestCase  # makeSuite() is gone in 3.13
+    suite = unittest.TestSuite([load(HttpIOTestCase)])
+    return suite
+
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_import.xsd b/lib/lxml/tests/test_import.xsd
new file mode 100644
index 00000000..3accd055
--- /dev/null
+++ b/lib/lxml/tests/test_import.xsd
@@ -0,0 +1,10 @@
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema"
+	    targetNamespace="http://codespeak.net/lxml/schema/ns1"
+	    xmlns:a="http://codespeak.net/lxml/schema/ns"
+	    >
+  <xsd:import
+	namespace="http://codespeak.net/lxml/schema/ns"
+	schemaLocation="test_inc.xsd" />
+
+  <xsd:element name="x" type="a:AType"/>
+</xsd:schema>
diff --git a/lib/lxml/tests/test_inc.xsd b/lib/lxml/tests/test_inc.xsd
new file mode 100644
index 00000000..0c2cf3d6
--- /dev/null
+++ b/lib/lxml/tests/test_inc.xsd
@@ -0,0 +1,10 @@
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema"
+	    xmlns="http://codespeak.net/lxml/schema/ns"
+	    targetNamespace="http://codespeak.net/lxml/schema/ns">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
diff --git a/lib/lxml/tests/test_incremental_xmlfile.py b/lib/lxml/tests/test_incremental_xmlfile.py
new file mode 100644
index 00000000..2cbfe09b
--- /dev/null
+++ b/lib/lxml/tests/test_incremental_xmlfile.py
@@ -0,0 +1,248 @@
+# -*- coding: utf-8 -*-
+
+"""
+Tests for the incremental XML serialisation API.
+
+Tests require Python 2.5 or later.
+"""
+
+from __future__ import with_statement
+
+import unittest
+import tempfile, os, sys
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, BytesIO
+from common_imports import HelperTestCase
+
+class _XmlFileTestCaseBase(HelperTestCase):
+    _file = None  # to be set by specific subtypes below
+
+    def test_element(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test'):
+                pass
+        self.assertXml('<test></test>')
+
+    def test_element_write_text(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test'):
+                xf.write('toast')
+        self.assertXml('<test>toast</test>')
+
+    def test_element_nested(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test'):
+                with xf.element('toast'):
+                    with xf.element('taste'):
+                        xf.write('conTent')
+        self.assertXml('<test><toast><taste>conTent</taste></toast></test>')
+
+    def test_element_nested_with_text(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test'):
+                xf.write('con')
+                with xf.element('toast'):
+                    xf.write('tent')
+                    with xf.element('taste'):
+                        xf.write('inside')
+                    xf.write('tnet')
+                xf.write('noc')
+        self.assertXml('<test>con<toast>tent<taste>inside</taste>'
+                       'tnet</toast>noc</test>')
+
+    def test_write_Element(self):
+        with etree.xmlfile(self._file) as xf:
+            xf.write(etree.Element('test'))
+        self.assertXml('<test/>')
+
+    def test_write_Element_repeatedly(self):
+        element = etree.Element('test')
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test'):
+                for i in range(100):
+                    xf.write(element)
+
+        tree = self._parse_file()
+        self.assertTrue(tree is not None)
+        self.assertEqual(100, len(tree.getroot()))
+        self.assertEqual(set(['test']), set(el.tag for el in tree.getroot()))
+
+    def test_namespace_nsmap(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('{nsURI}test', nsmap={'x': 'nsURI'}):
+                pass
+        self.assertXml('<x:test xmlns:x="nsURI"></x:test>')
+
+    def test_namespace_nested_nsmap(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test', nsmap={'x': 'nsURI'}):
+                with xf.element('{nsURI}toast'):
+                    pass
+        self.assertXml('<test xmlns:x="nsURI"><x:toast></x:toast></test>')
+
+    def test_anonymous_namespace(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('{nsURI}test'):
+                pass
+        self.assertXml('<ns0:test xmlns:ns0="nsURI"></ns0:test>')
+
+    def test_namespace_nested_anonymous(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test'):
+                with xf.element('{nsURI}toast'):
+                    pass
+        self.assertXml('<test><ns0:toast xmlns:ns0="nsURI"></ns0:toast></test>')
+
+    def test_default_namespace(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('{nsURI}test', nsmap={None: 'nsURI'}):
+                pass
+        self.assertXml('<test xmlns="nsURI"></test>')
+
+    def test_nested_default_namespace(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('{nsURI}test', nsmap={None: 'nsURI'}):
+                with xf.element('{nsURI}toast'):
+                    pass
+        self.assertXml('<test xmlns="nsURI"><toast></toast></test>')
+
+    def test_pi(self):
+        with etree.xmlfile(self._file) as xf:
+            xf.write(etree.ProcessingInstruction('pypi'))
+            with xf.element('test'):
+                pass
+        self.assertXml('<?pypi ?><test></test>')
+
+    def test_comment(self):
+        with etree.xmlfile(self._file) as xf:
+            xf.write(etree.Comment('a comment'))
+            with xf.element('test'):
+                pass
+        self.assertXml('<!--a comment--><test></test>')
+
+    def test_attribute(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test', attrib={'k': 'v'}):
+                pass
+        self.assertXml('<test k="v"></test>')
+
+    def test_escaping(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test'):
+                xf.write('Comments: <!-- text -->\n')
+                xf.write('Entities: &amp;')
+        self.assertXml(
+            '<test>Comments: &lt;!-- text --&gt;\nEntities: &amp;amp;</test>')
+
+    def test_encoding(self):
+        with etree.xmlfile(self._file, encoding='utf16') as xf:
+            with xf.element('test'):
+                xf.write('toast')
+        self.assertXml('<test>toast</test>', encoding='utf16')
+
+    def test_failure_preceding_text(self):
+        try:
+            with etree.xmlfile(self._file) as xf:
+                xf.write('toast')
+        except etree.LxmlSyntaxError:
+            self.assertTrue(True)
+        else:
+            self.assertTrue(False)
+
+    def test_failure_trailing_text(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test'):
+                pass
+            # The 'test' element block has been left at this point; writing
+            # further text must be rejected with LxmlSyntaxError.  assertRaises
+            # fails the test by itself if nothing is raised.
+            self.assertRaises(
+                etree.LxmlSyntaxError,
+                xf.write, 'toast')
+
+    def test_failure_trailing_Element(self):
+        with etree.xmlfile(self._file) as xf:
+            with xf.element('test'):
+                pass
+            # The 'test' element block has been left at this point; writing
+            # another Element must be rejected with LxmlSyntaxError.
+            # assertRaises fails the test by itself if nothing is raised.
+            self.assertRaises(
+                etree.LxmlSyntaxError,
+                xf.write, etree.Element('test'))
+
+    def test_closing_out_of_order_in_error_case(self):
+        cm_exit = None
+        try:
+            with etree.xmlfile(self._file) as xf:
+                x = xf.element('test')
+                cm_exit = x.__exit__
+                x.__enter__()
+                raise ValueError('123')
+        except ValueError:
+            self.assertTrue(cm_exit)
+            try:
+                cm_exit(ValueError, ValueError("huhu"), None)
+            except etree.LxmlSyntaxError:
+                self.assertTrue(True)
+            else:
+                self.assertTrue(False)
+        else:
+            self.assertTrue(False)
+
+    def _read_file(self):
+        self._file.seek(0)
+        return self._file.read()
+
+    def _parse_file(self):
+        self._file.seek(0)
+        return etree.parse(self._file)
+
+    def tearDown(self):
+        self._file.close()
+
+    def assertXml(self, expected, encoding='utf8'):
+        self.assertEqual(self._read_file().decode(encoding), expected)
+
+
+class BytesIOXmlFileTestCase(_XmlFileTestCaseBase):
+    def setUp(self):
+        self._file = BytesIO()
+
+class TempXmlFileTestCase(_XmlFileTestCaseBase):
+    def setUp(self):
+        self._file = tempfile.NamedTemporaryFile()
+
+class SimpleFileLikeXmlFileTestCase(_XmlFileTestCaseBase):
+    class SimpleFileLike(object):
+        def __init__(self, target):
+            self._target = target
+            self.write = target.write
+            self.close = target.close
+
+    def setUp(self):
+        self._target = BytesIO()
+        self._file = self.SimpleFileLike(self._target)
+
+    def _read_file(self):
+        return self._target.getvalue()
+
+    def _parse_file(self):
+        self._target.seek(0)
+        return etree.parse(self._target)
+
+
+def test_suite():
+    load = unittest.defaultTestLoader.loadTestsFromTestCase  # makeSuite() is gone in 3.13
+    suite = unittest.TestSuite([
+        load(BytesIOXmlFileTestCase),
+        load(TempXmlFileTestCase),
+        load(SimpleFileLikeXmlFileTestCase)])
+    return suite
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_io.py b/lib/lxml/tests/test_io.py
new file mode 100644
index 00000000..06199875
--- /dev/null
+++ b/lib/lxml/tests/test_io.py
@@ -0,0 +1,386 @@
+# -*- coding: utf-8 -*-
+
+"""
+IO test cases that apply to both etree and ElementTree
+"""
+
+import unittest
+import tempfile, gzip, os, os.path, sys, gc, shutil
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir)  # needed for Py3
+
+from common_imports import etree, ElementTree, _str, _bytes
+from common_imports import SillyFileLike, LargeFileLike, HelperTestCase
+from common_imports import read_file, write_to_file, BytesIO
+
+if sys.version_info < (2,6):
+    class NamedTemporaryFile(object):  # wrapper used only on Python < 2.6
+        def __init__(self, delete=True, **kwargs):  # 'delete' is accepted but not forwarded
+            self._tmpfile = tempfile.NamedTemporaryFile(**kwargs)
+        def close(self):
+            self._tmpfile.flush()  # flush only; the wrapped file is not closed here
+        def __getattr__(self, name):
+            return getattr(self._tmpfile, name)  # everything else is delegated
+else:
+    NamedTemporaryFile = tempfile.NamedTemporaryFile
+
+
+class _IOTestCaseBase(HelperTestCase):
+    """(c)ElementTree compatibility for IO functions/methods
+    """
+    etree = None
+    
+    def setUp(self):
+        """Setting up a minimal tree
+        """
+        self.root = self.etree.Element('a')
+        self.root_str = self.etree.tostring(self.root)
+        self.tree = self.etree.ElementTree(self.root)
+        self._temp_dir = tempfile.mkdtemp()
+        
+    def tearDown(self):
+        gc.collect()
+        shutil.rmtree(self._temp_dir)
+
+    def getTestFilePath(self, name):
+        return os.path.join(self._temp_dir, name)
+
+    def buildNodes(self, element, children, depth):
+        # Append `children` subelements to `element`, recursing `depth` levels.
+        make_element = self.etree.Element
+        if depth == 0:
+            return
+        for index in range(children):
+            child = make_element('element_%s_%s' % (depth, index))
+            self.buildNodes(child, children, depth - 1)
+            element.append(child)
+
+    def test_tree_io(self):
+        Element = self.etree.Element
+        ElementTree = self.etree.ElementTree
+    
+        element = Element('top')
+        element.text = _str("qwrtioüöä\uAABB")
+        tree = ElementTree(element)
+        self.buildNodes(element, 10, 3)
+        f = open(self.getTestFilePath('testdump.xml'), 'wb')
+        tree.write(f, encoding='UTF-8')
+        f.close()
+        f = open(self.getTestFilePath('testdump.xml'), 'rb')
+        tree = ElementTree(file=f)
+        f.close()
+        f = open(self.getTestFilePath('testdump2.xml'), 'wb')
+        tree.write(f, encoding='UTF-8')
+        f.close()
+        f = open(self.getTestFilePath('testdump.xml'), 'rb')
+        data1 = f.read()
+        f.close()
+        f = open(self.getTestFilePath('testdump2.xml'), 'rb')
+        data2 = f.read()
+        f.close()
+        self.assertEqual(data1, data2)
+
+    def test_tree_io_latin1(self):
+        Element = self.etree.Element
+        ElementTree = self.etree.ElementTree
+
+        element = Element('top')
+        element.text = _str("qwrtioüöäßÃ¡")
+        tree = ElementTree(element)
+        self.buildNodes(element, 10, 3)
+        f = open(self.getTestFilePath('testdump.xml'), 'wb')
+        tree.write(f, encoding='iso-8859-1')
+        f.close()
+        f = open(self.getTestFilePath('testdump.xml'), 'rb')
+        tree = ElementTree(file=f)
+        f.close()
+        f = open(self.getTestFilePath('testdump2.xml'), 'wb')
+        tree.write(f, encoding='iso-8859-1')
+        f.close()
+        f = open(self.getTestFilePath('testdump.xml'), 'rb')
+        data1 = f.read()
+        f.close()
+        f = open(self.getTestFilePath('testdump2.xml'), 'rb')
+        data2 = f.read()
+        f.close()
+        self.assertEqual(data1, data2)
+        
+    def test_write_filename(self):
+        # (c)ElementTree  supports filename strings as write argument
+
+        handle, filename = tempfile.mkstemp(suffix=".xml")
+        try:  # write inside the try so a failure still cleans up the temp file
+            self.tree.write(filename)
+            self.assertEqual(read_file(filename, 'rb').replace(_bytes('\n'), _bytes('')),
+                             self.root_str)
+        finally:
+            os.close(handle)
+            os.remove(filename)
+        
+    def test_write_invalid_filename(self):
+        filename = os.path.join(
+            'hopefullynonexistingpathname',  # directory assumed not to exist
+            'invalid_file.xml')
+        try:
+            self.tree.write(filename)
+        except IOError:
+            pass
+        else:
+            self.assertTrue(
+                False, "writing to an invalid file path should fail")
+
+    def test_module_parse_gzipobject(self):
+        # (c)ElementTree supports gzip instance as parse argument
+        handle, filename = tempfile.mkstemp(suffix=".xml.gz")
+        try:  # fixture is written inside the try so a failure still cleans up
+            f = gzip.open(filename, 'wb')
+            f.write(self.root_str)
+            f.close()
+            f_gz = gzip.open(filename, 'rb')
+            tree = self.etree.parse(f_gz)
+            f_gz.close()
+            self.assertEqual(self.etree.tostring(tree.getroot()), self.root_str)
+        finally:
+            os.close(handle)
+            os.remove(filename)
+
+    def test_class_parse_filename(self):
+        # (c)ElementTree class ElementTree has a 'parse' method that returns
+        # the root of the tree
+
+        # parse from filename
+
+        handle, filename = tempfile.mkstemp(suffix=".xml")
+        try:  # fixture is written inside the try so a failure still cleans up
+            write_to_file(filename, self.root_str, 'wb')
+            tree = self.etree.ElementTree()
+            root = tree.parse(filename)
+            self.assertEqual(self.etree.tostring(root), self.root_str)
+        finally:
+            os.close(handle)
+            os.remove(filename)
+
+    def test_class_parse_filename_remove_previous(self):
+        handle, filename = tempfile.mkstemp(suffix=".xml")
+        try:  # fixture is written inside the try so a failure still cleans up
+            write_to_file(filename, self.root_str, 'wb')
+            tree = self.etree.ElementTree()
+            root = tree.parse(filename)
+            # and now do it again; previous content should still be there
+            root2 = tree.parse(filename)
+            self.assertEqual('a', root.tag)
+            self.assertEqual('a', root2.tag)
+            # now remove all references to root2, and parse again
+            del root2
+            root3 = tree.parse(filename)
+            self.assertEqual('a', root.tag)
+            self.assertEqual('a', root3.tag)
+            # root2's memory should've been freed here
+            # XXX how to check?
+        finally:
+            os.close(handle)
+            os.remove(filename)
+        
+    def test_class_parse_fileobject(self):
+        # (c)ElementTree class ElementTree has a 'parse' method that returns
+        # the root of the tree
+
+        # parse from file object
+        
+        handle, filename = tempfile.mkstemp(suffix=".xml")
+        try:
+            os.write(handle, self.root_str)
+            f = open(filename, 'rb')
+            tree = self.etree.ElementTree()
+            root = tree.parse(f)
+            f.close()
+            self.assertEqual(self.etree.tostring(root), self.root_str)
+        finally:
+            os.close(handle)
+            os.remove(filename)
+
+    def test_class_parse_unamed_fileobject(self):
+        # the 'parse' method of an ElementTree instance returns the root
+        # element of the parsed document
+
+        # here the source is an unnamed file-like object (SillyFileLike)
+        f = SillyFileLike()
+        root = self.etree.ElementTree().parse(f)
+        self.assertTrue(root.tag.endswith('foo'))
+
+    def test_module_parse_large_fileobject(self):
+        # module-level parse() from an unnamed file-like object (LargeFileLike)
+        f = LargeFileLike()
+        tree = self.etree.parse(f)
+        root = tree.getroot()
+        self.assertTrue(root.tag.endswith('root'))
+
+    def test_module_parse_fileobject_error(self):  # read() errors must propagate
+        class LocalError(Exception):
+            pass
+        class TestFile:
+            def read(*args):  # fails on the very first read request
+                raise LocalError
+        f = TestFile()
+        self.assertRaises(LocalError, self.etree.parse, f)  # not swallowed or replaced
+
+    def test_module_parse_fileobject_late_error(self):  # error raised after some data
+        class LocalError(Exception):
+            pass
+        class TestFile:
+            data = '<root>test</'  # ends in the middle of the closing tag
+            try:
+                next_char = iter(data).next  # Python 2 iterator method
+            except AttributeError:
+                # Python 3
+                next_char = iter(data).__next__
+            counter = 0  # number of single-character reads attempted
+            def read(self, amount=None):
+                if amount is None:
+                    while True:  # loop only ends when LocalError escapes
+                        self.read(1)
+                else:
+                    try:
+                        self.counter += 1
+                        return _bytes(self.next_char())  # one character per call
+                    except StopIteration:
+                        raise LocalError  # data exhausted
+        f = TestFile()
+        self.assertRaises(LocalError, self.etree.parse, f)
+        self.assertEqual(f.counter, len(f.data)+1)  # all characters plus the failing read
+
+    def test_module_parse_fileobject_type_error(self):  # read() returns a non-string
+        class TestFile:
+            def read(*args):
+                return 1  # an int instead of bytes or text
+        f = TestFile()
+
+        try:
+            expect_exc = (TypeError, self.etree.ParseError)  # either one is accepted
+        except AttributeError:
+            expect_exc = TypeError  # this etree module has no ParseError attribute
+        self.assertRaises(expect_exc, self.etree.parse, f)
+
+    def test_etree_parse_io_error(self):
+        # a missing file must raise IOError, with and without non-ASCII characters in the path
+        dirnameEN = _str('Directory')
+        dirnameRU = _str('ÐšÐ°Ñ‚Ð°Ð»Ð¾Ð³')
+        filename = _str('nosuchfile.xml')  # never created in either directory
+        dn = tempfile.mkdtemp(prefix=dirnameEN)
+        try:
+            self.assertRaises(IOError, self.etree.parse, os.path.join(dn, filename))
+        finally:
+            os.rmdir(dn)
+        dn = tempfile.mkdtemp(prefix=dirnameRU)  # same check below the non-ASCII prefix
+        try:
+            self.assertRaises(IOError, self.etree.parse, os.path.join(dn, filename))
+        finally:
+            os.rmdir(dn)
+
+    def test_parse_utf8_bom(self):  # parse() of a file that starts with a UTF-8 BOM
+        utext = _str('Søk på nettet')
+        uxml = '<?xml version="1.0" encoding="UTF-8"?><p>%s</p>' % utext
+        bom = _bytes('\\xEF\\xBB\\xBF').decode(
+            "unicode_escape").encode("latin1")
+        self.assertEqual(3, len(bom))  # the escapes became three raw bytes
+        f = NamedTemporaryFile(delete=False)  # kept after close(); unlinked below
+        try:
+            try:
+                f.write(bom)
+                f.write(uxml.encode("utf-8"))
+            finally:
+                f.close()
+            tree = self.etree.parse(f.name)  # parse by filename once the file is closed
+        finally:
+            os.unlink(f.name)
+        self.assertEqual(utext, tree.getroot().text)  # text equals the original string
+
+    def test_iterparse_utf8_bom(self):  # iterparse() of a file that starts with a UTF-8 BOM
+        utext = _str('Søk på nettet')
+        uxml = '<?xml version="1.0" encoding="UTF-8"?><p>%s</p>' % utext
+        bom = _bytes('\\xEF\\xBB\\xBF').decode(
+            "unicode_escape").encode("latin1")
+        self.assertEqual(3, len(bom))  # the escapes became three raw bytes
+        f = NamedTemporaryFile(delete=False)  # kept after close(); unlinked below
+        try:
+            try:
+                f.write(bom)
+                f.write(uxml.encode("utf-8"))
+            finally:
+                f.close()
+            elements = [el for _, el in self.etree.iterparse(f.name)]  # event names dropped
+            self.assertEqual(1, len(elements))  # exactly one element was reported: <p>
+            root = elements[0]
+        finally:
+            os.unlink(f.name)
+        self.assertEqual(utext, root.text)
+
+    def test_iterparse_utf16_bom(self):  # iterparse() of a UTF-16 file with a BOM
+        utext = _str('Søk på nettet')
+        uxml = '<?xml version="1.0" encoding="UTF-16"?><p>%s</p>' % utext
+        boms = _bytes('\\xFE\\xFF \\xFF\\xFE').decode(
+            "unicode_escape").encode("latin1")
+        self.assertEqual(5, len(boms))  # two 2-byte BOMs separated by one space
+        xml = uxml.encode("utf-16")
+        self.assertTrue(xml[:2] in boms, repr(xml[:2]))  # encoded data starts with a BOM
+
+        f = NamedTemporaryFile(delete=False)  # kept after close(); unlinked below
+        try:
+            try:
+                f.write(xml)
+            finally:
+                f.close()
+            elements = [el for _, el in self.etree.iterparse(f.name)]  # event names dropped
+            self.assertEqual(1, len(elements))  # exactly one element was reported: <p>
+            root = elements[0]
+        finally:
+            os.unlink(f.name)
+        self.assertEqual(utext, root.text)
+
+
+class ETreeIOTestCase(_IOTestCaseBase):  # shared I/O tests plus one write() test
+    etree = etree  # module under test, read by the tests as self.etree
+
+    def test_write_compressed_text(self):  # write(method='text') with compression
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        ElementTree = self.etree.ElementTree
+        text = _str("qwrtioüöä")
+
+        root = Element('root')
+        root.text = text
+        child = SubElement(root, 'sub')
+        child.text = 'TEXT'
+        child.tail = 'TAIL'
+        SubElement(root, 'sub').text = text
+
+        tree = ElementTree(root)
+        out = BytesIO()
+        tree.write(out, method='text', encoding='utf8', compression=9)
+        out.seek(0)  # rewind so the written bytes can be read back
+
+        f = gzip.GzipFile(fileobj=out)  # the output must be readable as gzip data
+        try:
+            result = f.read().decode('utf8')
+        finally:
+            f.close()
+        self.assertEqual(text+'TEXTTAIL'+text, result)  # text and tails in document order
+
+
+if ElementTree:  # presumably falsy when ElementTree is unavailable - TODO confirm at its import
+    class ElementTreeIOTestCase(_IOTestCaseBase):  # same shared tests, other module
+        etree = ElementTree  # module under test, read by the tests as self.etree
+
+
+def test_suite():  # builds and returns the suite of I/O test cases in this module
+    suite = unittest.TestSuite()
+    suite.addTests([unittest.makeSuite(ETreeIOTestCase)])
+    if ElementTree:  # the second test case class only exists under this condition
+        suite.addTests([unittest.makeSuite(ElementTreeIOTestCase)])
+    return suite
+
+
+if __name__ == '__main__':  # running this file directly only prints a usage hint
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_isoschematron.py b/lib/lxml/tests/test_isoschematron.py
new file mode 100644
index 00000000..c865ef85
--- /dev/null
+++ b/lib/lxml/tests/test_isoschematron.py
@@ -0,0 +1,851 @@
+# -*- coding: utf-8 -*-
+
+"""
+Test cases related to ISO-Schematron parsing and validation
+"""
+
+import unittest, sys, os.path
+from lxml import isoschematron
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, HelperTestCase, fileInTestDir
+from common_imports import doctest, make_doctest
+
+class ETreeISOSchematronTestCase(HelperTestCase):
+    def test_schematron(self):  # basic validate() check with an open and a closed pattern
+        tree_valid = self.parse('<AAA><BBB/><CCC/></AAA>')
+        tree_invalid = self.parse('<AAA><BBB/><CCC/><DDD/></AAA>')
+        schema = self.parse('''\
+<schema xmlns="http://purl.oclc.org/dsdl/schematron" >
+    <pattern id="OpenModel">
+        <title>Open Model</title>
+        <rule context="AAA">
+            <assert test="BBB"> BBB element is not present</assert>
+            <assert test="CCC"> CCC element is not present</assert>
+        </rule>
+    </pattern>
+    <pattern id="ClosedModel">
+        <title>Closed model"</title>
+        <rule context="AAA">
+            <assert test="BBB"> BBB element is not present</assert>
+            <assert test="CCC"> CCC element is not present</assert>
+            <assert test="count(BBB|CCC) = count (*)">There is an extra element</assert>
+        </rule>
+    </pattern>
+</schema>
+''')
+        schema = isoschematron.Schematron(schema)  # rebinds the name: parsed schema -> validator
+        self.assertTrue(schema.validate(tree_valid))
+        self.assertTrue(not schema.validate(tree_invalid))  # <DDD/> violates the count() assert
+
+    def test_schematron_elementtree_error(self):  # ElementTree() built without a root
+        self.assertRaises(ValueError, isoschematron.Schematron, etree.ElementTree())
+
+    # an empty pattern is valid in iso schematron
+    def test_schematron_empty_pattern(self):  # pattern holding only a title, no rules
+        schema = self.parse('''\
+<schema xmlns="http://purl.oclc.org/dsdl/schematron" >
+    <pattern id="OpenModel">
+        <title>Open model</title>
+    </pattern>
+</schema>
+''')
+        schema = isoschematron.Schematron(schema)  # must not raise
+        self.assertTrue(schema)  # and the resulting validator object is truthy
+        
+    def test_schematron_invalid_schema_empty(self):  # <schema/> without any child element
+        schema = self.parse('''\
+<schema xmlns="http://purl.oclc.org/dsdl/schematron" />
+''')
+        self.assertRaises(etree.SchematronParseError,  # raised by the constructor call
+                          isoschematron.Schematron, schema)
+
+    def test_schematron_invalid_schema_namespace(self):  # root is not in the schematron namespace
+        schema = self.parse('''\
+<schema xmlns="mynamespace" />
+''')
+        self.assertRaises(etree.SchematronParseError,  # raised by the constructor call
+                          isoschematron.Schematron, schema)
+
+    def test_schematron_from_tree(self):  # constructor fed with the self.parse() result
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        schematron = isoschematron.Schematron(schema)  # the parsed object is passed as-is
+        self.assertTrue(isinstance(schematron, isoschematron.Schematron))
+
+    def test_schematron_from_element(self):  # constructor fed with a root element
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        schematron = isoschematron.Schematron(schema.getroot())  # getroot() result, not the tree
+        self.assertTrue(isinstance(schematron, isoschematron.Schematron))
+
+    def test_schematron_from_file(self):  # constructor fed through the file= keyword
+        schematron = isoschematron.Schematron(file=fileInTestDir('test.sch'))
+        self.assertTrue(isinstance(schematron, isoschematron.Schematron))
+
+    def test_schematron_call(self):  # validation by calling the validator object
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        tree_valid = self.parse('''\
+<message>
+  <number_of_entries>0</number_of_entries>
+  <entries>
+  </entries>
+</message>
+''')
+        tree_invalid = self.parse('''\
+<message>
+  <number_of_entries>3</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        schematron = isoschematron.Schematron(schema)
+        self.assertTrue(schematron(tree_valid), schematron.error_log)  # log shown on failure
+        valid = schematron(tree_invalid)  # document declares 3 entries but contains 2
+        self.assertTrue(not valid)
+
+    def test_schematron_validate(self):  # validation through the validate() method
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        tree_valid = self.parse('''\
+<message>
+  <number_of_entries>0</number_of_entries>
+  <entries>
+  </entries>
+</message>
+''')
+        tree_invalid = self.parse('''\
+<message>
+  <number_of_entries>3</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        schematron = isoschematron.Schematron(schema)
+        self.assertTrue(schematron.validate(tree_valid), schematron.error_log)  # log shown on failure
+        valid = schematron.validate(tree_invalid)  # document declares 3 entries but contains 2
+        self.assertTrue(not valid)
+
+    def test_schematron_assertValid(self):  # assertValid() raises for an invalid document
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        tree_valid = self.parse('''\
+<message>
+  <number_of_entries>0</number_of_entries>
+  <entries>
+  </entries>
+</message>
+''')
+        tree_invalid = self.parse('''\
+<message>
+  <number_of_entries>3</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        schematron = isoschematron.Schematron(schema)
+        self.assertTrue(schematron(tree_valid), schematron.error_log)  # log shown on failure
+        self.assertRaises(etree.DocumentInvalid, schematron.assertValid,  # 3 declared, 2 present
+                          tree_invalid)
+
+    def test_schematron_error_log(self):  # one failed assert gives one error_log entry
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        tree_valid = self.parse('''\
+<message>
+  <number_of_entries>0</number_of_entries>
+  <entries>
+  </entries>
+</message>
+''')
+        tree_invalid = self.parse('''\
+<message>
+  <number_of_entries>3</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        schematron = isoschematron.Schematron(schema)
+        self.assertTrue(schematron(tree_valid), schematron.error_log)  # log shown on failure
+        valid = schematron(tree_invalid)  # document declares 3 entries but contains 2
+        self.assertTrue(not valid)
+        self.assertEqual(len(schematron.error_log), 1,  # the schema has a single assert
+                          'expected single error: %s (%s errors)' %
+                          (schematron.error_log, len(schematron.error_log)))
+
+    def test_schematron_result_report(self):  # store_report switches validation_report on/off
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        tree_valid = self.parse('''\
+<message>
+  <number_of_entries>0</number_of_entries>
+  <entries>
+  </entries>
+</message>
+''')
+        tree_invalid = self.parse('''\
+<message>
+  <number_of_entries>3</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        schematron = isoschematron.Schematron(schema, store_report=True)  # report requested
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        valid = schematron(tree_invalid)  # the report is inspected after this failing run
+        self.assertTrue(not valid)
+        self.assertTrue(
+            isinstance(schematron.validation_report, etree._ElementTree),
+            'expected a validation report result tree, got: %s' %
+            (schematron.validation_report))
+
+        schematron = isoschematron.Schematron(schema, store_report=False)  # report disabled
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        valid = schematron(tree_invalid)  # still reported invalid, but nothing is kept
+        self.assertTrue(not valid)
+        self.assertTrue(schematron.validation_report is None,
+            'validation reporting switched off, still: %s' %
+            (schematron.validation_report))
+
+    def test_schematron_store_schematron(self):  # store_schematron controls the .schematron attribute
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        schematron = isoschematron.Schematron(schema)
+        self.assertTrue(schematron.schematron is None)  # default: the schema tree is not stored
+
+        schematron = isoschematron.Schematron(schema, store_schematron=True)
+        self.assertTrue(isinstance(schematron.schematron, etree._ElementTree),
+                     'expected schematron schema to be stored')
+
+    def test_schematron_store_xslt(self):  # store_xslt controls the .validator_xslt attribute
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        schematron = isoschematron.Schematron(schema)
+        self.assertTrue(schematron.validator_xslt is None)  # default: nothing is stored
+
+        schematron = isoschematron.Schematron(schema, store_xslt=True)  # now it must be kept
+        self.assertTrue(isinstance(schematron.validator_xslt, etree._ElementTree),
+                     'expected validator xslt to be stored')
+       
+    def test_schematron_abstract(self):  # abstract patterns instantiated through is-a/param
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:title>iso schematron validation</sch:title>
+  <sch:ns uri="http://www.w3.org/2001/XMLSchema-instance" prefix="xsi"/>
+  <sch:ns uri="http://codespeak.net/lxml/objectify/pytype" prefix="py"/>
+
+  <!-- of course, these only really make sense when combined with a schema that
+       ensures datatype xs:dateTime -->
+       
+  <sch:pattern abstract="true" id="abstract.dateTime.tz_utc">
+    <sch:rule context="$datetime">
+      <sch:let name="tz" value="concat(substring-after(substring-after(./text(), 'T'), '+'), substring-after(substring-after(./text(), 'T'), '-'))"/>
+      <sch:let name="lastchar" value="substring(./text(), string-length(./text()))"/>
+      <sch:assert test="$lastchar='Z' or $tz='00:00'">[ERROR] element (<sch:value-of select="name(.)"/>) dateTime value (<sch:value-of select="."/>) is not qualified as UTC (tz: <sch:value-of select="$tz"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+
+  <sch:pattern abstract="true" id="abstract.dateTime.tz_utc_nillable">
+    <sch:rule context="$datetime">
+      <sch:let name="tz" value="concat(substring-after(substring-after(./text(), 'T'), '+'), substring-after(substring-after(./text(), 'T'), '-'))"/>
+      <sch:let name="lastchar" value="substring(./text(), string-length(./text()))"/>
+      <sch:assert test="@xsi:nil='true'  or ($lastchar='Z' or $tz='00:00')">[ERROR] element (<sch:value-of select="name(.)"/>) dateTime value (<sch:value-of select="."/>) is not qualified as UTC (tz: <sch:value-of select="$tz"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+
+  <sch:pattern is-a="abstract.dateTime.tz_utc" id="datetime" >
+    <sch:param name="datetime" value="datetime"/>
+  </sch:pattern>
+
+  <sch:pattern is-a="abstract.dateTime.tz_utc_nillable" id="nillableDatetime">
+    <sch:param name="datetime" value="nillableDatetime"/>
+  </sch:pattern>
+
+</sch:schema>
+''')
+        valid_trees = [  # UTC spelled as 'Z', '+00:00' or '-00:00', or a nil nillableDatetime
+            self.parse('''\
+<root xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+  <datetime>2009-12-10T15:21:00Z</datetime>
+  <nillableDatetime xsi:nil="true"/>
+</root>
+'''),
+            self.parse('''\
+<root xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+  <datetime>2009-12-10T15:21:00Z</datetime>
+  <nillableDatetime>2009-12-10T15:21:00Z</nillableDatetime>
+</root>
+'''),
+            self.parse('''\
+<root xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+  <datetime>2009-12-10T15:21:00+00:00</datetime>
+  <nillableDatetime>2009-12-10T15:21:00-00:00</nillableDatetime>
+</root>
+'''),
+            ]
+                       
+        schematron = isoschematron.Schematron(schema)  # one validator for all documents below
+        for tree_valid in valid_trees:
+            self.assertTrue(schematron(tree_valid), schematron.error_log)
+
+        tree_invalid = self.parse('''\
+<root xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+  <datetime>2009-12-10T16:21:00+01:00</datetime>
+  <nillableDatetime>2009-12-10T16:21:00+01:00</nillableDatetime>
+</root>
+''')
+        expected = 2  # both elements carry a +01:00 offset
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected,
+            'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+
+        tree_invalid = self.parse('''\
+<root xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+  <datetime xsi:nil="true"/>
+  <nillableDatetime>2009-12-10T16:21:00Z</nillableDatetime>
+</root>
+''')
+        expected = 1  # only <datetime> fails: its assert has no xsi:nil alternative
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected,
+            'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+
+    def test_schematron_phases(self):  # phase selected through compile_params={'phase': ...}
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:title>iso schematron validation</sch:title>
+  <sch:ns uri="http://www.w3.org/2001/XMLSchema-instance" prefix="xsi"/>
+  <sch:ns uri="http://codespeak.net/lxml/objectify/pytype" prefix="py"/>
+
+  <sch:phase id="mandatory">
+    <sch:active pattern="number_of_entries"/>
+  </sch:phase>
+
+  <sch:phase id="datetime_checks">
+    <sch:active pattern="datetime"/>
+    <sch:active pattern="nillableDatetime"/>
+  </sch:phase>
+
+  <sch:phase id="full">
+    <sch:active pattern="number_of_entries"/>
+    <sch:active pattern="datetime"/>
+    <sch:active pattern="nillableDatetime"/>
+  </sch:phase>
+
+  <!-- of course, these only really make sense when combined with a schema that
+       ensures datatype xs:dateTime -->
+  
+  <sch:pattern abstract="true" id="abstract.dateTime.tz_utc">
+    <sch:rule context="$datetime">
+      <sch:let name="tz" value="concat(substring-after(substring-after(./text(), 'T'), '+'), substring-after(substring-after(./text(), 'T'), '-'))"/>
+      <sch:let name="lastchar" value="substring(./text(), string-length(./text()))"/>
+      <sch:assert test="$lastchar='Z' or $tz='00:00'">[ERROR] element (<sch:value-of select="name(.)"/>) dateTime value (<sch:value-of select="."/>) is not qualified as UTC (tz: <sch:value-of select="$tz"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+
+  <sch:pattern abstract="true" id="abstract.dateTime.tz_utc_nillable">
+    <sch:rule context="$datetime">
+      <sch:let name="tz" value="concat(substring-after(substring-after(./text(), 'T'), '+'), substring-after(substring-after(./text(), 'T'), '-'))"/>
+      <sch:let name="lastchar" value="substring(./text(), string-length(./text()))"/>
+      <sch:assert test="@xsi:nil='true'  or ($lastchar='Z' or $tz='00:00')">[ERROR] element (<sch:value-of select="name(.)"/>) dateTime value (<sch:value-of select="."/>) is not qualified as UTC (tz: <sch:value-of select="$tz"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries test</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+
+  <sch:pattern  id="datetime" is-a="abstract.dateTime.tz_utc">
+    <sch:param name="datetime" value="datetime"/>
+  </sch:pattern>
+
+  <sch:pattern  id="nillableDatetime" is-a="abstract.dateTime.tz_utc_nillable">
+    <sch:param name="datetime" value="nillableDatetime"/>
+  </sch:pattern>
+
+</sch:schema>
+''')
+        tree_valid = self.parse('''\
+<message xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+  <datetime>2009-12-10T15:21:00Z</datetime>
+  <nillableDatetime xsi:nil="true"/>
+  <number_of_entries>0</number_of_entries>
+  <entries>
+  </entries>
+</message>
+''')
+        tree_invalid = self.parse('''\
+<message>
+  <datetime>2009-12-10T16:21:00+01:00</datetime>
+  <nillableDatetime>2009-12-10T16:21:00+01:00</nillableDatetime>
+  <number_of_entries>3</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        # no phase given (default phase #ALL): all three concrete patterns are checked
+        schematron = isoschematron.Schematron(schema)
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        expected = 3
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected,
+            'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+
+        # phase 'mandatory': only the number_of_entries pattern is active
+        schematron = isoschematron.Schematron(
+            schema, compile_params={'phase': 'mandatory'})
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        expected = 1
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected,
+            'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+
+        # phase 'datetime_checks': only the two dateTime patterns are active
+        schematron = isoschematron.Schematron(
+            schema, compile_params={'phase': 'datetime_checks'})
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        expected = 2
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected,
+            'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+
+        # phase 'full': names all three patterns, so the count matches the default run
+        schematron = isoschematron.Schematron(
+            schema, compile_params={'phase': 'full'})
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        expected = 3
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected,
+            'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+                                      
+    def test_schematron_phases_kwarg(self):  # phase selected through the phase= keyword
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:title>iso schematron validation</sch:title>
+  <sch:ns uri="http://www.w3.org/2001/XMLSchema-instance" prefix="xsi"/>
+  <sch:ns uri="http://codespeak.net/lxml/objectify/pytype" prefix="py"/>
+
+  <sch:phase id="mandatory">
+    <sch:active pattern="number_of_entries"/>
+  </sch:phase>
+
+  <sch:phase id="datetime_checks">
+    <sch:active pattern="datetime"/>
+    <sch:active pattern="nillableDatetime"/>
+  </sch:phase>
+
+  <sch:phase id="full">
+    <sch:active pattern="number_of_entries"/>
+    <sch:active pattern="datetime"/>
+    <sch:active pattern="nillableDatetime"/>
+  </sch:phase>
+
+  <!-- of course, these only really make sense when combined with a schema that
+       ensures datatype xs:dateTime -->
+  
+  <sch:pattern abstract="true" id="abstract.dateTime.tz_utc">
+    <sch:rule context="$datetime">
+      <sch:let name="tz" value="concat(substring-after(substring-after(./text(), 'T'), '+'), substring-after(substring-after(./text(), 'T'), '-'))"/>
+      <sch:let name="lastchar" value="substring(./text(), string-length(./text()))"/>
+      <sch:assert test="$lastchar='Z' or $tz='00:00'">[ERROR] element (<sch:value-of select="name(.)"/>) dateTime value (<sch:value-of select="."/>) is not qualified as UTC (tz: <sch:value-of select="$tz"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+
+  <sch:pattern abstract="true" id="abstract.dateTime.tz_utc_nillable">
+    <sch:rule context="$datetime">
+      <sch:let name="tz" value="concat(substring-after(substring-after(./text(), 'T'), '+'), substring-after(substring-after(./text(), 'T'), '-'))"/>
+      <sch:let name="lastchar" value="substring(./text(), string-length(./text()))"/>
+      <sch:assert test="@xsi:nil='true'  or ($lastchar='Z' or $tz='00:00')">[ERROR] element (<sch:value-of select="name(.)"/>) dateTime value (<sch:value-of select="."/>) is not qualified as UTC (tz: <sch:value-of select="$tz"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries test</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+
+  <sch:pattern  id="datetime" is-a="abstract.dateTime.tz_utc">
+    <sch:param name="datetime" value="datetime"/>
+  </sch:pattern>
+
+  <sch:pattern  id="nillableDatetime" is-a="abstract.dateTime.tz_utc_nillable">
+    <sch:param name="datetime" value="nillableDatetime"/>
+  </sch:pattern>
+
+</sch:schema>
+''')
+        tree_valid = self.parse('''\
+<message xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+  <datetime>2009-12-10T15:21:00Z</datetime>
+  <nillableDatetime xsi:nil="true"/>
+  <number_of_entries>0</number_of_entries>
+  <entries>
+  </entries>
+</message>
+''')
+        tree_invalid = self.parse('''\
+<message>
+  <datetime>2009-12-10T16:21:00+01:00</datetime>
+  <nillableDatetime>2009-12-10T16:21:00+01:00</nillableDatetime>
+  <number_of_entries>3</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        # no phase given (default phase #ALL): all three concrete patterns are checked
+        schematron = isoschematron.Schematron(schema)
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        expected = 3
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected,
+            'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+
+        # phase 'mandatory': only the number_of_entries pattern is active
+        schematron = isoschematron.Schematron(schema, phase='mandatory')
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        expected = 1
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected,
+            'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+
+        # phase 'datetime_checks': only the two dateTime patterns are active
+        schematron = isoschematron.Schematron(schema, phase='datetime_checks')
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        expected = 2
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected,
+            'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+
+        # phase 'full': names all three patterns, so the count matches the default run
+        schematron = isoschematron.Schematron(schema, phase='full')
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        expected = 3
+        valid = schematron(tree_invalid)
+        self.assertTrue(not valid)
+        self.assertEqual(
+            len(schematron.error_log), expected, 'expected %s errors: %s (%s errors)' %
+            (expected, schematron.error_log, len(schematron.error_log)))
+                                      
+    def test_schematron_xmlschema_embedded(self):  # rules live in xs:appinfo
+        schema = self.parse('''\
+<xs:schema xmlns:xs="http://www.w3.org/2001/XMLSchema"
+    xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+    <xs:element name="message">
+        <xs:complexType>
+            <xs:sequence>
+                <xs:element name="number_of_entries" type="xs:positiveInteger">
+                    <xs:annotation>
+                        <xs:appinfo>
+                            <sch:pattern id="number_of_entries">
+                                <sch:title>mandatory number_of_entries tests</sch:title>
+                                <sch:rule context="number_of_entries">
+                                    <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+                                </sch:rule>
+                            </sch:pattern>
+                        </xs:appinfo>
+                    </xs:annotation>
+                </xs:element>
+                <xs:element name="entries">
+                    <xs:complexType>
+                        <xs:sequence>
+                            <xs:element name="entry" type="xs:string" minOccurs="0" maxOccurs="unbounded"/>
+                        </xs:sequence>
+                    </xs:complexType>
+                </xs:element>
+            </xs:sequence>
+        </xs:complexType>
+    </xs:element>
+</xs:schema>
+''')
+        tree_valid = self.parse('''\
+<message>
+  <number_of_entries>2</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        tree_invalid = self.parse('''\
+<message>
+  <number_of_entries>1</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        xmlschema = etree.XMLSchema(schema)
+        schematron = isoschematron.Schematron(schema)
+        # the valid document must satisfy both the XML Schema and the embedded rules
+        self.assertTrue(xmlschema(tree_valid), xmlschema.error_log)
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        # the invalid document is still XML Schema-valid; only Schematron rejects it
+        self.assertTrue(xmlschema(tree_invalid), xmlschema.error_log)
+        self.assertFalse(schematron(tree_invalid))
+
+    def test_schematron_relaxng_embedded(self):  # rules mixed into the grammar
+        schema = self.parse('''\
+<grammar xmlns="http://relaxng.org/ns/structure/1.0"
+  xmlns:sch="http://purl.oclc.org/dsdl/schematron"
+  datatypeLibrary="http://www.w3.org/2001/XMLSchema-datatypes">
+  <start>
+    <ref name="message"/>
+  </start>
+  <define name="message">
+    <element name="message">
+      <element name="number_of_entries">
+        <!-- RelaxNG can be mixed freely with stuff from other namespaces -->
+        <sch:pattern id="number_of_entries">
+          <sch:title>mandatory number_of_entries tests</sch:title>
+          <sch:rule context="number_of_entries">
+            <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+          </sch:rule>
+        </sch:pattern>
+        <data type="positiveInteger"/>
+      </element>
+      <element name="entries">
+        <zeroOrMore>
+          <element name="entry"><data type="string"/></element>
+        </zeroOrMore>
+      </element>
+    </element>
+  </define>
+</grammar>
+''')
+        tree_valid = self.parse('''\
+<message>
+  <number_of_entries>2</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        tree_invalid = self.parse('''\
+<message>
+  <number_of_entries>1</number_of_entries>
+  <entries>
+    <entry>Entry 1</entry>
+    <entry>Entry 2</entry>
+  </entries>
+</message>
+''')
+        relaxng = etree.RelaxNG(schema)
+        schematron = isoschematron.Schematron(schema)
+        # the valid document must satisfy both the grammar and the embedded rules
+        self.assertTrue(relaxng(tree_valid), relaxng.error_log)
+        self.assertTrue(schematron(tree_valid), schematron.error_log)
+        # the invalid document still matches the grammar; only Schematron rejects it
+        self.assertTrue(relaxng(tree_invalid), relaxng.error_log)
+        self.assertFalse(schematron(tree_invalid))
+
+    def test_schematron_invalid_args(self):
+        schema = self.parse('''\
+<sch:schema xmlns:sch="http://purl.oclc.org/dsdl/schematron">
+  <sch:pattern id="number_of_entries">
+    <sch:title>mandatory number_of_entries tests</sch:title>
+    <sch:rule context="number_of_entries">
+      <sch:assert test="text()=count(../entries/entry)">[ERROR] number_of_entries (<sch:value-of select="."/>) must equal the number of entries/entry elements (<sch:value-of select="count(../entries/entry)"/>)</sch:assert>
+    </sch:rule>
+  </sch:pattern>
+</sch:schema>
+''')
+        # 'phase' inside compile_params must raise TypeError (phase=... as a keyword would not)
+        self.assertRaises(TypeError, isoschematron.Schematron, schema,
+                          compile_params={'phase': None})
+
+    def test_schematron_customization(self):
+        class MySchematron(isoschematron.Schematron):
+            def _extract(self, root):
+                schematron = (root.xpath(
+                    '//sch:schema',
+                    namespaces={'sch': "http://purl.oclc.org/dsdl/schematron"})
+                    or [None])[0]
+                return schematron
+            # the two step overrides below raise so the test can tell they ran
+            def _include(self, schematron, **kwargs):
+                raise RuntimeError('inclusion unsupported')
+            # (same trick for the expansion step)
+            def _expand(self, schematron, **kwargs):
+                raise RuntimeError('expansion unsupported')
+            # no errors iff exactly one successful-report is flagged "critical"
+            def _validation_errors(self, validationReport):
+                valid = etree.XPath(
+                    'count(//svrl:successful-report[@flag="critical"])=1',
+                    namespaces={'svrl': isoschematron.SVRL_NS})(
+                    validationReport)
+                if valid:
+                    return []
+                error = etree.Element('Error')
+                error.text = 'missing critical condition report'
+                return [error]
+
+        tree_valid = self.parse('<AAA><BBB/><CCC/></AAA>')
+        tree_invalid = self.parse('<AAA><BBB/><CCC/><DDD/></AAA>')
+        schema = self.parse('''\
+<schema xmlns="http://www.example.org/yet/another/schema/dialect">
+  <schema xmlns="http://purl.oclc.org/dsdl/schematron" >
+    <pattern id="OpenModel">
+      <title>Open Model</title>
+      <rule context="AAA">
+        <report test="BBB" flag="info">BBB element must be present</report>
+        <report test="CCC" flag="info">CCC element must be present</report>
+      </rule>
+    </pattern>
+    <pattern id="ClosedModel">
+      <title>Closed model"</title>
+      <rule context="AAA">
+        <report test="BBB" flag="info">BBB element must be present</report>
+        <report test="CCC" flag="info">CCC element must be present</report>
+        <report test="count(BBB|CCC) = count(*)" flag="critical">Only BBB and CCC children must be present</report>
+      </rule>
+    </pattern>
+  </schema>
+</schema>
+''')
+        # check if overridden _include is run
+        self.assertRaises(RuntimeError, MySchematron, schema, store_report=True)
+        # check if overridden _expand is run
+        self.assertRaises(RuntimeError, MySchematron, schema, store_report=True,
+                          include=False)
+        # with both steps switched off, construction succeeds and validation runs
+        schema = MySchematron(schema, store_report=True, include=False,
+                              expand=False)
+        self.assertTrue(schema.validate(tree_valid))
+        self.assertTrue(not schema.validate(tree_invalid))
+
+    #TODO: test xslt parameters for inclusion, expand & compile steps (?)
+
+
+def test_suite():  # test case + doctests of doc/validation.txt
+    # unittest.makeSuite() was removed in Python 3.13; ask the loader directly
+    load = unittest.defaultTestLoader.loadTestsFromTestCase
+    tests = load(ETreeISOSchematronTestCase)
+    doctests = make_doctest('../../../doc/validation.txt')
+    return unittest.TestSuite([tests, doctests])
+
+if __name__ == '__main__':  # running the module directly only prints a usage hint
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_nsclasses.py b/lib/lxml/tests/test_nsclasses.py
new file mode 100644
index 00000000..b8b41063
--- /dev/null
+++ b/lib/lxml/tests/test_nsclasses.py
@@ -0,0 +1,215 @@
+# -*- coding: utf-8 -*-
+
+"""
+Test cases related to namespace implementation classes and the
+namespace registry mechanism
+"""
+
+import unittest, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, HelperTestCase, _bytes
+from common_imports import doctest, make_doctest
+
+class ETreeNamespaceClassesTestCase(HelperTestCase):
+    """Tests for per-namespace element classes (ElementNamespaceClassLookup)."""
+    class default_class(etree.ElementBase):
+        pass
+    class maeh_class(etree.ElementBase):
+        def maeh(self):
+            return 'maeh'
+    class bluff_class(etree.ElementBase):
+        def bluff(self):
+            return 'bluff'
+
+    def setUp(self):
+        super(ETreeNamespaceClassesTestCase, self).setUp()
+        # make a parser with a namespace class lookup the default parser
+        ns_lookup = etree.ElementNamespaceClassLookup()
+        ns_parser = etree.XMLParser()
+        ns_parser.set_element_class_lookup(ns_lookup)
+        etree.set_default_parser(ns_parser)
+        self.Namespace = ns_lookup.get_namespace
+
+    def tearDown(self):
+        # no argument: presumably puts lxml's own default parser back
+        etree.set_default_parser()
+        del self.Namespace
+        super(ETreeNamespaceClassesTestCase, self).tearDown()
+
+    def test_registry(self):
+        # item assignment and clear() on a namespace registry
+        registry = self.Namespace('ns01')
+        registry['maeh'] = self.maeh_class
+        self.Namespace('ns01').clear()
+        # update() is fed a dict as well as an iterable of (name, class) items
+        self.Namespace('ns02').update({'maeh': self.maeh_class})
+        self.Namespace('ns03').update({'bluff': self.bluff_class}.items())
+        self.Namespace('ns02').clear()
+        self.Namespace('ns03').clear()
+
+    def test_ns_classes(self):
+        xml = _bytes('<bluff xmlns="ns10"><ns11:maeh xmlns:ns11="ns11"/></bluff>')
+
+        # step 1: only 'ns10' has a class registered
+        self.Namespace('ns10').update({'bluff': self.bluff_class})
+        tree = self.parse(xml)
+        root = tree.getroot()
+        self.assertTrue(isinstance(root, etree.ElementBase))
+        self.assertTrue(hasattr(root, 'bluff'))
+        self.assertFalse(hasattr(root[0], 'maeh'))
+        self.assertFalse(hasattr(root[0], 'bluff'))
+        self.assertEqual(root.bluff(), 'bluff')
+        del root
+
+        # step 2: a class registered for 'ns11' afterwards shows up in the same tree
+        self.Namespace('ns11').update({'maeh': self.maeh_class})
+        root = tree.getroot()
+        self.assertTrue(hasattr(root, 'bluff'))
+        self.assertTrue(hasattr(root[0], 'maeh'))
+        self.assertEqual(root.bluff(), 'bluff')
+        self.assertEqual(root[0].maeh(), 'maeh')
+        del root
+
+        # step 3: with 'ns10' cleared, a fresh parse only uses the 'ns11' class
+        self.Namespace('ns10').clear()
+        tree = self.parse(xml)
+        root = tree.getroot()
+        self.assertFalse(hasattr(root, 'bluff'))
+        self.assertFalse(hasattr(root, 'maeh'))
+        self.assertFalse(hasattr(root[0], 'bluff'))
+        self.assertTrue(hasattr(root[0], 'maeh'))
+
+        self.Namespace('ns11').clear()
+
+    def test_default_tagname(self):
+        # the None key registers the class for tags without an entry of their
+        # own; 'maeh' gets its own class
+        registry = self.Namespace("uri:nsDefClass")
+        registry.update({None: self.bluff_class, 'maeh': self.maeh_class})
+
+        tree = self.parse(_bytes('''
+            <test xmlns="bla" xmlns:ns1="uri:nsDefClass" xmlns:ns2="uri:nsDefClass">
+              <ns2:el1/><ns1:el2/><ns1:maeh/><ns2:maeh/><maeh/>
+            </test>
+            '''))
+
+        root = tree.getroot()
+        # only the children in "uri:nsDefClass" (all but the last) are ElementBase
+        self.assertFalse(isinstance(root, etree.ElementBase))
+        for child in root[:-1]:
+            self.assertTrue(isinstance(child, etree.ElementBase), child.tag)
+        self.assertFalse(isinstance(root[-1], etree.ElementBase))
+
+        # el1/el2 get the default class, both prefixed maeh tags the 'maeh' class
+        self.assertTrue(hasattr(root[0], 'bluff'))
+        self.assertTrue(hasattr(root[1], 'bluff'))
+        self.assertTrue(hasattr(root[2], 'maeh'))
+        self.assertTrue(hasattr(root[3], 'maeh'))
+        self.assertFalse(hasattr(root[4], 'maeh'))
+        del root
+
+        registry.clear()
+
+    def test_create_element(self):
+        # registered classes must also apply to Element() and SubElement()
+        self.Namespace('ns20').update({'bluff': self.bluff_class})
+        self.Namespace('ns21').update({'maeh': self.maeh_class})
+
+        root = etree.Element("{ns20}bluff")
+        self.assertTrue(hasattr(root, 'bluff'))
+
+        sub = etree.SubElement(root, "{ns21}maeh")
+        self.assertTrue(hasattr(sub, 'maeh'))
+        sub = etree.SubElement(root, "{ns20}bluff")
+        self.assertTrue(hasattr(sub, 'bluff'))
+        # 'bluff' is only registered in 'ns20', so '{ns21}bluff' gets neither class
+        sub = etree.SubElement(root, "{ns21}bluff")
+        self.assertFalse(hasattr(sub, 'bluff'))
+        self.assertFalse(hasattr(sub, 'maeh'))
+
+        # the same must hold when the children are fetched by index
+        self.assertTrue(hasattr(root[0], 'maeh'))
+        self.assertTrue(hasattr(root[1], 'bluff'))
+        self.assertFalse(hasattr(root[2], 'bluff'))
+        self.assertFalse(hasattr(root[2], 'maeh'))
+
+        self.assertEqual(root.bluff(), 'bluff')
+        self.assertEqual(root[0].maeh(), 'maeh')
+        self.assertEqual(root[1].bluff(), 'bluff')
+
+        self.Namespace('ns20').clear()
+        self.Namespace('ns21').clear()
+
+    def test_create_element_default(self):
+        # None as tag name: class for any tag in namespace 'ns30'
+        self.Namespace('ns30').update({None: self.bluff_class})
+
+        # None as namespace: registry used for the un-namespaced 'maeh' tag
+        self.Namespace(None).update({'maeh': self.maeh_class})
+
+        root = etree.Element("{ns30}bluff")
+        etree.SubElement(root, "maeh")
+        self.assertTrue(hasattr(root, 'bluff'))
+        self.assertTrue(hasattr(root[0], 'maeh'))
+        self.assertEqual(root.bluff(), 'bluff')
+        self.assertEqual(root[0].maeh(), 'maeh')
+
+        self.Namespace(None).clear()
+        self.Namespace('ns30').clear()
+
+    def test_element_creation(self):
+        # ElementBase subclasses called E-factory style: strings become text
+        # or tail, classes and instances become children
+        default, bluff, maeh = self.default_class, self.bluff_class, self.maeh_class
+
+        class honk(etree.ElementBase):
+            # TAG/NAMESPACE determine the tag instead of the class name
+            TAG = 'HONK'
+            NAMESPACE = 'http://a.b/c'
+
+        root = default(
+            "test", "text",
+            bluff(honk, "TaIL", maeh),
+            maeh("TeXT", bluff, honk(), "TAiL"),
+            "Tail")
+
+        self.assertEqual('default_class', root.tag)
+        self.assertEqual('testtext', root.text)
+        self.assertEqual(None, root.tail)
+        self.assertEqual(2, len(root))
+        self.assertEqual(7, len(list(root.iter())))
+
+        # first child: bluff(honk, "TaIL", maeh)
+        self.assertEqual('bluff_class', root[0].tag)
+        self.assertEqual('TaIL', root[0][0].tail)
+        self.assertEqual('TaIL', ''.join(root[0].itertext()))
+        self.assertEqual('{http://a.b/c}HONK', root[0][0].tag)
+        self.assertEqual('maeh_class', root[0][1].tag)
+
+        # second child: maeh("TeXT", bluff, honk(), "TAiL")
+        self.assertEqual('maeh_class', root[1].tag)
+        self.assertEqual('TeXT', root[1].text)
+        self.assertEqual('bluff_class', root[1][0].tag)
+        self.assertEqual('{http://a.b/c}HONK', root[1][1].tag)
+        self.assertEqual('TAiL', root[1][1].tail)
+
+        self.assertEqual('TeXTTAiL', ''.join(root[1].itertext()))
+        self.assertEqual('Tail', root[1].tail)
+        self.assertEqual('TAiL', root[1][1].tail)
+        self.assertEqual('bluff_class', root[1][0].tag)
+        self.assertEqual('{http://a.b/c}HONK', root[1][1].tag)
+        
+
+def test_suite():  # test case + doctests of doc/element_classes.txt
+    # unittest.makeSuite() was removed in Python 3.13; ask the loader directly
+    load = unittest.defaultTestLoader.loadTestsFromTestCase
+    tests = load(ETreeNamespaceClassesTestCase)
+    doctests = make_doctest('../../../doc/element_classes.txt')
+    return unittest.TestSuite([tests, doctests])
+
+if __name__ == '__main__':  # running the module directly only prints a usage hint
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_objectify.py b/lib/lxml/tests/test_objectify.py
new file mode 100644
index 00000000..b17e38c2
--- /dev/null
+++ b/lib/lxml/tests/test_objectify.py
@@ -0,0 +1,2586 @@
+# -*- coding: utf-8 -*-
+
+"""
+Tests specific to the lxml.objectify API
+"""
+
+
+import unittest, operator, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, HelperTestCase, fileInTestDir
+from common_imports import SillyFileLike, canonicalize, doctest, make_doctest
+from common_imports import _bytes, _str, StringIO, BytesIO
+
+from lxml import objectify
+
+PYTYPE_NAMESPACE = "http://codespeak.net/lxml/objectify/pytype"
+XML_SCHEMA_NS = "http://www.w3.org/2001/XMLSchema"
+XML_SCHEMA_INSTANCE_NS = "http://www.w3.org/2001/XMLSchema-instance"
+XML_SCHEMA_INSTANCE_TYPE_ATTR = "{%s}type" % XML_SCHEMA_INSTANCE_NS
+XML_SCHEMA_NIL_ATTR = "{%s}nil" % XML_SCHEMA_INSTANCE_NS
+TREE_PYTYPE = "TREE"
+DEFAULT_NSMAP = { "py"  : PYTYPE_NAMESPACE,
+                  "xsi" : XML_SCHEMA_INSTANCE_NS,
+                  "xsd" : XML_SCHEMA_NS}
+# element class -> tuple of XML Schema type names (inverted just below)
+objectclass2xsitype = {
+    # objectify built-in
+    objectify.IntElement: ("int", "short", "byte", "unsignedShort",
+                           "unsignedByte", "integer", "nonPositiveInteger",
+                           "negativeInteger", "long", "nonNegativeInteger",
+                           "unsignedLong", "unsignedInt", "positiveInteger",),
+    objectify.FloatElement: ("float", "double"),
+    objectify.BoolElement: ("boolean",),
+    objectify.StringElement: ("string", "normalizedString", "token", "language",
+                              "Name", "NCName", "ID", "IDREF", "ENTITY",
+                              "NMTOKEN", ),
+    # None: xsi:nil="true"
+    }
+# inverse of the table above: XML Schema type name -> element class
+xsitype2objclass = dict([ (v, k) for k in objectclass2xsitype
+                          for v in objectclass2xsitype[k] ])
+# element class -> pytype name (inverted just below)
+objectclass2pytype = {
+    # objectify built-in
+    objectify.IntElement: "int",
+    objectify.FloatElement: "float",
+    objectify.BoolElement: "bool",
+    objectify.StringElement: "str",
+    # None: xsi:nil="true"
+    }
+# inverse of the table above: pytype name -> element class
+pytype2objclass = dict([ (objectclass2pytype[k], k)
+                         for k in objectclass2pytype])
+# shared fixture: c1 holds five c2 children (three obj:, one other:, one without namespace)
+xml_str = '''\
+<obj:root xmlns:obj="objectified" xmlns:other="otherNS">
+  <obj:c1 a1="A1" a2="A2" other:a3="A3">
+    <obj:c2>0</obj:c2>
+    <obj:c2>1</obj:c2>
+    <obj:c2>2</obj:c2>
+    <other:c2>3</other:c2>
+    <c2>4</c2>
+  </obj:c1>
+</obj:root>'''
+
+class ObjectifyTestCase(HelperTestCase):
+    """Test cases for lxml.objectify
+    """
+    etree = etree
+    
+    def XML(self, xml):  # parse xml with the parser configured in setUp()
+        return self.etree.XML(xml, self.parser)
+
+    def setUp(self):
+        super(ObjectifyTestCase, self).setUp()
+        # namespace class lookup wrapped around the objectify lookup
+        objectify_lookup = objectify.ObjectifyElementClassLookup()
+        self.lookup = etree.ElementNamespaceClassLookup(objectify_lookup)
+        self.parser = self.etree.XMLParser(remove_blank_text=True)
+        self.parser.set_element_class_lookup(self.lookup)
+        self.Element = self.parser.makeelement
+        # register plain ElementBase under the None key of "otherNS"
+        self.lookup.get_namespace("otherNS")[None] = self.etree.ElementBase
+
+        # remembered so tearDown() can re-register these types
+        self._orig_types = objectify.getRegisteredTypes()
+
+    def tearDown(self):
+        # empty the "otherNS" registry filled in setUp()
+        self.lookup.get_namespace("otherNS").clear()
+        objectify.set_pytype_attribute_tag()
+        del self.lookup, self.parser
+        # unregister whatever is registered now, then re-register the saved types
+        for current in objectify.getRegisteredTypes():
+            current.unregister()
+        for original in self._orig_types:
+            original.register()
+        del self._orig_types
+
+        super(ObjectifyTestCase, self).tearDown()
+
+
+    def test_element_nsmap_default(self):
+        # an Element created without nsmap carries DEFAULT_NSMAP
+        self.assertEqual(objectify.Element("test").nsmap, DEFAULT_NSMAP)
+
+    def test_element_nsmap_empty(self):
+        # with an empty nsmap, only the pytype namespace ends up mapped
+        element = objectify.Element("test", nsmap={})
+        self.assertEqual(list(element.nsmap.values()), [PYTYPE_NAMESPACE])
+
+    def test_element_nsmap_custom_prefixes(self):
+        # custom prefixes for the three default namespaces are kept as given
+        prefixes = dict(mypy=PYTYPE_NAMESPACE,
+                        myxsi=XML_SCHEMA_INSTANCE_NS, myxsd=XML_SCHEMA_NS)
+        element = objectify.Element("test", nsmap=prefixes)
+        self.assertEqual(element.nsmap, prefixes)
+        
+    def test_element_nsmap_custom(self):
+        # user-supplied prefixes are kept and the pytype namespace is mapped too
+        custom = dict(my="someNS", myother="someOtherNS",
+                      myxsd=XML_SCHEMA_NS)
+        element = objectify.Element("test", nsmap=custom)
+        self.assertTrue(PYTYPE_NAMESPACE in element.nsmap.values())
+        for prefix, uri in custom.items():
+            self.assertTrue(prefix in element.nsmap)
+            self.assertEqual(uri, element.nsmap[prefix])
+        
+    def test_sub_element_nsmap_default(self):  # attached child shows DEFAULT_NSMAP
+        parent = objectify.Element("root")
+        parent.sub = objectify.Element("test")
+        self.assertEqual(parent.sub.nsmap, DEFAULT_NSMAP)
+
+    def test_sub_element_nsmap_empty(self):
+        # once attached to a default root, the child reports DEFAULT_NSMAP
+        parent = objectify.Element("root")
+        parent.sub = objectify.Element("test", nsmap={})
+        self.assertEqual(parent.sub.nsmap, DEFAULT_NSMAP)
+
+    def test_sub_element_nsmap_custom_prefixes(self):
+        # the child's own prefixes are not reported once it sits under the root
+        parent = objectify.Element("root")
+        prefixes = dict(mypy=PYTYPE_NAMESPACE,
+                        myxsi=XML_SCHEMA_INSTANCE_NS, myxsd=XML_SCHEMA_NS)
+        parent.sub = objectify.Element("test", nsmap=prefixes)
+        self.assertEqual(parent.sub.nsmap, DEFAULT_NSMAP)
+        
+    def test_sub_element_nsmap_custom(self):
+        # expected: the custom prefixes plus DEFAULT_NSMAP, minus "myxsd"
+        # (presumably dropped because its namespace already has prefix "xsd")
+        parent = objectify.Element("root")
+        custom = dict(my="someNS", myother="someOtherNS", myxsd=XML_SCHEMA_NS)
+        parent.sub = objectify.Element("test", nsmap=custom)
+        expected = dict(custom)
+        expected.pop("myxsd")
+        expected.update(DEFAULT_NSMAP)
+        self.assertEqual(parent.sub.nsmap, expected)
+        
+    def test_data_element_nsmap_default(self):
+        # a DataElement created without nsmap carries DEFAULT_NSMAP
+        self.assertEqual(objectify.DataElement("test this").nsmap, DEFAULT_NSMAP)
+
+    def test_data_element_nsmap_empty(self):
+        # with an empty nsmap, only the pytype namespace ends up mapped
+        data = objectify.DataElement("test this", nsmap={})
+        self.assertEqual(list(data.nsmap.values()), [PYTYPE_NAMESPACE])
+
+    def test_data_element_nsmap_custom_prefixes(self):
+        # custom prefixes for the three default namespaces are kept as given
+        prefixes = dict(mypy=PYTYPE_NAMESPACE,
+                        myxsi=XML_SCHEMA_INSTANCE_NS, myxsd=XML_SCHEMA_NS)
+        data = objectify.DataElement("test this", nsmap=prefixes)
+        self.assertEqual(data.nsmap, prefixes)
+        
+    def test_data_element_nsmap_custom(self):
+        # user-supplied prefixes are kept and the pytype namespace is mapped too
+        custom = dict(my="someNS", myother="someOtherNS",
+                      myxsd=XML_SCHEMA_NS)
+        data = objectify.DataElement("test", nsmap=custom)
+        self.assertTrue(PYTYPE_NAMESPACE in data.nsmap.values())
+        for prefix, uri in custom.items():
+            self.assertTrue(prefix in data.nsmap)
+            self.assertEqual(uri, data.nsmap[prefix])
+        
+    def test_sub_data_element_nsmap_default(self):  # attached value shows DEFAULT_NSMAP
+        parent = objectify.Element("root")
+        parent.value = objectify.DataElement("test this")
+        self.assertEqual(parent.value.nsmap, DEFAULT_NSMAP)
+
+    def test_sub_data_element_nsmap_empty(self):
+        # once attached to a default root, the value reports DEFAULT_NSMAP
+        parent = objectify.Element("root")
+        parent.value = objectify.DataElement("test this", nsmap={})
+        self.assertEqual(parent.value.nsmap, DEFAULT_NSMAP)
+
+    def test_sub_data_element_nsmap_custom_prefixes(self):
+        # the value's own prefixes are not reported once it sits under the root
+        parent = objectify.Element("root")
+        prefixes = dict(mypy=PYTYPE_NAMESPACE,
+                        myxsi=XML_SCHEMA_INSTANCE_NS, myxsd=XML_SCHEMA_NS)
+        parent.value = objectify.DataElement("test this", nsmap=prefixes)
+        self.assertEqual(parent.value.nsmap, DEFAULT_NSMAP)
+        
+    def test_sub_data_element_nsmap_custom(self):
+        # expected: the custom prefixes plus DEFAULT_NSMAP, minus "myxsd"
+        # (presumably dropped because its namespace already has prefix "xsd")
+        parent = objectify.Element("root")
+        custom = dict(my="someNS", myother="someOtherNS", myxsd=XML_SCHEMA_NS)
+        parent.value = objectify.DataElement("test", nsmap=custom)
+        expected = dict(custom)
+        expected.pop("myxsd")
+        expected.update(DEFAULT_NSMAP)
+        self.assertEqual(parent.value.nsmap, expected)
+
+    def test_date_element_efactory_text(self):
+        # E-factory style call: the string arguments are joined into .text
+        element = objectify.ObjectifiedDataElement('test', 'toast')
+        self.assertEqual(element.text, 'testtoast')
+
+    def test_date_element_efactory_tail(self):  # strings after a child -> its tail
+        child = objectify.ObjectifiedDataElement()
+        parent = objectify.ObjectifiedElement(child, 'test', 'toast')
+        self.assertEqual(parent.ObjectifiedDataElement.tail, 'testtoast')
+
+    def test_data_element_attrib_attributes_precedence(self):
+        # "dog" is given both in attrib and as keyword; the keyword must win
+        attrib = {"gnu": "muh", "cat": "meeow", "dog": "wuff"}
+        value = objectify.DataElement(
+            23, _pytype="str", _xsi="foobar", attrib=attrib,
+            bird="tchilp", dog="grrr")
+        expected = [("gnu", "muh"), ("cat", "meeow"),
+                    ("dog", "grrr"), ("bird", "tchilp")]
+        for name, text in expected:
+            self.assertEqual(value.get(name), text)
+        
+    def test_data_element_data_element_arg(self):
+        # Wrapping an existing data element in DataElement() must yield a
+        # StringElement that carries every attribute of the source.
+        source = objectify.DataElement(
+            23, _pytype="str", _xsi="foobar",
+            attrib={"gnu": "muh", "cat": "meeow", "dog": "wuff"},
+            bird="tchilp", dog="grrr")
+        value = objectify.DataElement(source)
+        self.assertTrue(isinstance(value, objectify.StringElement))
+        for name in source.attrib:
+            self.assertEqual(value.get(name), source.get(name))
+
+    def test_data_element_data_element_arg_pytype_none(self):
+        # _pytype="NoneType" must turn the result into a nil NoneElement ...
+        source = objectify.DataElement(
+            23, _pytype="str", _xsi="foobar",
+            attrib={"gnu": "muh", "cat": "meeow", "dog": "wuff"},
+            bird="tchilp", dog="grrr")
+        value = objectify.DataElement(source, _pytype="NoneType")
+        self.assertTrue(isinstance(value, objectify.NoneElement))
+        self.assertEqual(value.get(XML_SCHEMA_NIL_ATTR), "true")
+        self.assertEqual(value.text, None)
+        self.assertEqual(value.pyval, None)
+        # ... while every attribute of the source is compared unchanged
+        # (the pytype attribute is not skipped in this test)
+        for name in source.attrib:
+            self.assertEqual(value.get(name), source.get(name))
+
+    def test_data_element_data_element_arg_pytype(self):
+        # An explicit _pytype must replace the pytype attribute of the wrapped
+        # data element; all of its other attributes are carried over.
+        source = objectify.DataElement(
+            23, _pytype="str", _xsi="foobar",
+            attrib={"gnu": "muh", "cat": "meeow", "dog": "wuff"},
+            bird="tchilp", dog="grrr")
+        value = objectify.DataElement(source, _pytype="int")
+        self.assertTrue(isinstance(value, objectify.IntElement))
+        self.assertEqual(value.get(objectify.PYTYPE_ATTRIBUTE), "int")
+        for name in source.attrib:
+            if name != objectify.PYTYPE_ATTRIBUTE:
+                self.assertEqual(value.get(name), source.get(name))
+
+    def test_data_element_data_element_arg_xsitype(self):
+        # An explicit _xsi must replace the xsi:type of the wrapped data
+        # element (the pytype follows it); other attributes are carried over.
+        source = objectify.DataElement(
+            23, _pytype="str", _xsi="foobar",
+            attrib={"gnu": "muh", "cat": "meeow", "dog": "wuff"},
+            bird="tchilp", dog="grrr")
+        value = objectify.DataElement(source, _xsi="xsd:int")
+        self.assertTrue(isinstance(value, objectify.IntElement))
+        self.assertEqual(value.get(XML_SCHEMA_INSTANCE_TYPE_ATTR), "xsd:int")
+        self.assertEqual(value.get(objectify.PYTYPE_ATTRIBUTE), "int")
+        overridden = (objectify.PYTYPE_ATTRIBUTE, XML_SCHEMA_INSTANCE_TYPE_ATTR)
+        for name in source.attrib:
+            if name not in overridden:
+                self.assertEqual(value.get(name), source.get(name))
+
+    def test_data_element_data_element_arg_pytype_xsitype(self):
+        # Explicit _pytype and _xsi must both replace the corresponding
+        # attributes of the wrapped data element; the rest is carried over.
+        source = objectify.DataElement(
+            23, _pytype="str", _xsi="foobar",
+            attrib={"gnu": "muh", "cat": "meeow", "dog": "wuff"},
+            bird="tchilp", dog="grrr")
+        value = objectify.DataElement(source, _pytype="int", _xsi="xsd:int")
+        self.assertTrue(isinstance(value, objectify.IntElement))
+        self.assertEqual(value.get(objectify.PYTYPE_ATTRIBUTE), "int")
+        self.assertEqual(value.get(XML_SCHEMA_INSTANCE_TYPE_ATTR), "xsd:int")
+        overridden = (objectify.PYTYPE_ATTRIBUTE, XML_SCHEMA_INSTANCE_TYPE_ATTR)
+        for name in source.attrib:
+            if name not in overridden:
+                self.assertEqual(value.get(name), source.get(name))
+
+    def test_data_element_invalid_pytype(self):
+        # the float 3.1415 declared as pytype "int" must raise ValueError
+        self.assertRaises(ValueError, objectify.DataElement, 3.1415, _pytype="int")
+
+    def test_data_element_invalid_xsi(self):
+        # the float 3.1415 declared as xsi:type "xsd:int" must raise ValueError
+        self.assertRaises(ValueError, objectify.DataElement, 3.1415, _xsi="xsd:int")
+        
+    def test_data_element_data_element_arg_invalid_pytype(self):
+        # same check with the float wrapped in a data element first
+        source = objectify.DataElement(3.1415)
+        self.assertRaises(ValueError, objectify.DataElement, source, _pytype="int")
+
+    def test_data_element_data_element_arg_invalid_xsi(self):
+        # same check with the float wrapped in a data element first
+        source = objectify.DataElement(3.1415)
+        self.assertRaises(ValueError, objectify.DataElement, source, _xsi="xsd:int")
+
+    def test_data_element_element_arg(self):  # a tree element may be wrapped too
+        source = objectify.Element('arg')
+        value = objectify.DataElement(source)
+        self.assertTrue(isinstance(value, objectify.ObjectifiedElement))
+        for name in source.attrib:
+            self.assertEqual(value.get(name), source.get(name))
+        
+    def test_root(self):
+        root = self.Element("test")
+        self.assertTrue(isinstance(root, objectify.ObjectifiedElement))
+
+    def test_str(self):
+        root = self.Element("test")
+        self.assertEqual('', str(root))
+
+    def test_child(self):
+        root = self.XML(xml_str)
+        self.assertEqual("0", root.c1.c2.text)
+
+    def test_child_ns_nons(self):
+        root = self.XML("""
+            <root>
+                <foo:x xmlns:foo="/foo/bar">1</foo:x>
+                <x>2</x>
+            </root>
+        """)
+        self.assertEqual(2, root.x)
+
+    def test_countchildren(self):
+        root = self.XML(xml_str)
+        self.assertEqual(1, root.countchildren())
+        self.assertEqual(5, root.c1.countchildren())
+
+    def test_child_getattr(self):
+        root = self.XML(xml_str)
+        self.assertEqual("0", getattr(root.c1, "{objectified}c2").text)
+        self.assertEqual("3", getattr(root.c1, "{otherNS}c2").text)
+
+    def test_child_nonexistant(self):
+        root = self.XML(xml_str)
+        self.assertRaises(AttributeError, getattr, root.c1, "NOT_THERE")
+        self.assertRaises(AttributeError, getattr, root.c1, "{unknownNS}c2")
+
+    def test_child_getattr_empty_ns(self):
+        root = self.XML(xml_str)
+        self.assertEqual("4", getattr(root.c1, "{}c2").text)
+        self.assertEqual("0", getattr(root.c1, "c2").text)
+
+    def test_setattr(self):
+        for val in [
+            2, 2**32, 1.2, "Won't get fooled again", 
+            _str("W\xf6n't get f\xf6\xf6led \xe4g\xe4in", 'ISO-8859-1'), True,
+            False, None]: 
+            root = self.Element('root')
+            attrname = 'val'
+            setattr(root, attrname, val)
+            result = getattr(root, attrname)
+            self.assertEqual(val, result)
+            self.assertEqual(type(val), type(result.pyval))
+ 
+    def test_setattr_nonunicode(self):
+        root = self.Element('root')
+        attrname = 'val'
+        val = _bytes("W\xf6n't get f\xf6\xf6led \xe4g\xe4in", 'ISO-8859-1')
+        self.assertRaises(ValueError, setattr, root, attrname, val)
+        self.assertRaises(AttributeError, getattr, root, attrname) 
+ 
+    def test_addattr(self):
+        root = self.XML(xml_str)
+        self.assertEqual(1, len(root.c1))
+        root.addattr("c1", "test")
+        self.assertEqual(2, len(root.c1))
+        self.assertEqual("test", root.c1[1].text)
+
+    def test_addattr_element(self):
+        root = self.XML(xml_str)
+        self.assertEqual(1, len(root.c1))
+
+        new_el = self.Element("test", myattr="5")
+        root.addattr("c1", new_el)
+        self.assertEqual(2, len(root.c1))
+        self.assertEqual(None, root.c1[0].get("myattr"))
+        self.assertEqual("5",  root.c1[1].get("myattr"))
+
+    def test_addattr_list(self):
+        root = self.XML(xml_str)
+        self.assertEqual(1, len(root.c1))
+
+        new_el = self.Element("test")
+        self.etree.SubElement(new_el, "a", myattr="A")
+        self.etree.SubElement(new_el, "a", myattr="B")
+
+        root.addattr("c1", list(new_el.a))
+        self.assertEqual(3, len(root.c1))
+        self.assertEqual(None, root.c1[0].get("myattr"))
+        self.assertEqual("A",  root.c1[1].get("myattr"))
+        self.assertEqual("B",  root.c1[2].get("myattr"))
+
+    def test_child_addattr(self):
+        root = self.XML(xml_str)
+        self.assertEqual(3, len(root.c1.c2))
+        root.c1.addattr("c2", 3)
+        self.assertEqual(4, len(root.c1.c2))
+        self.assertEqual("3", root.c1.c2[3].text)
+
+    def test_child_index(self):
+        root = self.XML(xml_str)
+        self.assertEqual("0", root.c1.c2[0].text)
+        self.assertEqual("1", root.c1.c2[1].text)
+        self.assertEqual("2", root.c1.c2[2].text)
+        self.assertRaises(IndexError, operator.getitem, root.c1.c2, 3)
+
+    def test_child_index_neg(self):
+        root = self.XML(xml_str)
+        self.assertEqual("0", root.c1.c2[0].text)
+        self.assertEqual("0", root.c1.c2[-3].text)
+        self.assertEqual("1", root.c1.c2[-2].text)
+        self.assertEqual("2", root.c1.c2[-1].text)
+        self.assertRaises(IndexError, operator.getitem, root.c1.c2, -4)
+
+    def test_child_len(self):
+        root = self.XML(xml_str)
+        self.assertEqual(1, len(root))
+        self.assertEqual(1, len(root.c1))
+        self.assertEqual(3, len(root.c1.c2))
+
+    def test_child_iter(self):
+        root = self.XML(xml_str)
+        self.assertEqual([root],
+                          list(iter(root)))
+        self.assertEqual([root.c1],
+                          list(iter(root.c1)))
+        self.assertEqual([root.c1.c2[0], root.c1.c2[1], root.c1.c2[2]],
+                          list(iter((root.c1.c2))))
+
+    def test_class_lookup(self):
+        root = self.XML(xml_str)
+        self.assertTrue(isinstance(root.c1.c2, objectify.ObjectifiedElement))
+        self.assertFalse(isinstance(getattr(root.c1, "{otherNS}c2"),
+                                    objectify.ObjectifiedElement))
+
+    def test_dir(self):
+        root = self.XML(xml_str)
+        dir_c1 = dir(objectify.ObjectifiedElement) + ['c1']
+        dir_c1.sort()
+        dir_c2 = dir(objectify.ObjectifiedElement) + ['c2']
+        dir_c2.sort()
+
+        self.assertEqual(dir_c1, dir(root))
+        self.assertEqual(dir_c2, dir(root.c1))
+
+    def test_vars(self):
+        root = self.XML(xml_str)
+        self.assertEqual({'c1' : root.c1},    vars(root))
+        self.assertEqual({'c2' : root.c1.c2}, vars(root.c1))
+
+    def test_child_set_ro(self):
+        root = self.XML(xml_str)
+        self.assertRaises(TypeError, setattr, root.c1.c2, 'text',  "test")
+        self.assertRaises(TypeError, setattr, root.c1.c2, 'pyval', "test")
+
+    # slicing
+
+    def test_getslice_complete(self):
+        root = self.XML("<root><c>c1</c><c>c2</c></root>")
+        self.assertEqual(["c1", "c2"],
+                          [ c.text for c in root.c[:] ])
+
+    def test_getslice_partial(self):
+        root = self.XML("<root><c>c1</c><c>c2</c><c>c3</c><c>c4</c></root>")
+        test_list = ["c1", "c2", "c3", "c4"]
+
+        self.assertEqual(test_list,
+                          [ c.text for c in root.c[:] ])
+        self.assertEqual(test_list[1:2],
+                          [ c.text for c in root.c[1:2] ])
+        self.assertEqual(test_list[-3:-1],
+                          [ c.text for c in root.c[-3:-1] ])
+        self.assertEqual(test_list[-3:3],
+                          [ c.text for c in root.c[-3:3] ])
+        self.assertEqual(test_list[-3000:3],
+                          [ c.text for c in root.c[-3000:3] ])
+        self.assertEqual(test_list[-3:3000],
+                          [ c.text for c in root.c[-3:3000] ])
+
+    def test_getslice_partial_neg(self):
+        root = self.XML("<root><c>c1</c><c>c2</c><c>c3</c><c>c4</c></root>")
+        test_list = ["c1", "c2", "c3", "c4"]
+
+        self.assertEqual(test_list,
+                          [ c.text for c in root.c[:] ])
+        self.assertEqual(test_list[2:1:-1],
+                          [ c.text for c in root.c[2:1:-1] ])
+        self.assertEqual(test_list[-1:-3:-1],
+                          [ c.text for c in root.c[-1:-3:-1] ])
+        self.assertEqual(test_list[2:-3:-1],
+                          [ c.text for c in root.c[2:-3:-1] ])
+        self.assertEqual(test_list[2:-3000:-1],
+                          [ c.text for c in root.c[2:-3000:-1] ])
+
+    # slice assignment
+
+    def test_setslice_complete(self):
+        Element = self.Element
+        root = Element("root")
+        root.c = ["c1", "c2"]
+
+        c1 = root.c[0]
+        c2 = root.c[1]
+
+        self.assertEqual([c1,c2], list(root.c))
+        self.assertEqual(["c1", "c2"],
+                          [ c.text for c in root.c ])
+
+    def test_setslice_elements(self):
+        Element = self.Element
+        root = Element("root")
+        root.c = ["c1", "c2"]
+
+        c1 = root.c[0]
+        c2 = root.c[1]
+
+        self.assertEqual([c1,c2], list(root.c))
+        self.assertEqual(["c1", "c2"],
+                          [ c.text for c in root.c ])
+
+        root2 = Element("root2")
+        root2.el = [ "test", "test" ]
+        self.assertEqual(["test", "test"],
+                          [ el.text for el in root2.el ])
+
+        root.c = [ root2.el, root2.el ]
+        self.assertEqual(["test", "test"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(["test", "test"],
+                          [ el.text for el in root2.el ])
+
+        root.c[:] = [ c1, c2, c2, c1 ]
+        self.assertEqual(["c1", "c2", "c2", "c1"],
+                          [ c.text for c in root.c ])
+
+    def test_setslice_partial(self):
+        Element = self.Element
+        root = Element("root")
+        l = ["c1", "c2", "c3", "c4"]
+        root.c = l
+
+        self.assertEqual(["c1", "c2", "c3", "c4"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+        new_slice = ["cA", "cB"]
+        l[1:2] = new_slice
+        root.c[1:2] = new_slice
+
+        self.assertEqual(["c1", "cA", "cB", "c3", "c4"], l)
+        self.assertEqual(["c1", "cA", "cB", "c3", "c4"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+    def test_setslice_insert(self):
+        Element = self.Element
+        root = Element("root")
+        l = ["c1", "c2", "c3", "c4"]
+        root.c = l
+
+        self.assertEqual(["c1", "c2", "c3", "c4"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+        new_slice = ["cA", "cB"]
+        l[1:1] = new_slice
+        root.c[1:1] = new_slice
+
+        self.assertEqual(["c1", "cA", "cB", "c2", "c3", "c4"], l)
+        self.assertEqual(["c1", "cA", "cB", "c2", "c3", "c4"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+    def test_setslice_insert_neg(self):
+        Element = self.Element
+        root = Element("root")
+        l = ["c1", "c2", "c3", "c4"]
+        root.c = l
+
+        self.assertEqual(["c1", "c2", "c3", "c4"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+        new_slice = ["cA", "cB"]
+        l[-2:-2] = new_slice
+        root.c[-2:-2] = new_slice
+
+        self.assertEqual(["c1", "c2", "cA", "cB", "c3", "c4"], l)
+        self.assertEqual(["c1", "c2", "cA", "cB", "c3", "c4"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+    def test_setslice_empty(self):
+        Element = self.Element
+        root = Element("root")
+
+        root.c = []
+        self.assertRaises(
+            AttributeError, getattr, root, 'c')
+
+    def test_setslice_partial_wrong_length(self):
+        Element = self.Element
+        root = Element("root")
+        l = ["c1", "c2", "c3", "c4"]
+        root.c = l
+
+        self.assertEqual(["c1", "c2", "c3", "c4"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+        new_slice = ["cA", "cB", "cC"]
+        self.assertRaises(
+            ValueError, operator.setitem,
+            l, slice(1,2,-1), new_slice)
+        self.assertRaises(
+            ValueError, operator.setitem,
+            root.c, slice(1,2,-1), new_slice)
+
+    def test_setslice_partial_neg(self):
+        Element = self.Element
+        root = Element("root")
+        l = ["c1", "c2", "c3", "c4"]
+        root.c = l
+
+        self.assertEqual(["c1", "c2", "c3", "c4"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+        new_slice = ["cA", "cB"]
+        l[-1:1:-1] = new_slice
+        root.c[-1:1:-1] = new_slice
+
+        self.assertEqual(["c1", "c2", "cB", "cA"], l)
+        self.assertEqual(["c1", "c2", "cB", "cA"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+    def test_setslice_partial_allneg(self):
+        Element = self.Element
+        root = Element("root")
+        l = ["c1", "c2", "c3", "c4"]
+        root.c = l
+
+        self.assertEqual(["c1", "c2", "c3", "c4"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+        new_slice = ["cA", "cB"]
+        l[-1:-4:-2] = new_slice
+        root.c[-1:-4:-2] = new_slice
+
+        self.assertEqual(["c1", "cB", "c3", "cA"], l)
+        self.assertEqual(["c1", "cB", "c3", "cA"],
+                          [ c.text for c in root.c ])
+        self.assertEqual(l,
+                          [ c.text for c in root.c ])
+
+    # other stuff
+
+    def test_set_string(self):
+        # make sure strings are not handled as sequences
+        Element = self.Element
+        root = Element("root")
+        root.c = "TEST"
+        self.assertEqual(["TEST"],
+                          [ c.text for c in root.c ])
+
+    def test_setitem_string(self):
+        # make sure strings are set as children
+        Element = self.Element
+        root = Element("root")
+        root["c"] = "TEST"
+        self.assertEqual(["TEST"],
+                          [ c.text for c in root.c ])
+
+    def test_setitem_string_special(self):
+        # make sure 'text' etc. are set as children
+        Element = self.Element
+        root = Element("root")
+
+        root["text"] = "TEST"
+        self.assertEqual(["TEST"],
+                          [ c.text for c in root["text"] ])
+
+        root["tail"] = "TEST"
+        self.assertEqual(["TEST"],
+                          [ c.text for c in root["tail"] ])
+
+        root["pyval"] = "TEST"
+        self.assertEqual(["TEST"],
+                          [ c.text for c in root["pyval"] ])
+
+        root["tag"] = "TEST"
+        self.assertEqual(["TEST"],
+                          [ c.text for c in root["tag"] ])
+
+    def test_findall(self):
+        XML = self.XML
+        root = XML('<a><b><c/></b><b/><c><b/></c></a>')
+        self.assertEqual(1, len(root.findall("c")))
+        self.assertEqual(2, len(root.findall(".//c")))
+        self.assertEqual(3, len(root.findall(".//b")))
+        self.assertTrue(root.findall(".//b")[1] is root.getchildren()[1])
+
+    def test_findall_ns(self):
+        XML = self.XML
+        root = XML('<a xmlns:x="X" xmlns:y="Y"><x:b><c/></x:b><b/><c><x:b/><b/></c><b/></a>')
+        self.assertEqual(2, len(root.findall(".//{X}b")))
+        self.assertEqual(3, len(root.findall(".//b")))
+        self.assertEqual(2, len(root.findall("b")))
+
+    def test_build_tree(self):
+        root = self.Element('root')
+        root.a = 5
+        root.b = 6
+        self.assertTrue(isinstance(root, objectify.ObjectifiedElement))
+        self.assertTrue(isinstance(root.a, objectify.IntElement))
+        self.assertTrue(isinstance(root.b, objectify.IntElement))
+
+    def test_type_NoneType(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+
+        nil_attr = XML_SCHEMA_NIL_ATTR
+        root = Element("{objectified}root")
+        SubElement(root, "{objectified}none")
+        SubElement(root, "{objectified}none", {nil_attr : "true"})
+        self.assertFalse(isinstance(root.none, objectify.NoneElement))
+        self.assertFalse(isinstance(root.none[0], objectify.NoneElement))
+        self.assertTrue(isinstance(root.none[1], objectify.NoneElement))
+        self.assertEqual(hash(root.none[1]), hash(None))
+        self.assertEqual(root.none[1], None)
+        self.assertFalse(root.none[1])
+
+    def test_data_element_NoneType(self):
+        value = objectify.DataElement(None)
+        self.assertTrue(isinstance(value, objectify.NoneElement))
+        self.assertEqual(value, None)
+        self.assertEqual(value.get(XML_SCHEMA_NIL_ATTR), "true")
+
+    def test_type_bool(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.bool = True
+        self.assertEqual(root.bool, True)
+        self.assertEqual(root.bool + root.bool, True + True)
+        self.assertEqual(True + root.bool, True + root.bool)
+        self.assertEqual(root.bool * root.bool, True * True)
+        self.assertEqual(int(root.bool), int(True))
+        self.assertEqual(hash(root.bool), hash(True))
+        self.assertEqual(complex(root.bool), complex(True))
+        self.assertTrue(isinstance(root.bool, objectify.BoolElement))
+
+        root.bool = False
+        self.assertEqual(root.bool, False)
+        self.assertEqual(root.bool + root.bool, False + False)
+        self.assertEqual(False + root.bool, False + root.bool)
+        self.assertEqual(root.bool * root.bool, False * False)
+        self.assertEqual(int(root.bool), int(False))
+        self.assertEqual(hash(root.bool), hash(False))
+        self.assertEqual(complex(root.bool), complex(False))
+        self.assertTrue(isinstance(root.bool, objectify.BoolElement))
+
+    def test_data_element_bool(self):
+        value = objectify.DataElement(True)
+        self.assertTrue(isinstance(value, objectify.BoolElement))
+        self.assertEqual(value, True)
+
+        value = objectify.DataElement(False)
+        self.assertTrue(isinstance(value, objectify.BoolElement))
+        self.assertEqual(value, False)
+
+    def test_type_str(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = "test"
+        self.assertTrue(isinstance(root.s, objectify.StringElement))
+
+    def test_type_str_intliteral(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = "3"
+        self.assertTrue(isinstance(root.s, objectify.StringElement))
+
+    def test_type_str_floatliteral(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = "3.72"
+        self.assertTrue(isinstance(root.s, objectify.StringElement))
+
+    def test_type_str_mul(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = "test"
+
+        self.assertEqual("test" * 5, root.s * 5)
+        self.assertEqual(5 * "test", 5 * root.s)
+
+        self.assertRaises(TypeError, operator.mul, root.s, "honk")
+        self.assertRaises(TypeError, operator.mul, "honk", root.s)
+
+    def test_type_str_add(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = "test"
+
+        s = "toast"
+        self.assertEqual("test" + s, root.s + s)
+        self.assertEqual(s + "test", s + root.s)
+            
+    def test_type_str_mod(self):
+        s = "%d %f %s %r"
+        el = objectify.DataElement(s)
+        values = (1, 7.0, "abcd", None)
+        self.assertEqual(s % values, el % values)
+
+        s = "%d"
+        el = objectify.DataElement(s)
+        val = 5
+        self.assertEqual(s % val, el % val)
+
+        s = "%d %s"
+        el = objectify.DataElement(s)
+        val = 5
+        self.assertRaises(TypeError, el.__mod__, val)
+
+        s = ""
+        el = objectify.DataElement(s)
+        val = 5
+        self.assertRaises(TypeError, el.__mod__, val)
+
+    def test_type_str_hash(self):
+        v = "1"
+        el = objectify.DataElement(v)
+        self.assertEqual(hash(el), hash("1"))
+
+    def test_type_str_as_int(self):
+        v = "1"
+        el = objectify.DataElement(v)
+        self.assertEqual(int(el), 1)
+            
+    def test_type_str_as_float(self):
+        v = "1"
+        el = objectify.DataElement(v)
+        self.assertEqual(float(el), 1)
+
+    def test_type_str_as_complex(self):
+        v = "1"
+        el = objectify.DataElement(v)
+        self.assertEqual(complex(el), 1)
+            
+    def test_type_str_mod_data_elements(self):
+        s = "%d %f %s %r"
+        el = objectify.DataElement(s)
+        values = (objectify.DataElement(1),
+                  objectify.DataElement(7.0),
+                  objectify.DataElement("abcd"),
+                  objectify.DataElement(None))
+        self.assertEqual(s % values, el % values)
+
+    def test_data_element_str(self):
+        value = objectify.DataElement("test")
+        self.assertTrue(isinstance(value, objectify.StringElement))
+        self.assertEqual(value, "test")
+
+    def test_data_element_str_intliteral(self):
+        value = objectify.DataElement("3")
+        self.assertTrue(isinstance(value, objectify.StringElement))
+        self.assertEqual(value, "3")
+
+    def test_data_element_str_floatliteral(self):
+        value = objectify.DataElement("3.20")
+        self.assertTrue(isinstance(value, objectify.StringElement))
+        self.assertEqual(value, "3.20")
+
+    def test_type_ustr(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = _str("test")
+        self.assertTrue(isinstance(root.s, objectify.StringElement))
+
+    def test_type_ustr_intliteral(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = _str("3")
+        self.assertTrue(isinstance(root.s, objectify.StringElement))
+
+    def test_type_ustr_floatliteral(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = _str("3.72")
+        self.assertTrue(isinstance(root.s, objectify.StringElement))
+
+    def test_type_ustr_mul(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = _str("test")
+
+        self.assertEqual(_str("test") * 5, root.s * 5)
+        self.assertEqual(5 * _str("test"), 5 * root.s)
+
+        self.assertRaises(TypeError, operator.mul, root.s, _str("honk"))
+        self.assertRaises(TypeError, operator.mul, _str("honk"), root.s)
+
+    def test_type_ustr_add(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.s = _str("test")
+
+        s = _str("toast")
+        self.assertEqual(_str("test") + s, root.s + s)
+        self.assertEqual(s + _str("test"), s + root.s)
+
+    def test_data_element_ustr(self):
+        value = objectify.DataElement(_str("test"))
+        self.assertTrue(isinstance(value, objectify.StringElement))
+        self.assertEqual(value, _str("test"))
+
+    def test_data_element_ustr_intliteral(self):
+        value = objectify.DataElement("3")
+        self.assertTrue(isinstance(value, objectify.StringElement))
+        self.assertEqual(value, _str("3"))
+
+    def test_data_element_ustr_floatliteral(self):
+        value = objectify.DataElement(_str("3.20"))
+        self.assertTrue(isinstance(value, objectify.StringElement))
+        self.assertEqual(value, _str("3.20"))
+
+    def test_type_int(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.none = 5
+        self.assertTrue(isinstance(root.none, objectify.IntElement))
+
+    def test_data_element_int(self):
+        value = objectify.DataElement(5)
+        self.assertTrue(isinstance(value, objectify.IntElement))
+        self.assertEqual(value, 5)
+
+    def test_data_element_int_hash(self):
+        value = objectify.DataElement(123)
+        self.assertEqual(hash(value), hash(123))
+
+    def test_type_float(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        root = Element("{objectified}root")
+        root.none = 5.5
+        self.assertTrue(isinstance(root.none, objectify.FloatElement))
+
+    def test_data_element_float(self):
+        value = objectify.DataElement(5.5)
+        self.assertTrue(isinstance(value, objectify.FloatElement))
+        self.assertEqual(value, 5.5)
+
+    def test_data_element_float_hash(self):
+        value = objectify.DataElement(5.5)
+        self.assertEqual(hash(value), hash(5.5))
+
+    def test_data_element_xsitypes(self):
+        for xsi, objclass in xsitype2objclass.items():
+            # 1 is a valid value for all ObjectifiedDataElement classes
+            pyval = 1
+            value = objectify.DataElement(pyval, _xsi=xsi)
+            self.assertTrue(isinstance(value, objclass),
+                         "DataElement(%s, _xsi='%s') returns %s, expected %s"
+                         % (pyval, xsi, type(value), objclass))
+        
+    def test_data_element_xsitypes_xsdprefixed(self):
+        for xsi, objclass in xsitype2objclass.items():
+            # 1 is a valid value for all ObjectifiedDataElement classes
+            pyval = 1
+            value = objectify.DataElement(pyval, _xsi="xsd:%s" % xsi)
+            self.assertTrue(isinstance(value, objclass),
+                         "DataElement(%s, _xsi='%s') returns %s, expected %s"
+                         % (pyval, xsi, type(value), objclass))
+        
+    def test_data_element_xsitypes_prefixed(self):
+        for xsi, objclass in xsitype2objclass.items():
+            # 1 is a valid value for all ObjectifiedDataElement classes
+            self.assertRaises(ValueError, objectify.DataElement, 1,
+                              _xsi="foo:%s" % xsi)
+
+    def test_data_element_pytypes(self):
+        for pytype, objclass in pytype2objclass.items():
+            # 1 is a valid value for all ObjectifiedDataElement classes
+            pyval = 1
+            value = objectify.DataElement(pyval, _pytype=pytype)
+            self.assertTrue(isinstance(value, objclass),
+                         "DataElement(%s, _pytype='%s') returns %s, expected %s"
+                         % (pyval, pytype, type(value), objclass))
+
+    def test_data_element_pytype_none(self):
+        pyval = 1
+        pytype = "NoneType"
+        objclass = objectify.NoneElement
+        value = objectify.DataElement(pyval, _pytype=pytype)
+        self.assertTrue(isinstance(value, objclass),
+                     "DataElement(%s, _pytype='%s') returns %s, expected %s"
+                     % (pyval, pytype, type(value), objclass))
+        self.assertEqual(value.text, None)
+        self.assertEqual(value.pyval, None)
+            
+    def test_data_element_pytype_none_compat(self):
+        # pre-2.0 lxml called NoneElement "none"
+        pyval = 1
+        pytype = "none"
+        objclass = objectify.NoneElement
+        value = objectify.DataElement(pyval, _pytype=pytype)
+        self.assertTrue(isinstance(value, objclass),
+                     "DataElement(%s, _pytype='%s') returns %s, expected %s"
+                     % (pyval, pytype, type(value), objclass))
+        self.assertEqual(value.text, None)
+        self.assertEqual(value.pyval, None)
+
+    def test_type_unregistered(self):
+        Element = self.Element
+        SubElement = self.etree.SubElement
+        class MyFloat(float):
+            pass
+        root = Element("{objectified}root")
+        root.myfloat = MyFloat(5.5)
+        self.assertTrue(isinstance(root.myfloat, objectify.FloatElement))
+        self.assertEqual(root.myfloat.get(objectify.PYTYPE_ATTRIBUTE), None)
+
+    def test_data_element_unregistered(self):
+        class MyFloat(float):
+            pass
+        value = objectify.DataElement(MyFloat(5.5))
+        self.assertTrue(isinstance(value, objectify.FloatElement))
+        self.assertEqual(value, 5.5)
+        self.assertEqual(value.get(objectify.PYTYPE_ATTRIBUTE), None)
+
+    def test_schema_types(self):
+        XML = self.XML
+        root = XML('''\
+        <root xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+          <b xsi:type="boolean">true</b>
+          <b xsi:type="boolean">false</b>
+          <b xsi:type="boolean">1</b>
+          <b xsi:type="boolean">0</b>
+
+          <f xsi:type="float">5</f>
+          <f xsi:type="double">5</f>
+        
+          <s xsi:type="string">5</s>
+          <s xsi:type="normalizedString">5</s>
+          <s xsi:type="token">5</s>
+          <s xsi:type="language">5</s>
+          <s xsi:type="Name">5</s>
+          <s xsi:type="NCName">5</s>
+          <s xsi:type="ID">5</s>
+          <s xsi:type="IDREF">5</s>
+          <s xsi:type="ENTITY">5</s>
+          <s xsi:type="NMTOKEN">5</s>
+
+          <l xsi:type="integer">5</l>
+          <l xsi:type="nonPositiveInteger">5</l>
+          <l xsi:type="negativeInteger">5</l>
+          <l xsi:type="long">5</l>
+          <l xsi:type="nonNegativeInteger">5</l>
+          <l xsi:type="unsignedLong">5</l>
+          <l xsi:type="unsignedInt">5</l>
+          <l xsi:type="positiveInteger">5</l>
+          
+          <i xsi:type="int">5</i>
+          <i xsi:type="short">5</i>
+          <i xsi:type="byte">5</i>
+          <i xsi:type="unsignedShort">5</i>
+          <i xsi:type="unsignedByte">5</i>
+
+          <n xsi:nil="true"/>
+        </root>
+        ''')
+
+        for b in root.b:
+            self.assertTrue(isinstance(b, objectify.BoolElement))
+        self.assertEqual(True,  root.b[0])
+        self.assertEqual(False, root.b[1])
+        self.assertEqual(True,  root.b[2])
+        self.assertEqual(False, root.b[3])
+
+        for f in root.f:
+            self.assertTrue(isinstance(f, objectify.FloatElement))
+            self.assertEqual(5, f)
+            
+        for s in root.s:
+            self.assertTrue(isinstance(s, objectify.StringElement))
+            self.assertEqual("5", s)
+
+        for i in root.i:
+            self.assertTrue(isinstance(i, objectify.IntElement))
+            self.assertEqual(5, i)
+
+        for l in root.l:
+            self.assertTrue(isinstance(l, objectify.IntElement))
+            self.assertEqual(5, i)
+            
+        self.assertTrue(isinstance(root.n, objectify.NoneElement))
+        self.assertEqual(None, root.n)
+
+    def test_schema_types_prefixed(self):
+        # xsi:type values written with the xsd: prefix must select the classes
+        root = self.XML('''\
+        <root xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+          <b xsi:type="xsd:boolean">true</b>
+          <b xsi:type="xsd:boolean">false</b>
+          <b xsi:type="xsd:boolean">1</b>
+          <b xsi:type="xsd:boolean">0</b>
+
+          <f xsi:type="xsd:float">5</f>
+          <f xsi:type="xsd:double">5</f>
+        
+          <s xsi:type="xsd:string">5</s>
+          <s xsi:type="xsd:normalizedString">5</s>
+          <s xsi:type="xsd:token">5</s>
+          <s xsi:type="xsd:language">5</s>
+          <s xsi:type="xsd:Name">5</s>
+          <s xsi:type="xsd:NCName">5</s>
+          <s xsi:type="xsd:ID">5</s>
+          <s xsi:type="xsd:IDREF">5</s>
+          <s xsi:type="xsd:ENTITY">5</s>
+          <s xsi:type="xsd:NMTOKEN">5</s>
+
+          <l xsi:type="xsd:integer">5</l>
+          <l xsi:type="xsd:nonPositiveInteger">5</l>
+          <l xsi:type="xsd:negativeInteger">5</l>
+          <l xsi:type="xsd:long">5</l>
+          <l xsi:type="xsd:nonNegativeInteger">5</l>
+          <l xsi:type="xsd:unsignedLong">5</l>
+          <l xsi:type="xsd:unsignedInt">5</l>
+          <l xsi:type="xsd:positiveInteger">5</l>
+          
+          <i xsi:type="xsd:int">5</i>
+          <i xsi:type="xsd:short">5</i>
+          <i xsi:type="xsd:byte">5</i>
+          <i xsi:type="xsd:unsignedShort">5</i>
+          <i xsi:type="xsd:unsignedByte">5</i>
+
+          <n xsi:nil="true"/>
+        </root>
+        ''')
+
+        for bool_el in root.b:
+            self.assertTrue(isinstance(bool_el, objectify.BoolElement))
+        self.assertEqual(True,  root.b[0])
+        self.assertEqual(False, root.b[1])
+        self.assertEqual(True,  root.b[2])
+        self.assertEqual(False, root.b[3])
+
+        for float_el in root.f:
+            self.assertTrue(isinstance(float_el, objectify.FloatElement))
+            self.assertEqual(5, float_el)
+
+        for str_el in root.s:
+            self.assertTrue(isinstance(str_el, objectify.StringElement))
+            self.assertEqual("5", str_el)
+
+        for int_el in root.i:
+            self.assertTrue(isinstance(int_el, objectify.IntElement))
+            self.assertEqual(5, int_el)
+
+        for long_el in root.l:
+            self.assertTrue(isinstance(long_el, objectify.IntElement))
+            self.assertEqual(5, long_el)
+
+        nil_el = root.n
+        self.assertTrue(isinstance(nil_el, objectify.NoneElement))
+        
+    def test_type_str_sequence(self):
+        # str() applied to every <b> sibling must give back that
+        # element's text, in document order
+        root = self.XML(_bytes('<root><b>why</b><b>try</b></root>'))
+        texts = list(map(str, root.b))
+        self.assertEqual(["why", "try"], texts)
+
+    def test_type_str_cmp(self):
+        # string elements order like their text: "test" sorts after "taste"
+        root = self.XML(_bytes('<root><b>test</b><b>taste</b><b></b><b/></root>'))
+        test_el, taste_el = root.b[0], root.b[1]
+        self.assertFalse(test_el <  taste_el)
+        self.assertFalse(test_el <= taste_el)
+        self.assertFalse(test_el == taste_el)
+        self.assertTrue(test_el != taste_el)
+        self.assertTrue(test_el >= taste_el)
+        self.assertTrue(test_el >  taste_el)
+
+        self.assertEqual(test_el, "test")
+        self.assertEqual("test", test_el)
+
+        self.assertEqual("", root.b[2])
+        self.assertEqual(root.b[2], "")
+        self.assertEqual("", root.b[3])
+        self.assertEqual(root.b[3], "")
+        self.assertEqual(root.b[2], root.b[3])
+
+        root.b = "test"
+        self.assertTrue(root.b)
+        root.b = ""
+        self.assertFalse(root.b)
+        self.assertEqual(root.b, "")
+        self.assertEqual("", root.b)
+
+    def test_type_int_cmp(self):
+        # integer elements compare numerically and differ from the string "5"
+        root = self.XML(_bytes('<root><b>5</b><b>6</b></root>'))
+        five, six = root.b[0], root.b[1]
+        self.assertTrue(five <  six)
+        self.assertTrue(five <= six)
+        self.assertTrue(five != six)
+        self.assertFalse(five == six)
+        self.assertFalse(five >= six)
+        self.assertFalse(five >  six)
+
+        self.assertEqual(five, 5)
+        self.assertEqual(5, five)
+        self.assertNotEqual(five, "5")
+
+        root.b = 5
+        self.assertTrue(root.b)
+        root.b = 0
+        self.assertFalse(root.b)
+        
+    # float + long share the NumberElement implementation with int
+
+    def test_type_bool_cmp(self):
+        # boolean elements order like Python bools: false < true < 5
+        root = self.XML(_bytes('<root><b>false</b><b>true</b></root>'))
+        false_el, true_el = root.b[0], root.b[1]
+        self.assertTrue(false_el <  true_el)
+        self.assertTrue(false_el <= true_el)
+        self.assertTrue(false_el != true_el)
+        self.assertFalse(false_el == true_el)
+        self.assertFalse(false_el >= true_el)
+        self.assertFalse(false_el >  true_el)
+
+        self.assertFalse(false_el)
+        self.assertTrue(true_el)
+
+        self.assertEqual(false_el, False)
+        self.assertEqual(False, false_el)
+        self.assertTrue(false_el <  5)
+        self.assertTrue(5 > false_el)
+
+        root.b = True
+        self.assertTrue(root.b)
+        root.b = False
+        self.assertFalse(root.b)
+
+    def test_type_none_cmp(self):
+        # xsi:nil elements are falsy, equal to None and equal to each other
+        root = self.XML(_bytes("""
+        <root xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+          <b xsi:nil="true"></b><b xsi:nil="true"/>
+        </root>"""))
+        first_nil, second_nil = root.b[0], root.b[1]
+        self.assertTrue(first_nil == second_nil)
+        self.assertFalse(first_nil)
+        self.assertEqual(first_nil, None)
+        self.assertEqual(None, first_nil)
+
+        # ordering against other values is not checked: doesn't work in Py3
+        #for comparison in ["abc", 5, 7.3, True, [], ()]:
+        #    none = root.b[1]
+        #    self.assertTrue(none < comparison, "%s (%s) should be < %s" %
+        #                 (none, type(none), comparison) )
+        #    self.assertTrue(comparison > none, "%s should be > %s (%s)" %
+        #                 (comparison, none, type(none)) )
+
+    def test_dataelement_xsi(self):
+        # an unprefixed _xsi type name must be stored as 'xsd:string'
+        data_el = objectify.DataElement(1, _xsi="string")
+        xsi_type = data_el.get(XML_SCHEMA_INSTANCE_TYPE_ATTR)
+        self.assertEqual(xsi_type, 'xsd:string')
+
+    def test_dataelement_xsi_nsmap(self):
+        # the prefix that nsmap binds to XML_SCHEMA_NS must be the one used
+        schema_nsmap = {'schema': XML_SCHEMA_NS}
+        data_el = objectify.DataElement(1, _xsi="string", nsmap=schema_nsmap)
+        xsi_type = data_el.get(XML_SCHEMA_INSTANCE_TYPE_ATTR)
+        self.assertEqual(xsi_type, 'schema:string')
+
+    def test_dataelement_xsi_prefix_error(self):
+        # an _xsi value carrying the "foo" prefix is expected to be rejected
+        self.assertRaises(ValueError, objectify.DataElement, 1, _xsi="foo:string")
+
+    def test_pytype_annotation(self):
+        # default annotate(): xsi:type is honoured, old py:pytype hints are not
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+          <b xsi:type="float">5</b>
+          <s xsi:type="string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.annotate(root)
+
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual("int", pytypes[0])
+        self.assertEqual("str", pytypes[1])
+        self.assertEqual("float", pytypes[2])
+        self.assertEqual("str", pytypes[3])
+        self.assertEqual("bool", pytypes[4])
+        self.assertEqual("NoneType", pytypes[5])
+        self.assertEqual(None, pytypes[6])
+        self.assertEqual("float", pytypes[7])
+        self.assertEqual("float", pytypes[8])
+        self.assertEqual("str", pytypes[9])
+        self.assertEqual("int", pytypes[10])
+        self.assertEqual("int", pytypes[11])
+        self.assertEqual("int", pytypes[12])
+        self.assertEqual(None, pytypes[13])
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+
+    def test_pytype_annotation_empty(self):
+        # an empty element gets no pytype unless empty_pytype names one
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <n></n>
+        </a>
+        '''))
+        objectify.annotate(root)
+
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual(None, pytypes[0])
+
+        objectify.annotate(root, empty_pytype="str")
+
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual("str", pytypes[0])
+
+    def test_pytype_annotation_use_old(self):
+        # ignore_old=False keeps py:pytype hints ("long" is reported as "int")
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+          <b xsi:type="float">5</b>
+          <s xsi:type="string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.annotate(root, ignore_old=False)
+
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual("int", pytypes[0])
+        self.assertEqual("str", pytypes[1])
+        self.assertEqual("float", pytypes[2])
+        self.assertEqual("str", pytypes[3])
+        self.assertEqual("bool", pytypes[4])
+        self.assertEqual("NoneType", pytypes[5])
+        self.assertEqual(None, pytypes[6])
+        self.assertEqual("float", pytypes[7])
+        self.assertEqual("float", pytypes[8])
+        self.assertEqual("str", pytypes[9])
+        self.assertEqual("str", pytypes[10])
+        self.assertEqual("float", pytypes[11])
+        self.assertEqual("int", pytypes[12])
+        self.assertEqual(TREE_PYTYPE, pytypes[13])
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+
+    def test_pytype_xsitype_annotation(self):
+        # annotate() asked to write both py:pytype and xsi:type while
+        # keeping old hints: check each attribute family on every child
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+          <b xsi:type="float">5</b>
+          <s xsi:type="string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.annotate(root, ignore_old=False, ignore_xsi=False,
+                           annotate_xsi=1, annotate_pytype=1)
+
+        # check py annotations
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual("int", pytypes[0])
+        self.assertEqual("str", pytypes[1])
+        self.assertEqual("float", pytypes[2])
+        self.assertEqual("str", pytypes[3])
+        self.assertEqual("bool", pytypes[4])
+        self.assertEqual("NoneType", pytypes[5])
+        self.assertEqual(None, pytypes[6])
+        self.assertEqual("float", pytypes[7])
+        self.assertEqual("float", pytypes[8])
+        self.assertEqual("str", pytypes[9])
+        self.assertEqual("str", pytypes[10])
+        self.assertEqual("float", pytypes[11])
+        self.assertEqual("int", pytypes[12])
+        self.assertEqual(TREE_PYTYPE, pytypes[13])
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+
+        # check xsi annotations; the attribute list is collected once,
+        # under its own name, so it cannot be mistaken for the pytype
+        # list checked above
+        xsi_types = [child.get(XML_SCHEMA_INSTANCE_TYPE_ATTR)
+                     for child in root.iterchildren()]
+        self.assertEqual("xsd:integer", xsi_types[0])
+        self.assertEqual("xsd:string", xsi_types[1])
+        self.assertEqual("xsd:double", xsi_types[2])
+        self.assertEqual("xsd:string", xsi_types[3])
+        self.assertEqual("xsd:boolean", xsi_types[4])
+        self.assertEqual(None, xsi_types[5])
+        self.assertEqual(None, xsi_types[6])
+        self.assertEqual("xsd:double", xsi_types[7])
+        self.assertEqual("xsd:float", xsi_types[8])
+        self.assertEqual("xsd:string", xsi_types[9])
+        self.assertEqual("xsd:string", xsi_types[10])
+        self.assertEqual("xsd:double", xsi_types[11])
+        self.assertEqual("xsd:integer", xsi_types[12])
+        self.assertEqual(None, xsi_types[13])
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+
+    def test_xsiannotate_use_old(self):
+        # ignore_old=False keeps existing xsi:type values (now xsd:-prefixed)
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+          <b xsi:type="float">5</b>
+          <s xsi:type="string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.xsiannotate(root, ignore_old=False)
+
+        xsi_types = [child.get(XML_SCHEMA_INSTANCE_TYPE_ATTR)
+                     for child in root.iterchildren()]
+        self.assertEqual("xsd:integer", xsi_types[0])
+        self.assertEqual("xsd:string", xsi_types[1])
+        self.assertEqual("xsd:double", xsi_types[2])
+        self.assertEqual("xsd:string", xsi_types[3])
+        self.assertEqual("xsd:boolean", xsi_types[4])
+        self.assertEqual(None, xsi_types[5])
+        self.assertEqual(None, xsi_types[6])
+        self.assertEqual("xsd:double", xsi_types[7])
+        self.assertEqual("xsd:float", xsi_types[8])
+        self.assertEqual("xsd:string", xsi_types[9])
+        self.assertEqual("xsd:string", xsi_types[10])
+        self.assertEqual("xsd:double", xsi_types[11])
+        self.assertEqual("xsd:integer", xsi_types[12])
+        self.assertEqual(None, xsi_types[13])
+
+    def test_pyannotate_ignore_old(self):
+        # ignore_old=True: py:pytype hints are dropped, xsi:type still counts
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+          <b xsi:type="float">5</b>
+          <s xsi:type="string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.pyannotate(root, ignore_old=True)
+
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual("int", pytypes[0])
+        self.assertEqual("str", pytypes[1])
+        self.assertEqual("float", pytypes[2])
+        self.assertEqual("str", pytypes[3])
+        self.assertEqual("bool", pytypes[4])
+        self.assertEqual("NoneType", pytypes[5])
+        self.assertEqual(None, pytypes[6])
+        self.assertEqual("float", pytypes[7])
+        self.assertEqual("float", pytypes[8])
+        self.assertEqual("str", pytypes[9])
+        self.assertEqual("int", pytypes[10])
+        self.assertEqual("int", pytypes[11])
+        self.assertEqual("int", pytypes[12])
+        self.assertEqual(None, pytypes[13])
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+
+    def test_pyannotate_empty(self):
+        # an empty element gets no pytype unless empty_pytype names one
+        root = self.XML('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <n></n>
+        </a>
+        ''')
+        objectify.pyannotate(root)
+
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual(None, pytypes[0])
+
+        # NOTE(review): this calls annotate(), not pyannotate() - confirm
+        objectify.annotate(root, empty_pytype="str")
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual("str", pytypes[0])
+
+    def test_pyannotate_use_old(self):
+        # pyannotate() without options keeps the existing py:pytype hints
+        root = self.XML('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+          <b xsi:type="float">5</b>
+          <s xsi:type="string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        ''')
+        objectify.pyannotate(root)
+
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual("int", pytypes[0])
+        self.assertEqual("str", pytypes[1])
+        self.assertEqual("float", pytypes[2])
+        self.assertEqual("str", pytypes[3])
+        self.assertEqual("bool", pytypes[4])
+        self.assertEqual("NoneType", pytypes[5])
+        self.assertEqual(None, pytypes[6])
+        self.assertEqual("float", pytypes[7])
+        self.assertEqual("float", pytypes[8])
+        self.assertEqual("str", pytypes[9])
+        self.assertEqual("str", pytypes[10])
+        self.assertEqual("float", pytypes[11])
+        self.assertEqual("int", pytypes[12])
+        self.assertEqual(TREE_PYTYPE, pytypes[13])
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+        
+    def test_xsiannotate_ignore_old(self):
+        # ignore_old=True re-derives xsi:type; py:pytype hints still count
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+          <b xsi:type="float">5</b>
+          <s xsi:type="string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.xsiannotate(root, ignore_old=True)
+
+        xsi_types = [child.get(XML_SCHEMA_INSTANCE_TYPE_ATTR)
+                     for child in root.iterchildren()]
+        self.assertEqual("xsd:integer", xsi_types[0])
+        self.assertEqual("xsd:string", xsi_types[1])
+        self.assertEqual("xsd:double", xsi_types[2])
+        self.assertEqual("xsd:string", xsi_types[3])
+        self.assertEqual("xsd:boolean", xsi_types[4])
+        self.assertEqual(None, xsi_types[5])
+        self.assertEqual(None, xsi_types[6])
+        self.assertEqual("xsd:integer", xsi_types[7])
+        self.assertEqual("xsd:integer", xsi_types[8])
+        self.assertEqual("xsd:integer", xsi_types[9])
+        self.assertEqual("xsd:string", xsi_types[10])
+        self.assertEqual("xsd:double", xsi_types[11])
+        self.assertEqual("xsd:integer", xsi_types[12])
+        self.assertEqual(None, xsi_types[13])
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+
+    def test_deannotate(self):
+        # default deannotate() strips xsi:type and pytype but keeps xsi:nil
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+          <b xsi:type="float">5</b>
+          <s xsi:type="string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.deannotate(root)
+
+        for elem in root.iter():  # iter() supersedes deprecated getiterator()
+            self.assertEqual(None, elem.get(XML_SCHEMA_INSTANCE_TYPE_ATTR))
+            self.assertEqual(None, elem.get(objectify.PYTYPE_ATTRIBUTE))
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+
+    def test_xsinil_deannotate(self):
+        # deannotate(xsi_nil=True) alone removes xsi:nil and keeps the types
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+          <b xsi:type="float">5</b>
+          <s xsi:type="string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.annotate(
+            root, ignore_old=False, ignore_xsi=False, annotate_xsi=True,
+            empty_pytype='str', empty_type='string')
+        objectify.deannotate(root, pytype=False, xsi=False, xsi_nil=True)
+
+        xsi_types = [child.get(XML_SCHEMA_INSTANCE_TYPE_ATTR)
+                     for child in root.iterchildren()]
+        self.assertEqual("xsd:integer", xsi_types[0])
+        self.assertEqual("xsd:string", xsi_types[1])
+        self.assertEqual("xsd:double", xsi_types[2])
+        self.assertEqual("xsd:string", xsi_types[3])
+        self.assertEqual("xsd:boolean", xsi_types[4])
+        self.assertEqual(None, xsi_types[5])
+        self.assertEqual("xsd:string", xsi_types[6])
+        self.assertEqual("xsd:double", xsi_types[7])
+        self.assertEqual("xsd:float", xsi_types[8])
+        self.assertEqual("xsd:string", xsi_types[9])
+        self.assertEqual("xsd:string", xsi_types[10])
+        self.assertEqual("xsd:double", xsi_types[11])
+        self.assertEqual("xsd:integer", xsi_types[12])
+        self.assertEqual(None, xsi_types[13])
+
+        self.assertEqual(None, root.n.get(XML_SCHEMA_NIL_ATTR))
+
+        for child in root.iterchildren():
+            pytype = child.get(objectify.PYTYPE_ATTRIBUTE)
+            self.assertNotEqual(None, pytype)
+            # these have no equivalent in xsi:type
+            if pytype not in [TREE_PYTYPE, "NoneType"]:
+                self.assertNotEqual(
+                    None, child.get(XML_SCHEMA_INSTANCE_TYPE_ATTR))
+
+    def test_xsitype_deannotate(self):
+        # deannotate(pytype=False) keeps pytypes, strips every xsi:type
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype"
+        xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="xsd:double">5</b>
+          <b xsi:type="xsd:float">5</b>
+          <s xsi:type="xsd:string">23</s>
+          <s py:pytype="str">42</s>
+          <f py:pytype="float">300</f>
+          <l py:pytype="long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.annotate(root)
+        objectify.deannotate(root, pytype=False)
+
+        pytypes = [child.get(objectify.PYTYPE_ATTRIBUTE)
+                   for child in root.iterchildren()]
+        self.assertEqual("int", pytypes[0])
+        self.assertEqual("str", pytypes[1])
+        self.assertEqual("float", pytypes[2])
+        self.assertEqual("str", pytypes[3])
+        self.assertEqual("bool", pytypes[4])
+        self.assertEqual("NoneType", pytypes[5])
+        self.assertEqual(None, pytypes[6])
+        self.assertEqual("float", pytypes[7])
+        self.assertEqual("float", pytypes[8])
+        self.assertEqual("str", pytypes[9])
+        self.assertEqual("int", pytypes[10])
+        self.assertEqual("int", pytypes[11])
+        self.assertEqual("int", pytypes[12])
+        self.assertEqual(None, pytypes[13])
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+
+        for elem in root.iter():  # iter() supersedes deprecated getiterator()
+            self.assertEqual(None, elem.get(XML_SCHEMA_INSTANCE_TYPE_ATTR))
+
+    def test_pytype_deannotate(self):
+        # deannotate(xsi=False) keeps xsi:type values, strips every pytype
+        root = self.XML(_bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+        xmlns:py="http://codespeak.net/lxml/objectify/pytype"
+        xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+          <b xsi:type="xsd:int">5</b>
+          <b xsi:type="xsd:string">test</b>
+          <c xsi:type="xsd:float">1.1</c>
+          <c xsi:type="xsd:string">\uF8D2</c>
+          <x xsi:type="xsd:boolean">true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="xsd:double">5</b>
+          <b xsi:type="xsd:float">5</b>
+          <s xsi:type="xsd:string">23</s>
+          <s xsi:type="xsd:string">42</s>
+          <f xsi:type="xsd:float">300</f>
+          <l xsi:type="xsd:long">2</l>
+          <t py:pytype="TREE"></t>
+        </a>
+        '''))
+        objectify.annotate(root)
+        objectify.deannotate(root, xsi=False)
+
+        xsi_types = [child.get(XML_SCHEMA_INSTANCE_TYPE_ATTR)
+                     for child in root.iterchildren()]
+        self.assertEqual("xsd:int", xsi_types[0])
+        self.assertEqual("xsd:string", xsi_types[1])
+        self.assertEqual("xsd:float", xsi_types[2])
+        self.assertEqual("xsd:string", xsi_types[3])
+        self.assertEqual("xsd:boolean", xsi_types[4])
+        self.assertEqual(None, xsi_types[5])
+        self.assertEqual(None, xsi_types[6])
+        self.assertEqual("xsd:double", xsi_types[7])
+        self.assertEqual("xsd:float", xsi_types[8])
+        self.assertEqual("xsd:string", xsi_types[9])
+        self.assertEqual("xsd:string", xsi_types[10])
+        self.assertEqual("xsd:float", xsi_types[11])
+        self.assertEqual("xsd:long", xsi_types[12])
+        self.assertEqual(None, xsi_types[13])
+
+        self.assertEqual("true", root.n.get(XML_SCHEMA_NIL_ATTR))
+
+        for elem in root.iter():  # iter() supersedes deprecated getiterator()
+            self.assertEqual(None, elem.get(objectify.PYTYPE_ATTRIBUTE))
+
+    def test_change_pytype_attribute(self):
+        # annotate() must write its hint under whichever attribute tag was
+        # last configured through set_pytype_attribute_tag()
+        xml = _bytes('''\
+        <a xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+          <b>5</b>
+          <b>test</b>
+          <c>1.1</c>
+          <c>\uF8D2</c>
+          <x>true</x>
+          <n xsi:nil="true" />
+          <n></n>
+          <b xsi:type="double">5</b>
+        </a>
+        ''')
+
+        def count_attrs(node, ns, name):
+            # number of {ns}name attributes anywhere in node's document
+            found = node.xpath("//@py:%s" % name, namespaces={"py": ns})
+            return len(found)
+
+        default_ns, default_name = objectify.PYTYPE_ATTRIBUTE[1:].split('}')
+        objectify.set_pytype_attribute_tag("{TEST}test")
+
+        root = self.XML(xml)
+        objectify.annotate(root)
+
+        # only the custom attribute may have been written
+        self.assertEqual(0, count_attrs(root, default_ns, default_name))
+        self.assertEqual(7, count_attrs(root, "TEST", "test"))
+
+        # reset the tag; it must no longer be the TEST one
+        objectify.set_pytype_attribute_tag()
+        pytype_ns, pytype_name = objectify.PYTYPE_ATTRIBUTE[1:].split('}')
+
+        self.assertNotEqual("test", pytype_ns.lower())
+        self.assertNotEqual("test", pytype_name.lower())
+
+        # a freshly parsed tree carries no hints until it is annotated
+        root = self.XML(xml)
+        self.assertEqual(0, count_attrs(root, pytype_ns, pytype_name))
+
+        objectify.annotate(root)
+        self.assertEqual(7, count_attrs(root, pytype_ns, pytype_name))
+
+    def test_registered_types(self):
+        # exercise PyType.register()/unregister() and before/after ordering
+        initial = objectify.getRegisteredTypes()
+        initial[0].unregister()
+        self.assertEqual(initial[1:], objectify.getRegisteredTypes())
+
+        class NewType(objectify.ObjectifiedDataElement):
+            pass
+        def checkMyType(s):
+            return True
+
+        pytype = objectify.PyType("mytype", checkMyType, NewType)
+        self.assertFalse(pytype in objectify.getRegisteredTypes())
+        pytype.register()
+        self.assertTrue(pytype in objectify.getRegisteredTypes())
+        pytype.unregister()
+        self.assertFalse(pytype in objectify.getRegisteredTypes())
+
+        pytype.register(before=[objectify.getRegisteredTypes()[0].name])
+        self.assertEqual(pytype, objectify.getRegisteredTypes()[0])
+        pytype.unregister()
+
+        pytype.register(after=[objectify.getRegisteredTypes()[0].name])
+        self.assertNotEqual(pytype, objectify.getRegisteredTypes()[0])
+        pytype.unregister()
+
+        known = objectify.getRegisteredTypes()
+        self.assertRaises(ValueError, pytype.register,
+                          before=[known[0].name], after=[known[1].name])
+
+    def test_registered_type_stringify(self):
+        # a PyType registered with a stringify function must round-trip
+        # datetime values assigned as attribute, built via E or DataElement
+        from datetime import datetime
+
+        def parse_date(value):
+            if len(value) != 14:
+                raise ValueError(value)
+            # fixed-width fields: YYYY MM DD hh mm ss
+            bounds = (0, 4, 6, 8, 10, 12, 14)
+            parts = [int(value[a:b]) for a, b in zip(bounds, bounds[1:])]
+            return datetime(*parts)
+
+        def stringify_date(date):
+            return date.strftime("%Y%m%d%H%M%S")
+
+        class DatetimeElement(objectify.ObjectifiedDataElement):
+            @property
+            def pyval(self):
+                return parse_date(self.text)
+
+        # positional arguments: name, type check, element class, stringify
+        datetime_type = objectify.PyType(
+            "datetime", parse_date, DatetimeElement, stringify_date)
+        datetime_type.xmlSchemaTypes = "dateTime"
+        datetime_type.register()
+
+        # the text format has no sub-second part, so expectations are
+        # derived from the stringified value rather than from now itself
+        now = datetime.now()
+        expected_text = stringify_date(now)
+
+        def check(elem):
+            # element class, parsed value and stored text must all agree
+            self.assertTrue(isinstance(elem, DatetimeElement))
+            self.assertTrue(isinstance(elem.pyval, datetime))
+            self.assertEqual(elem.pyval, parse_date(expected_text))
+            self.assertEqual(elem.text, expected_text)
+
+        NAMESPACE = "http://foo.net/xmlns"
+        NAMESPACE_MAP = {'ns': NAMESPACE}
+        root = objectify.Element("{%s}root" % NAMESPACE, nsmap=NAMESPACE_MAP)
+
+        # plain attribute assignment
+        root.date = now
+        check(root.date)
+
+        # element built by the E factory
+        root.date = objectify.E.date(now)
+        check(root.date)
+
+        # stand-alone data element
+        standalone = objectify.DataElement(now)
+        check(standalone)
+
+    def test_object_path(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath("root.c1.c2")
+        for lookup in (path.find, path):  # find() and __call__ must agree
+            self.assertEqual(root.c1.c2.text, lookup(root).text)
+
+    def test_object_path_list(self):
+        """A path given as a list of steps resolves to the named child."""
+        doc, steps = self.XML(xml_str), objectify.ObjectPath(['root', 'c1', 'c2'])
+        self.assertEqual(doc.c1.c2.text, steps.find(doc).text)
+        self.assertEqual(doc.c1.c2.text, steps(doc).text)
+
+    def test_object_path_fail(self):
+        """Calling a path that matches no child must raise AttributeError."""
+        missing = objectify.ObjectPath("root.c1.c99")
+        self.assertRaises(AttributeError, missing, self.XML(xml_str))
+
+    def test_object_path_default_absolute(self):
+        """Absolute paths that match nothing return the supplied default."""
+        doc = self.XML(xml_str)
+        # The miss happens at the last step, at a middle step, and at the
+        # root name itself, respectively.
+        for spec in ("root.c1.c99", "root.c99.c2", "notroot.c99.c2"):
+            lookup = objectify.ObjectPath(spec)
+            self.assertEqual(None, lookup(doc, None))
+
+    def test_object_path_default_relative(self):
+        """Relative paths that match nothing return the supplied default."""
+        doc = self.XML(xml_str)
+        for spec in (".c1.c99", ".c99.c2"):
+            lookup = objectify.ObjectPath(spec)
+            self.assertEqual(None, lookup(doc, None))
+
+    def test_object_path_syntax(self):
+        """Extra whitespace around steps, namespaces and indexes is accepted."""
+        doc = self.XML(xml_str)
+        for spec in ("root .    {objectified}c1.   c2",
+                     "   root.{objectified}  c1.c2  [ 0 ]   "):
+            found = objectify.ObjectPath(spec)(doc)
+            self.assertEqual(doc.c1.c2.text, found.text)
+
+    def test_object_path_fail_parse_empty(self):
+        self.assertRaises(ValueError, objectify.ObjectPath, "")
+
+    def test_object_path_fail_parse_empty_list(self):
+        self.assertRaises(ValueError, objectify.ObjectPath, [])
+
+    def test_object_path_hasattr(self):
+        """hasattr() is True for resolvable paths and False for the others."""
+        doc = self.XML(xml_str)
+
+        present = (
+            "root",
+            "root.c1",
+            "root.c1.c2",
+            "root.c1.{otherNS}c2",
+            "root.c1.c2[1]",
+            "root.c1.c2[2]",
+        )
+        for spec in present:
+            self.assertTrue(objectify.ObjectPath(spec).hasattr(doc))
+
+        # Indexes one past the last matching sibling must not be found.
+        for spec in ("root.c1.c2[3]", "root.c1[1].c2"):
+            self.assertFalse(objectify.ObjectPath(spec).hasattr(doc))
+
+    def test_object_path_dot(self):
+        """The path "." refers to the element it is applied to."""
+        doc, here = self.XML(xml_str), objectify.ObjectPath(".")
+        self.assertEqual(doc.c1.c2.text, here(doc).c1.c2.text)
+
+    def test_object_path_dot_list(self):
+        """A single empty step in list form refers to the element itself."""
+        doc, here = self.XML(xml_str), objectify.ObjectPath([''])
+        self.assertEqual(doc.c1.c2.text, here(doc).c1.c2.text)
+
+    def test_object_path_dot_root(self):
+        """A leading "." resolves the remaining steps from the given element."""
+        doc, relative = self.XML(xml_str), objectify.ObjectPath(".c1.c2")
+        self.assertEqual(doc.c1.c2.text, relative(doc).text)
+
+    def test_object_path_dot_root_list(self):
+        """A leading empty step in list form behaves like a leading "."."""
+        doc, relative = self.XML(xml_str), objectify.ObjectPath(['', 'c1', 'c2'])
+        self.assertEqual(doc.c1.c2.text, relative(doc).text)
+
+    def test_object_path_index(self):
+        """Zero-based and negative indexes in a path select matching siblings."""
+        doc = self.XML(xml_str)
+        c2 = doc.c1.c2
+
+        # Each entry pairs a path with the element it is expected to reach;
+        # a step without an index is expected to reach the first match.
+        expectations = (
+            ("root.c1[0].c2[0]", c2),
+            ("root.c1[0].c2", c2),
+            ("root.c1[0].c2[1]", c2[1]),
+            ("root.c1.c2[2]", c2[2]),
+            ("root.c1.c2[-1]", c2[-1]),
+            ("root.c1.c2[-3]", c2[-3]),
+        )
+
+        for spec, target in expectations:
+            reached = objectify.ObjectPath(spec)(doc)
+            self.assertEqual(target.text, reached.text)
+
+    def test_object_path_index_list(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( ['root', 'c1[0]', 'c2[0]'] )
+        self.assertEqual(root.c1.c2.text, path(root).text)
+
+        path = objectify.ObjectPath( ['root', 'c1[0]', 'c2[2]'] )
+        self.assertEqual(root.c1.c2[2].text, path(root).text)
+
+        path = objectify.ObjectPath( ['root', 'c1', 'c2[2]'] )
+        self.assertEqual(root.c1.c2[2].text, path(root).text)
+
+        path = objectify.ObjectPath( ['root', 'c1', 'c2[-1]'] )
+        self.assertEqual(root.c1.c2[-1].text, path(root).text)
+
+        path = objectify.ObjectPath( ['root', 'c1', 'c2[-3]'] )
+        self.assertEqual(root.c1.c2[-3].text, path(root).text)
+
+    def test_object_path_index_fail_parse(self):
+        self.assertRaises(ValueError, objectify.ObjectPath,
+                          "root.c1[0].c2[-1-2]")
+        self.assertRaises(ValueError, objectify.ObjectPath,
+                          ['root', 'c1[0]', 'c2[-1-2]'])
+
+        self.assertRaises(ValueError, objectify.ObjectPath,
+                          "root[2].c1.c2")
+        self.assertRaises(ValueError, objectify.ObjectPath,
+                          ['root[2]', 'c1', 'c2'])
+
+        self.assertRaises(ValueError, objectify.ObjectPath,
+                          [])
+        self.assertRaises(ValueError, objectify.ObjectPath,
+                          ['', '', ''])
+
+    def test_object_path_index_fail_lookup(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath("root.c1[9999].c2")
+        self.assertRaises(AttributeError, path, root)
+
+        path = objectify.ObjectPath("root.c1[0].c2[9999]")
+        self.assertRaises(AttributeError, path, root)
+
+        path = objectify.ObjectPath(".c1[9999].c2[0]")
+        self.assertRaises(AttributeError, path, root)
+
+        path = objectify.ObjectPath("root.c1[-2].c2")
+        self.assertRaises(AttributeError, path, root)
+
+        path = objectify.ObjectPath("root.c1[0].c2[-4]")
+        self.assertRaises(AttributeError, path, root)
+
+    def test_object_path_ns(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "{objectified}root.c1.c2" )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        path = objectify.ObjectPath( "{objectified}root.{objectified}c1.c2" )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        path = objectify.ObjectPath( "root.{objectified}c1.{objectified}c2" )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        path = objectify.ObjectPath( "root.c1.{objectified}c2" )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        path = objectify.ObjectPath( "root.c1.{otherNS}c2" )
+        self.assertEqual(getattr(root.c1, '{otherNS}c2').text,
+                          path.find(root).text)
+
+    def test_object_path_ns_list(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( ['{objectified}root', 'c1', 'c2'] )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        path = objectify.ObjectPath( ['{objectified}root', '{objectified}c1', 'c2'] )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        path = objectify.ObjectPath( ['root', '{objectified}c1', '{objectified}c2'] )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        path = objectify.ObjectPath( ['root', '{objectified}c1', '{objectified}c2[2]'] )
+        self.assertEqual(root.c1.c2[2].text, path.find(root).text)
+        path = objectify.ObjectPath( ['root', 'c1', '{objectified}c2'] )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        path = objectify.ObjectPath( ['root', 'c1', '{objectified}c2[2]'] )
+        self.assertEqual(root.c1.c2[2].text, path.find(root).text)
+        path = objectify.ObjectPath( ['root', 'c1', '{otherNS}c2'] )
+        self.assertEqual(getattr(root.c1, '{otherNS}c2').text,
+                          path.find(root).text)
+
+    def test_object_path_set(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c2" )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        self.assertEqual("1", root.c1.c2[1].text)
+
+        new_value = "my new value"
+        path.setattr(root, new_value)
+
+        self.assertEqual(new_value, root.c1.c2.text)
+        self.assertEqual(new_value, path(root).text)
+        self.assertEqual("1", root.c1.c2[1].text)
+
+    def test_object_path_set_element(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c2" )
+        self.assertEqual(root.c1.c2.text, path.find(root).text)
+        self.assertEqual("1", root.c1.c2[1].text)
+
+        new_el = self.Element("{objectified}test")
+        etree.SubElement(new_el, "{objectified}sub", myattr="ATTR").a = "TEST"
+        path.setattr(root, new_el.sub)
+
+        self.assertEqual("ATTR", root.c1.c2.get("myattr"))
+        self.assertEqual("TEST", root.c1.c2.a.text)
+        self.assertEqual("TEST", path(root).a.text)
+        self.assertEqual("1", root.c1.c2[1].text)
+
+    def test_object_path_set_create(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c99" )
+        self.assertRaises(AttributeError, path.find, root)
+
+        new_value = "my new value"
+        path.setattr(root, new_value)
+
+        self.assertEqual(1, len(root.c1.c99))
+        self.assertEqual(new_value, root.c1.c99.text)
+        self.assertEqual(new_value, path(root).text)
+
+    def test_object_path_set_create_element(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c99" )
+        self.assertRaises(AttributeError, path.find, root)
+
+        new_el = self.Element("{objectified}test")
+        etree.SubElement(new_el, "{objectified}sub", myattr="ATTR").a = "TEST"
+        path.setattr(root, new_el.sub)
+
+        self.assertEqual(1, len(root.c1.c99))
+        self.assertEqual("ATTR", root.c1.c99.get("myattr"))
+        self.assertEqual("TEST", root.c1.c99.a.text)
+        self.assertEqual("TEST", path(root).a.text)
+
+    def test_object_path_set_create_list(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c99" )
+        self.assertRaises(AttributeError, path.find, root)
+
+        new_el = self.Element("{objectified}test")
+        new_el.a = ["TEST1", "TEST2"]
+        new_el.a[0].set("myattr", "ATTR1")
+        new_el.a[1].set("myattr", "ATTR2")
+
+        path.setattr(root, list(new_el.a))
+
+        self.assertEqual(2, len(root.c1.c99))
+        self.assertEqual("ATTR1", root.c1.c99[0].get("myattr"))
+        self.assertEqual("TEST1", root.c1.c99[0].text)
+        self.assertEqual("ATTR2", root.c1.c99[1].get("myattr"))
+        self.assertEqual("TEST2", root.c1.c99[1].text)
+        self.assertEqual("TEST1", path(root).text)
+
+    def test_object_path_addattr(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c2" )
+        self.assertEqual(3, len(root.c1.c2))
+        path.addattr(root, "test")
+        self.assertEqual(4, len(root.c1.c2))
+        self.assertEqual(["0", "1", "2", "test"],
+                          [el.text for el in root.c1.c2])
+
+    def test_object_path_addattr_element(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c2" )
+        self.assertEqual(3, len(root.c1.c2))
+
+        new_el = self.Element("{objectified}test")
+        etree.SubElement(new_el, "{objectified}sub").a = "TEST"
+
+        path.addattr(root, new_el.sub)
+        self.assertEqual(4, len(root.c1.c2))
+        self.assertEqual("TEST", root.c1.c2[3].a.text)
+        self.assertEqual(["0", "1", "2"],
+                          [el.text for el in root.c1.c2[:3]])
+
+    def test_object_path_addattr_create(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c99" )
+        self.assertRaises(AttributeError, path.find, root)
+
+        new_value = "my new value"
+        path.addattr(root, new_value)
+
+        self.assertEqual(1, len(root.c1.c99))
+        self.assertEqual(new_value, root.c1.c99.text)
+        self.assertEqual(new_value, path(root).text)
+
+    def test_object_path_addattr_create_element(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c99" )
+        self.assertRaises(AttributeError, path.find, root)
+
+        new_el = self.Element("{objectified}test")
+        etree.SubElement(new_el, "{objectified}sub", myattr="ATTR").a = "TEST"
+
+        path.addattr(root, new_el.sub)
+        self.assertEqual(1, len(root.c1.c99))
+        self.assertEqual("TEST", root.c1.c99.a.text)
+        self.assertEqual("TEST", path(root).a.text)
+        self.assertEqual("ATTR", root.c1.c99.get("myattr"))
+
+    def test_object_path_addattr_create_list(self):
+        root = self.XML(xml_str)
+        path = objectify.ObjectPath( "root.c1.c99" )
+        self.assertRaises(AttributeError, path.find, root)
+
+        new_el = self.Element("{objectified}test")
+        new_el.a = ["TEST1", "TEST2"]
+
+        self.assertEqual(2, len(new_el.a))
+
+        path.addattr(root, list(new_el.a))
+        self.assertEqual(2, len(root.c1.c99))
+        self.assertEqual("TEST1", root.c1.c99.text)
+        self.assertEqual("TEST2", path(root)[1].text)
+
+    def test_descendant_paths(self):
+        root = self.XML(xml_str)
+        self.assertEqual(
+            ['{objectified}root', '{objectified}root.c1',
+             '{objectified}root.c1.c2',
+             '{objectified}root.c1.c2[1]', '{objectified}root.c1.c2[2]',
+             '{objectified}root.c1.{otherNS}c2', '{objectified}root.c1.{}c2'],
+            root.descendantpaths())
+
+    def test_descendant_paths_child(self):
+        root = self.XML(xml_str)
+        self.assertEqual(
+            ['{objectified}c1', '{objectified}c1.c2',
+             '{objectified}c1.c2[1]', '{objectified}c1.c2[2]',
+             '{objectified}c1.{otherNS}c2', '{objectified}c1.{}c2'],
+            root.c1.descendantpaths())
+
+    def test_descendant_paths_prefix(self):
+        root = self.XML(xml_str)
+        self.assertEqual(
+            ['root.{objectified}c1', 'root.{objectified}c1.c2',
+             'root.{objectified}c1.c2[1]', 'root.{objectified}c1.c2[2]',
+             'root.{objectified}c1.{otherNS}c2',
+             'root.{objectified}c1.{}c2'],
+            root.c1.descendantpaths('root'))
+
+    def test_pickle(self):
+        """An objectified tree serialises identically after a pickle round trip."""
+        import pickle
+
+        original = self.XML(xml_str)
+        buffer = BytesIO()
+        pickle.dump(original, buffer)
+        restored = pickle.loads(buffer.getvalue())
+
+        expected = etree.tostring(original)
+        self.assertEqual(etree.tostring(restored), expected)
+
+    def test_pickle_elementtree(self):
+        import pickle
+
+        tree = etree.ElementTree(self.XML(xml_str + "<?my pi?>"))
+        out = BytesIO()
+        pickle.dump(tree, out)
+
+        new_tree = pickle.loads(out.getvalue())
+        self.assertTrue(isinstance(new_tree, etree._ElementTree))
+        self.assertEqual(
+            etree.tostring(new_tree),
+            etree.tostring(tree))
+
+    def test_pickle_intelement(self):
+        self._test_pickle('<x>42</x>')
+        self._test_pickle(objectify.DataElement(42))
+
+    def test_pickle_floattelement(self):
+        self._test_pickle('<x>42.0</x>')
+        self._test_pickle(objectify.DataElement(42.0))
+
+    def test_pickle_strelement(self):
+        self._test_pickle('<x>Pickle me!</x>')
+        self._test_pickle(objectify.DataElement('Pickle me!'))
+
+    def test_pickle_boolelement(self):
+        self._test_pickle('<x>true</x>')
+        self._test_pickle('<x>false</x>')
+        self._test_pickle(objectify.DataElement(True))
+        self._test_pickle(objectify.DataElement(False))
+
+    def test_pickle_noneelement(self):
+        self._test_pickle('''
+<x xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:nil="true"/>''')
+        self._test_pickle(objectify.DataElement(None))
+
+    def _test_pickle(self, stringOrElt):
+        """Pickle-round-trip *stringOrElt* and compare the serialised XML.
+
+        Anything that is not an element or element tree is parsed first.
+        """
+        import pickle
+        subject = stringOrElt
+        if not isinstance(subject, (etree._Element, etree._ElementTree)):
+            subject = self.XML(subject)
+        stream = BytesIO()
+        pickle.dump(subject, stream)
+        clone = pickle.loads(stream.getvalue())
+        self.assertEqual(etree.tostring(clone), etree.tostring(subject))
+
+    # E-Factory tests, need to use sub-elements as root element is always
+    # type-looked-up as ObjectifiedElement (no annotations)
+    def test_efactory_int(self):
+        """An int passed through the E-factory yields an IntElement child."""
+        parent = objectify.E.root(objectify.E.val(23))
+        self.assertTrue(isinstance(parent.val, objectify.IntElement))
+
+    def test_efactory_float(self):
+        """A float passed through the E-factory yields a FloatElement child."""
+        parent = objectify.E.root(objectify.E.val(233.23))
+        self.assertTrue(isinstance(parent.val, objectify.FloatElement))
+
+    def test_efactory_str(self):
+        """A string passed through the E-factory yields a StringElement child."""
+        parent = objectify.E.root(objectify.E.val("what?"))
+        self.assertTrue(isinstance(parent.val, objectify.StringElement))
+
+    def test_efactory_unicode(self):
+        E = objectify.E
+        root = E.root(E.val(_str("blöödy häll", encoding="ISO-8859-1")))
+        self.assertTrue(isinstance(root.val, objectify.StringElement))
+
+    def test_efactory_bool(self):
+        """A bool passed through the E-factory yields a BoolElement child."""
+        parent = objectify.E.root(objectify.E.val(True))
+        self.assertTrue(isinstance(parent.val, objectify.BoolElement))
+
+    def test_efactory_none(self):
+        """None passed through the E-factory yields a NoneElement child."""
+        parent = objectify.E.root(objectify.E.val(None))
+        self.assertTrue(isinstance(parent.val, objectify.NoneElement))
+
+    def test_efactory_value_concatenation(self):
+        E = objectify.E
+        root = E.root(E.val(1, "foo", 2.0, "bar ", True, None))
+        self.assertTrue(isinstance(root.val, objectify.StringElement))
+
+    def test_efactory_attrib(self):
+        """Keyword arguments to an E-factory call become XML attributes."""
+        made = objectify.E.root(foo="bar")
+        self.assertEqual(made.get("foo"), "bar")
+
+    def test_efactory_nested(self):
+        E = objectify.E
+        DataElement = objectify.DataElement
+        root = E.root("text", E.sub(E.subsub()), "tail", DataElement(1),
+                      DataElement(2.0))
+        self.assertTrue(isinstance(root, objectify.ObjectifiedElement))
+        self.assertEqual(root.text, "text")
+        self.assertTrue(isinstance(root.sub, objectify.ObjectifiedElement))
+        self.assertEqual(root.sub.tail, "tail")
+        self.assertTrue(isinstance(root.sub.subsub, objectify.StringElement))
+        self.assertEqual(len(root.value), 2)
+        self.assertTrue(isinstance(root.value[0], objectify.IntElement))
+        self.assertTrue(isinstance(root.value[1], objectify.FloatElement))
+
+    def test_efactory_subtype(self):
+        class Attribute(objectify.ObjectifiedDataElement):
+            def __init__(self):
+                objectify.ObjectifiedDataElement.__init__(self)
+                self.set("datatype", "TYPE")
+                self.set("range", "0.,1.")
+
+        attr = Attribute()
+        self.assertEqual(attr.text, None)
+        self.assertEqual(attr.get("datatype"), "TYPE")
+        self.assertEqual(attr.get("range"), "0.,1.")
+
+    def test_XML_base_url_docinfo(self):
+        """The base_url given to XML() is reported as the docinfo URL."""
+        doc = objectify.XML(_bytes("<root/>"), base_url="http://no/such/url")
+        self.assertEqual(doc.getroottree().docinfo.URL, "http://no/such/url")
+ 
+    def test_XML_set_base_url_docinfo(self):
+        root = objectify.XML(_bytes("<root/>"), base_url="http://no/such/url")
+        docinfo = root.getroottree().docinfo
+        self.assertEqual(docinfo.URL, "http://no/such/url")
+        docinfo.URL = "https://secret/url"
+        self.assertEqual(docinfo.URL, "https://secret/url")
+ 
+    def test_parse_stringio_base_url(self):
+        """parse() on a bytes-backed stream keeps base_url as docinfo.URL."""
+        url, source = "http://no/such/url", BytesIO(_bytes("<root/>"))
+        self.assertEqual(objectify.parse(source, base_url=url).docinfo.URL, url)
+ 
+    def test_parse_base_url_docinfo(self):
+        tree = objectify.parse(fileInTestDir('include/test_xinclude.xml'),
+                               base_url="http://no/such/url")
+        docinfo = tree.docinfo
+        self.assertEqual(docinfo.URL, "http://no/such/url")
+
+    def test_xml_base(self):
+        root = objectify.XML(_bytes("<root/>"), base_url="http://no/such/url")
+        self.assertEqual(root.base, "http://no/such/url")
+        self.assertEqual(
+            root.get('{http://www.w3.org/XML/1998/namespace}base'), None)
+        root.base = "https://secret/url"
+        self.assertEqual(root.base, "https://secret/url")
+        self.assertEqual(
+            root.get('{http://www.w3.org/XML/1998/namespace}base'),
+            "https://secret/url")
+ 
+    def test_xml_base_attribute(self):
+        root = objectify.XML(_bytes("<root/>"), base_url="http://no/such/url")
+        self.assertEqual(root.base, "http://no/such/url")
+        self.assertEqual(
+            root.get('{http://www.w3.org/XML/1998/namespace}base'), None)
+        root.set('{http://www.w3.org/XML/1998/namespace}base',
+                 "https://secret/url")
+        self.assertEqual(root.base, "https://secret/url")
+        self.assertEqual(
+            root.get('{http://www.w3.org/XML/1998/namespace}base'),
+            "https://secret/url")
+
+    def test_standard_lookup(self):
+        XML = self.XML
+
+        xml = _bytes('''\
+        <root xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
+          <i>5</i>
+          <i>-5</i>
+          <l>4294967296</l>
+          <l>-4294967296</l>
+          <f>1.1</f>
+          <b>true</b>
+          <b>false</b>
+          <s>Strange things happen, where strings collide</s>
+          <s>True</s>
+          <s>False</s>
+          <s>t</s>
+          <s>f</s>
+          <s></s>
+          <s>None</s>
+          <n xsi:nil="true" />
+        </root>
+        ''')
+        root = XML(xml)
+
+        for i in root.i:
+            self.assertTrue(isinstance(i, objectify.IntElement))
+        for l in root.l:
+            self.assertTrue(isinstance(l, objectify.IntElement))
+        for f in root.f:
+            self.assertTrue(isinstance(f, objectify.FloatElement))  
+        for b in root.b:
+            self.assertTrue(isinstance(b, objectify.BoolElement))
+        self.assertEqual(True,  root.b[0])
+        self.assertEqual(False, root.b[1])
+        for s in root.s:
+            self.assertTrue(isinstance(s, objectify.StringElement))
+        self.assertTrue(isinstance(root.n, objectify.NoneElement))
+        self.assertEqual(None, root.n)
+
+def test_suite():
+    """Collect unit tests and doctests; avoids makeSuite (removed in 3.13)."""
+    cases = unittest.defaultTestLoader.loadTestsFromTestCase(ObjectifyTestCase)
+    suite = unittest.TestSuite([cases])
+    suite.addTests(doctest.DocTestSuite(objectify))
+    if sys.version_info >= (2,4):
+        suite.addTests([make_doctest('../../../doc/objectify.txt')])
+    return suite
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_pyclasslookup.py b/lib/lxml/tests/test_pyclasslookup.py
new file mode 100644
index 00000000..a54d776f
--- /dev/null
+++ b/lib/lxml/tests/test_pyclasslookup.py
@@ -0,0 +1,345 @@
+# -*- coding: utf-8 -*-
+
+"""
+Tests specific to the Python based class lookup.
+"""
+
+
+import unittest, operator, os.path, sys
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, StringIO, HelperTestCase, fileInTestDir
+from common_imports import SillyFileLike, canonicalize, doctest, _bytes
+
+from lxml.etree import PythonElementClassLookup
+
+xml_str = _bytes('''\
+<obj:root xmlns:obj="objectified" xmlns:other="otherNS">
+  <obj:c1 a1="A1" a2="A2" other:a3="A3">
+    <obj:c2>0</obj:c2>
+    <obj:c2>1</obj:c2>
+    <obj:c2>2</obj:c2>
+    <other:c2>3</other:c2>
+    <c2>3</c2>
+  </obj:c1>
+</obj:root>''')
+
+
+class PyClassLookupTestCase(HelperTestCase):
+    """Test cases for the lxml.pyclasslookup class lookup mechanism.
+    """
+    etree = etree
+    parser = etree.XMLParser()
+    Element = parser.makeelement
+
+    def tearDown(self):
+        self.parser.set_element_class_lookup(None)
+        super(PyClassLookupTestCase, self).tearDown()
+
+    def _setClassLookup(self, lookup_function):
+        class Lookup(PythonElementClassLookup):
+            def lookup(self, *args):
+                return lookup_function(*args)
+        self.parser.set_element_class_lookup( Lookup() )
+
+    def _buildElementClass(self):
+        class LocalElement(etree.ElementBase):
+            pass
+        return LocalElement
+
+    def XML(self, xml):
+        return self.etree.XML(xml, self.parser)
+
+    # --- Test cases
+
+    def test_lookup(self):
+        el_class = self._buildElementClass()
+        el_class.i = 1
+        def lookup(*args):
+            if el_class.i == 1:
+                el_class.i = 2
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertEqual(2, el_class.i)
+
+    def test_lookup_keep_ref_assertion(self):
+        el_class = self._buildElementClass()
+        el_class.EL = None
+        def lookup(doc, el):
+            if el_class.EL is None:
+                el_class.EL = el
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertNotEqual(None, el_class.EL)
+        self.assertRaises(ReferenceError, el_class.EL.getchildren)
+
+    def test_lookup_tag(self):
+        el_class = self._buildElementClass()
+        el_class.TAG = None
+        def lookup(doc, el):
+            if el_class.TAG is None:
+                el_class.TAG = el.tag
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertNotEqual(None, root.TAG)
+        self.assertEqual(root.tag, root.TAG)
+
+    def test_lookup_text(self):
+        el_class = self._buildElementClass()
+        el_class.TEXT = None
+        def lookup(doc, el):
+            if el_class.TEXT is None:
+                el_class.TEXT = el.text
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertNotEqual(None, root.TEXT)
+        self.assertEqual(root.text, root.TEXT)
+
+    def test_lookup_tail(self):
+        el_class = self._buildElementClass()
+        el_class.TAIL = None
+        def lookup(doc, el):
+            if el_class.TAIL is None:
+                el_class.TAIL = el.tail
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertEqual(root.tail, root.TAIL)
+
+    def test_lookup_attrib(self):
+        """Attributes captured inside the lookup match those of the parsed tree."""
+        element_type = self._buildElementClass()
+        element_type.ATTRIB = None
+        def capture_attrib(doc, el):
+            # Record the first child's attributes on the first call only.
+            if element_type.ATTRIB is None:
+                element_type.ATTRIB = el[0].attrib
+            return element_type
+        self._setClassLookup(capture_attrib)
+        root = self.XML(xml_str)
+        expected = sorted(root[0].attrib.items())
+        captured = sorted(root.ATTRIB.items())
+        self.assertEqual(expected, captured)
+
+    def test_lookup_prefix(self):
+        el_class = self._buildElementClass()
+        el_class.PREFIX = None
+        def lookup(doc, el):
+            if el_class.PREFIX is None:
+                el_class.PREFIX = el.prefix
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertEqual(root.prefix, root.PREFIX)
+
+    def test_lookup_sourceline(self):
+        el_class = self._buildElementClass()
+        el_class.LINE = None
+        def lookup(doc, el):
+            if el_class.LINE is None:
+                el_class.LINE = el.sourceline
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertEqual(root.sourceline, root.LINE)
+
+    def test_lookup_getitem(self):
+        el_class = self._buildElementClass()
+        el_class.CHILD_TAG = None
+        def lookup(doc, el):
+            el_class.CHILD_TAG = el[0].tag
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        child_tag = root.CHILD_TAG
+        self.assertNotEqual(None, child_tag)
+        self.assertEqual(root[0].tag, child_tag)
+
+    def test_lookup_getitem_neg(self):
+        el_class = self._buildElementClass()
+        el_class.CHILD_TAG = None
+        def lookup(doc, el):
+            if el_class.CHILD_TAG is None:
+                el_class.CHILD_TAG = el[-1].tag
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        child_tag = root.CHILD_TAG
+        self.assertNotEqual(None, child_tag)
+        self.assertEqual(root[-1].tag, child_tag)
+
+    def test_lookup_getslice(self):
+        el_class = self._buildElementClass()
+        el_class.CHILD_TAGS = None
+        def lookup(doc, el):
+            if el_class.CHILD_TAGS is None:
+                el_class.CHILD_TAGS = [ c.tag for c in el[1:-1] ]
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        child_tags = root.CHILD_TAGS
+        self.assertNotEqual(None, child_tags)
+        self.assertEqual([ c.tag for c in root[1:-1] ],
+                          child_tags)
+
+    def test_lookup_len(self):
+        el_class = self._buildElementClass()
+        el_class.LEN = None
+        def lookup(doc, el):
+            if el_class.LEN is None:
+                el_class.LEN = len(el)
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertEqual(1, el_class.LEN)
+
+    def test_lookup_bool(self):
+        el_class = self._buildElementClass()
+        el_class.TRUE = None
+        def lookup(doc, el):
+            if el_class.TRUE is None:
+                el_class.TRUE = bool(el)
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertTrue(el_class.TRUE)
+
+    def test_lookup_get(self):
+        el_class = self._buildElementClass()
+        el_class.VAL = None
+        def lookup(doc, el):
+            if el_class.VAL is None:
+                el_class.VAL = el[0].get('a1')
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertNotEqual(None, el_class.VAL)
+        self.assertEqual(root[0].get('a1'), el_class.VAL)
+
+    def test_lookup_get_default(self):
+        el_class = self._buildElementClass()
+        default = str(id(el_class))
+        el_class.VAL = None
+        def lookup(doc, el):
+            if el_class.VAL is None:
+                el_class.VAL = el[0].get('unknownattribute', default)
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertEqual(default, el_class.VAL)
+
+    def test_lookup_getchildren(self):
+        el_class = self._buildElementClass()
+        el_class.CHILD_TAGS = None
+        def lookup(doc, el):
+            if el_class.CHILD_TAGS is None:
+                el_class.CHILD_TAGS = [ c.tag for c in el.getchildren() ]
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        child_tags = root.CHILD_TAGS
+        self.assertNotEqual(None, child_tags)
+        self.assertEqual([ c.tag for c in root.getchildren() ],
+                          child_tags)
+
+    def test_lookup_iter_children(self):
+        el_class = self._buildElementClass()
+        el_class.CHILD_TAGS = None
+        def lookup(doc, el):
+            if el_class.CHILD_TAGS is None:
+                el_class.CHILD_TAGS = [ c.tag for c in el ]
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        child_tags = root.CHILD_TAGS
+        self.assertNotEqual(None, child_tags)
+        self.assertEqual([ c.tag for c in root.getchildren() ],
+                          child_tags)
+
+    def test_lookup_iterchildren(self):
+        el_class = self._buildElementClass()
+        el_class.CHILD_TAGS = None
+        def lookup(doc, el):
+            if el_class.CHILD_TAGS is None:
+                el_class.CHILD_TAGS = [ c.tag for c in el.iterchildren() ]
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        child_tags = root.CHILD_TAGS
+        self.assertNotEqual(None, child_tags)
+        self.assertEqual([ c.tag for c in root.getchildren() ],
+                          child_tags)
+
+    def test_lookup_iterchildren_tag(self):
+        el_class = self._buildElementClass()
+        el_class.CHILD_TAGS = None
+        def lookup(doc, el):
+            if not el_class.CHILD_TAGS:
+                el_class.CHILD_TAGS = [
+                    c.tag for c in el.iterchildren(tag='{objectified}c2') ]
+            return el_class
+        self._setClassLookup(lookup)
+
+        root = self.XML(xml_str)
+        child_tags = root.CHILD_TAGS
+        self.assertNotEqual(None, child_tags)
+        self.assertEqual([], child_tags)
+
+        c1 = root[0]
+        child_tags = root.CHILD_TAGS
+        self.assertNotEqual(None, child_tags)
+        self.assertNotEqual([], child_tags)
+        self.assertEqual(
+            [ c.tag for c in root[0].iterchildren(tag='{objectified}c2') ],
+            child_tags)
+
+    def test_lookup_getparent(self):
+        el_class = self._buildElementClass()
+        el_class.PARENT = None
+        def lookup(doc, el):
+            if el_class.PARENT is None:
+                el_class.PARENT = el[0].getparent().tag
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertEqual(root.tag, root.PARENT)
+
+    def test_lookup_getnext(self):
+        el_class = self._buildElementClass()
+        el_class.NEXT = None
+        def lookup(doc, el):
+            if el_class.NEXT is None:
+                el_class.NEXT = el[0][1].getnext().tag
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertNotEqual(None, el_class.NEXT)
+        self.assertEqual(root[0][1].getnext().tag, el_class.NEXT)
+
+    def test_lookup_getprevious(self):
+        el_class = self._buildElementClass()
+        el_class.PREV = None
+        def lookup(doc, el):
+            if el_class.PREV is None:
+                el_class.PREV = el[0][1].getprevious().tag
+            return el_class
+        self._setClassLookup(lookup)
+        root = self.XML(xml_str)
+        self.assertNotEqual(None, el_class.PREV)
+        self.assertEqual(root[0][1].getprevious().tag, el_class.PREV)
+
+
+def test_suite():
+    """Build the suite via the loader; unittest.makeSuite is gone in 3.13."""
+    loader = unittest.defaultTestLoader
+    return unittest.TestSuite([loader.loadTestsFromTestCase(PyClassLookupTestCase)])
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_relaxng.py b/lib/lxml/tests/test_relaxng.py
new file mode 100644
index 00000000..4337f055
--- /dev/null
+++ b/lib/lxml/tests/test_relaxng.py
@@ -0,0 +1,180 @@
+# -*- coding: utf-8 -*-
+
+"""
+Test cases related to RelaxNG parsing and validation
+"""
+
+import unittest, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, BytesIO, _bytes, HelperTestCase, fileInTestDir
+from common_imports import doctest, make_doctest
+
+class ETreeRelaxNGTestCase(HelperTestCase):
+    def test_relaxng(self):
+        tree_valid = self.parse('<a><b></b></a>')
+        tree_invalid = self.parse('<a><c></c></a>')
+        schema = self.parse('''\
+<element name="a" xmlns="http://relaxng.org/ns/structure/1.0">
+  <zeroOrMore>
+     <element name="b">
+       <text />
+     </element>
+  </zeroOrMore>
+</element>
+''')
+        schema = etree.RelaxNG(schema)
+        self.assertTrue(schema.validate(tree_valid))
+        self.assertFalse(schema.error_log.filter_from_errors())
+
+        self.assertFalse(schema.validate(tree_invalid))
+        self.assertTrue(schema.error_log.filter_from_errors())
+
+        self.assertTrue(schema.validate(tree_valid))             # repeat valid
+        self.assertFalse(schema.error_log.filter_from_errors())  # repeat valid
+
+    def test_relaxng_stringio(self):
+        tree_valid = self.parse('<a><b></b></a>')
+        tree_invalid = self.parse('<a><c></c></a>')
+        schema_file = BytesIO('''\
+<element name="a" xmlns="http://relaxng.org/ns/structure/1.0">
+  <zeroOrMore>
+     <element name="b">
+       <text />
+     </element>
+  </zeroOrMore>
+</element>
+''')
+        schema = etree.RelaxNG(file=schema_file)
+        self.assertTrue(schema.validate(tree_valid))
+        self.assertFalse(schema.validate(tree_invalid))
+
+    def test_relaxng_elementtree_error(self):
+        self.assertRaises(ValueError, etree.RelaxNG, etree.ElementTree())
+
+    def test_relaxng_error(self):
+        tree_invalid = self.parse('<a><c></c></a>')
+        schema = self.parse('''\
+<element name="a" xmlns="http://relaxng.org/ns/structure/1.0">
+  <zeroOrMore>
+     <element name="b">
+       <text />
+     </element>
+  </zeroOrMore>
+</element>
+''')
+        schema = etree.RelaxNG(schema)
+        self.assertFalse(schema.validate(tree_invalid))
+        errors = schema.error_log
+        self.assertTrue([log for log in errors
+                         if log.level_name == "ERROR"])
+        self.assertTrue([log for log in errors
+                         if "not expect" in log.message])
+
+    def test_relaxng_invalid_schema(self):
+        schema = self.parse('''\
+<element name="a" xmlns="http://relaxng.org/ns/structure/1.0">
+  <zeroOrMore>
+     <element name="b" />
+  </zeroOrMore>
+</element>
+''')
+        self.assertRaises(etree.RelaxNGParseError,
+                          etree.RelaxNG, schema)
+
+    def test_relaxng_invalid_schema2(self):
+        schema = self.parse('''\
+<grammar xmlns="http://relaxng.org/ns/structure/1.0" />
+''')
+        self.assertRaises(etree.RelaxNGParseError,
+                          etree.RelaxNG, schema)
+
+    def test_relaxng_invalid_schema3(self):
+        schema = self.parse('''\
+<grammar xmlns="http://relaxng.org/ns/structure/1.0">
+  <define name="test">
+    <element name="test"/>
+  </define>
+</grammar>
+''')
+        self.assertRaises(etree.RelaxNGParseError,
+                          etree.RelaxNG, schema)
+
+    def test_relaxng_invalid_schema4(self):
+        # segfault
+        schema = self.parse('''\
+<element name="a" xmlns="mynamespace" />
+''')
+        self.assertRaises(etree.RelaxNGParseError,
+                          etree.RelaxNG, schema)
+
+    def test_relaxng_include(self):
+        # building the schema is the whole test; this will only work if
+        # we access the file through a path or a file object
+        f = open(fileInTestDir('test1.rng'), 'rb')
+        try:
+            etree.RelaxNG(file=f)
+        finally:
+            f.close()
+
+    def test_relaxng_shortcut(self):
+        tree_valid = self.parse('<a><b></b></a>')
+        tree_invalid = self.parse('<a><c></c></a>')
+        schema = self.parse('''\
+<element name="a" xmlns="http://relaxng.org/ns/structure/1.0">
+  <zeroOrMore>
+     <element name="b">
+       <text />
+     </element>
+  </zeroOrMore>
+</element>
+''')
+        self.assertTrue(tree_valid.relaxng(schema))
+        self.assertFalse(tree_invalid.relaxng(schema))
+
+    def test_multiple_elementrees(self):
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        schema = etree.RelaxNG( self.parse('''\
+<element name="a" xmlns="http://relaxng.org/ns/structure/1.0">
+  <element name="b">
+    <text />
+  </element>
+  <element name="c">
+    <text />
+  </element>
+</element>
+''') )
+        self.assertTrue(schema.validate(tree))
+        self.assertFalse(schema.error_log.filter_from_errors())
+
+        self.assertTrue(schema.validate(tree))                   # repeat valid
+        self.assertFalse(schema.error_log.filter_from_errors())  # repeat valid
+
+        schema = etree.RelaxNG( self.parse('''\
+<element name="b" xmlns="http://relaxng.org/ns/structure/1.0">
+  <text />
+</element>
+''') )
+        c_tree = etree.ElementTree(tree.getroot()[1])
+        self.assertEqual(self._rootstring(c_tree), _bytes('<c>C</c>'))
+        self.assertFalse(schema.validate(c_tree))
+        self.assertTrue(schema.error_log.filter_from_errors())
+
+        b_tree = etree.ElementTree(tree.getroot()[0])
+        self.assertEqual(self._rootstring(b_tree), _bytes('<b>B</b>'))
+        self.assertTrue(schema.validate(b_tree))
+        self.assertFalse(schema.error_log.filter_from_errors())
+
+
+def test_suite():
+    """Return the unit tests followed by the doc/validation.txt doctests."""
+    # defaultTestLoader replaces unittest.makeSuite(), removed in Python 3.13
+    load = unittest.defaultTestLoader.loadTestsFromTestCase
+    return unittest.TestSuite([load(ETreeRelaxNGTestCase),
+                               make_doctest('../../../doc/validation.txt')])
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_sax.py b/lib/lxml/tests/test_sax.py
new file mode 100644
index 00000000..ed45fbbc
--- /dev/null
+++ b/lib/lxml/tests/test_sax.py
@@ -0,0 +1,277 @@
+# -*- coding: utf-8 -*-
+
+"""
+Test cases related to SAX I/O
+"""
+
+import unittest, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import HelperTestCase, doctest, make_doctest, BytesIO, _bytes
+from lxml import sax
+from xml.dom import pulldom
+
+class ETreeSaxTestCase(HelperTestCase):
+
+    def test_etree_sax_simple(self):
+        tree = self.parse('<a>ab<b/>ba</a>')
+        xml_out = self._saxify_serialize(tree)
+        self.assertEqual(_bytes('<a>ab<b/>ba</a>'),
+                          xml_out)
+
+    def test_etree_sax_double(self):
+        tree = self.parse('<a>ab<b>bb</b>ba</a>')
+        xml_out = self._saxify_serialize(tree)
+        self.assertEqual(_bytes('<a>ab<b>bb</b>ba</a>'),
+                          xml_out)
+
+    def test_etree_sax_comment(self):
+        tree = self.parse('<a>ab<!-- TEST -->ba</a>')
+        xml_out = self._saxify_serialize(tree)
+        self.assertEqual(_bytes('<a>abba</a>'),
+                          xml_out)
+
+    def test_etree_sax_pi(self):
+        tree = self.parse('<a>ab<?this and that?>ba</a>')
+        xml_out = self._saxify_serialize(tree)
+        self.assertEqual(_bytes('<a>ab<?this and that?>ba</a>'),
+                          xml_out)
+
+    def test_etree_sax_comment_root(self):
+        tree = self.parse('<!-- TEST --><a>ab</a>')
+        xml_out = self._saxify_serialize(tree)
+        self.assertEqual(_bytes('<a>ab</a>'),
+                          xml_out)
+
+    def test_etree_sax_pi_root(self):
+        tree = self.parse('<?this and that?><a>ab</a>')
+        xml_out = self._saxify_serialize(tree)
+        self.assertEqual(_bytes('<?this and that?><a>ab</a>'),
+                          xml_out)
+
+    def test_etree_sax_attributes(self):
+        tree = self.parse('<a aa="5">ab<b b="5"/>ba</a>')
+        xml_out = self._saxify_serialize(tree)
+        self.assertEqual(_bytes('<a aa="5">ab<b b="5"/>ba</a>'),
+                          xml_out)
+
+    def test_etree_sax_ns1(self):
+        tree = self.parse('<a xmlns="bla">ab<b>bb</b>ba</a>')
+        new_tree = self._saxify_unsaxify(tree)
+        root = new_tree.getroot()
+        self.assertEqual('{bla}a',
+                         root.tag)
+        self.assertEqual('{bla}b',
+                         root[0].tag)
+
+    def test_etree_sax_ns2(self):
+        tree = self.parse('<a xmlns="blaA">ab<b:b xmlns:b="blaB">bb</b:b>ba</a>')
+        new_tree = self._saxify_unsaxify(tree)
+        root = new_tree.getroot()
+        self.assertEqual('{blaA}a',
+                         root.tag)
+        self.assertEqual('{blaB}b',
+                         root[0].tag)
+
+    def test_sax_to_pulldom(self):
+        tree = self.parse('<a xmlns="blaA">ab<b:b xmlns:b="blaB">bb</b:b>ba</a>')
+        handler = pulldom.SAX2DOM()
+        sax.saxify(tree, handler)
+        dom = handler.document
+
+        self.assertEqual('a',
+                         dom.firstChild.localName)
+        self.assertEqual('blaA',
+                         dom.firstChild.namespaceURI)
+
+        children = dom.firstChild.childNodes
+        self.assertEqual('ab',
+                         children[0].nodeValue)
+        self.assertEqual('blaB',
+                         children[1].namespaceURI)
+        self.assertEqual('ba',
+                         children[2].nodeValue)
+
+    def test_element_sax(self):
+        tree = self.parse('<a><b/></a>')
+        a = tree.getroot()
+        b = a[0]
+
+        xml_out = self._saxify_serialize(a)
+        self.assertEqual(_bytes('<a><b/></a>'),
+                          xml_out)
+
+        xml_out = self._saxify_serialize(b)
+        self.assertEqual(_bytes('<b/>'),
+                          xml_out)
+
+    def test_element_sax_ns(self):
+        tree = self.parse('<a:a xmlns:a="blaA"><b/></a:a>')
+        a = tree.getroot()
+        b = a[0]
+
+        new_tree = self._saxify_unsaxify(a)
+        root = new_tree.getroot()
+        self.assertEqual('{blaA}a',
+                         root.tag)
+        self.assertEqual('b',
+                         root[0].tag)
+
+        new_tree = self._saxify_unsaxify(b)
+        root = new_tree.getroot()
+        self.assertEqual('b',
+                         root.tag)
+        self.assertEqual(0,
+                         len(root))
+
+    def test_etree_sax_handler_default_ns(self):
+        handler = sax.ElementTreeContentHandler()
+        handler.startDocument()
+        handler.startPrefixMapping(None, 'blaA')
+        handler.startElementNS(('blaA', 'a'), 'a', {})
+        handler.startPrefixMapping(None, 'blaB')
+        handler.startElementNS(('blaB', 'b'), 'b', {})
+        handler.endElementNS(  ('blaB', 'b'), 'b')
+        handler.endPrefixMapping(None)
+        handler.startElementNS(('blaA', 'c'), 'c', {})
+        handler.endElementNS(  ('blaA', 'c'), 'c')
+        handler.endElementNS(  ('blaA', 'a'), 'a')
+        handler.endPrefixMapping(None)
+        handler.endDocument()
+
+        new_tree = handler.etree
+        root = new_tree.getroot()
+        self.assertEqual('{blaA}a',
+                         root.tag)
+        self.assertEqual('{blaB}b',
+                         root[0].tag)
+        self.assertEqual('{blaA}c',
+                         root[1].tag)
+
+    def test_etree_sax_handler_default_ns_None(self):
+        handler = sax.ElementTreeContentHandler()
+        handler.startDocument()
+        handler.startPrefixMapping(None, 'blaA')
+        handler.startElementNS((None, 'a'), 'a', {})
+        handler.startPrefixMapping(None, 'blaB')
+        handler.startElementNS((None, 'b'), 'b', {})
+        handler.endElementNS(  (None, 'b'), 'b')
+        handler.endPrefixMapping(None)
+        handler.startElementNS((None, 'c'), 'c', {})
+        handler.endElementNS(  (None, 'c'), 'c')
+        handler.endElementNS(  (None, 'a'), 'a')
+        handler.endPrefixMapping(None)
+        handler.endDocument()
+
+        new_tree = handler.etree
+        root = new_tree.getroot()
+        self.assertEqual('{blaA}a',
+                         root.tag)
+        self.assertEqual('{blaB}b',
+                         root[0].tag)
+        self.assertEqual('{blaA}c',
+                         root[1].tag)
+
+    def test_etree_sax_redefine_ns(self):
+        handler = sax.ElementTreeContentHandler()
+        handler.startDocument()
+        handler.startPrefixMapping('ns', 'blaA')
+        handler.startElementNS(('blaA', 'a'), 'ns:a', {})
+        handler.startPrefixMapping('ns', 'blaB')
+        handler.startElementNS(('blaB', 'b'), 'ns:b', {})
+        handler.endElementNS(  ('blaB', 'b'), 'ns:b')
+        handler.endPrefixMapping('ns')
+        handler.startElementNS(('blaA', 'c'), 'ns:c', {})
+        handler.endElementNS(  ('blaA', 'c'), 'ns:c')
+        handler.endElementNS(  ('blaA', 'a'), 'ns:a')
+        handler.endPrefixMapping('ns')
+        handler.endDocument()
+
+        new_tree = handler.etree
+        root = new_tree.getroot()
+        self.assertEqual('{blaA}a',
+                         root.tag)
+        self.assertEqual('{blaB}b',
+                         root[0].tag)
+        self.assertEqual('{blaA}c',
+                         root[1].tag)
+
+    def test_etree_sax_no_ns(self):
+        handler = sax.ElementTreeContentHandler()
+        handler.startDocument()
+        handler.startElement('a', {})
+        handler.startElement('b', {})
+        handler.endElement('b')
+        handler.startElement('c') # with empty attributes
+        handler.endElement('c')
+        handler.endElement('a')
+        handler.endDocument()
+
+        new_tree = handler.etree
+        root = new_tree.getroot()
+        self.assertEqual('a', root.tag)
+        self.assertEqual('b', root[0].tag)
+        self.assertEqual('c', root[1].tag)
+
+    def test_etree_sax_no_ns_attributes(self):
+        handler = sax.ElementTreeContentHandler()
+        handler.startDocument()
+        handler.startElement('a', {"attr_a1": "a1"})
+        handler.startElement('b', {"attr_b1": "b1"})
+        handler.endElement('b')
+        handler.endElement('a')
+        handler.endDocument()
+
+        new_tree = handler.etree
+        root = new_tree.getroot()
+        self.assertEqual('a', root.tag)
+        self.assertEqual('b', root[0].tag)
+        self.assertEqual('a1', root.attrib["attr_a1"])
+        self.assertEqual('b1', root[0].attrib["attr_b1"])
+
+    def test_etree_sax_ns_attributes(self):
+        handler = sax.ElementTreeContentHandler()
+        handler.startDocument()
+
+        self.assertRaises(ValueError,
+            handler.startElement,
+            'a', {"blaA:attr_a1": "a1"}
+        )
+
+    def test_etree_sax_error(self):
+        handler = sax.ElementTreeContentHandler()
+        handler.startDocument()
+        handler.startElement('a')
+        self.assertRaises(sax.SaxError, handler.endElement, 'b')
+
+    def test_etree_sax_error2(self):
+        handler = sax.ElementTreeContentHandler()
+        handler.startDocument()
+        handler.startElement('a')
+        handler.startElement('b')
+        self.assertRaises(sax.SaxError, handler.endElement, 'a')
+
+    def _saxify_unsaxify(self, saxifiable):
+        handler = sax.ElementTreeContentHandler()
+        sax.ElementTreeProducer(saxifiable, handler).saxify()
+        return handler.etree
+
+    def _saxify_serialize(self, tree):
+        new_tree = self._saxify_unsaxify(tree)
+        f = BytesIO()
+        new_tree.write(f)
+        return f.getvalue().replace(_bytes('\n'), _bytes(''))
+
+
+def test_suite():
+    """Return the unit tests followed by the doc/sax.txt doctests."""
+    # defaultTestLoader replaces unittest.makeSuite(), removed in Python 3.13
+    load = unittest.defaultTestLoader.loadTestsFromTestCase
+    return unittest.TestSuite([load(ETreeSaxTestCase),
+                               make_doctest('../../../doc/sax.txt')])
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_schematron.py b/lib/lxml/tests/test_schematron.py
new file mode 100644
index 00000000..fd956694
--- /dev/null
+++ b/lib/lxml/tests/test_schematron.py
@@ -0,0 +1,84 @@
+# -*- coding: utf-8 -*-
+
+"""
+Test cases related to Schematron parsing and validation
+"""
+
+import unittest, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, HelperTestCase, fileInTestDir
+from common_imports import doctest, make_doctest
+
+class ETreeSchematronTestCase(HelperTestCase):
+    def test_schematron(self):
+        tree_valid = self.parse('<AAA><BBB/><CCC/></AAA>')
+        tree_invalid = self.parse('<AAA><BBB/><CCC/><DDD/></AAA>')
+        schema = self.parse('''\
+<schema xmlns="http://purl.oclc.org/dsdl/schematron" >
+     <pattern name="Open model">
+          <rule context="AAA">
+               <assert test="BBB"> BBB element is not present</assert>
+               <assert test="CCC"> CCC element is not present</assert>
+          </rule>
+     </pattern>
+     <pattern name="Closed model">
+          <rule context="AAA">
+               <assert test="BBB"> BBB element is not present</assert>
+               <assert test="CCC"> CCC element is not present</assert>
+               <assert test="count(BBB|CCC) = count (*)">There is an extra element</assert>
+          </rule>
+     </pattern>
+</schema>
+''')
+        schema = etree.Schematron(schema)
+        self.assertTrue(schema.validate(tree_valid))
+        self.assertFalse(schema.error_log.filter_from_errors())
+
+        self.assertFalse(schema.validate(tree_invalid))
+        self.assertTrue(schema.error_log.filter_from_errors())
+
+        self.assertTrue(schema.validate(tree_valid))             # repeat valid
+        self.assertFalse(schema.error_log.filter_from_errors())  # repeat valid
+
+    def test_schematron_elementtree_error(self):
+        self.assertRaises(ValueError, etree.Schematron, etree.ElementTree())
+
+    def test_schematron_invalid_schema(self):
+        schema = self.parse('''\
+<schema xmlns="http://purl.oclc.org/dsdl/schematron" >
+     <pattern name="Open model">
+     </pattern>
+</schema>
+''')
+        self.assertRaises(etree.SchematronParseError,
+                          etree.Schematron, schema)
+
+    def test_schematron_invalid_schema_empty(self):
+        schema = self.parse('''\
+<schema xmlns="http://purl.oclc.org/dsdl/schematron" />
+''')
+        self.assertRaises(etree.SchematronParseError,
+                          etree.Schematron, schema)
+
+    def test_schematron_invalid_schema_namespace(self):
+        # segfault
+        schema = self.parse('''\
+<schema xmlns="mynamespace" />
+''')
+        self.assertRaises(etree.SchematronParseError,
+                          etree.Schematron, schema)
+
+
+def test_suite():
+    """Return the unit tests followed by the doc/validation.txt doctests."""
+    # defaultTestLoader replaces unittest.makeSuite(), removed in Python 3.13
+    load = unittest.defaultTestLoader.loadTestsFromTestCase
+    return unittest.TestSuite([load(ETreeSchematronTestCase),
+                               make_doctest('../../../doc/validation.txt')])
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_threading.py b/lib/lxml/tests/test_threading.py
new file mode 100644
index 00000000..454da2bb
--- /dev/null
+++ b/lib/lxml/tests/test_threading.py
@@ -0,0 +1,422 @@
+# -*- coding: utf-8 -*-
+
+"""
+Tests for thread usage in lxml.etree.
+"""
+
+import unittest, threading, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, HelperTestCase, BytesIO, _bytes
+
+try:
+    from Queue import Queue
+except ImportError:
+    from queue import Queue # Py3
+
+class ThreadingTestCase(HelperTestCase):
+    """Threading tests"""
+    etree = etree
+
+    def _run_thread(self, func):
+        thread = threading.Thread(target=func)
+        thread.start()
+        thread.join()
+
+    def test_subtree_copy_thread(self):
+        tostring = self.etree.tostring
+        XML = self.etree.XML
+        xml = _bytes("<root><threadtag/></root>")
+        main_root = XML(_bytes("<root/>"))
+
+        def run_thread():
+            thread_root = XML(xml)
+            main_root.append(thread_root[0])
+            del thread_root
+
+        self._run_thread(run_thread)
+        self.assertEqual(xml, tostring(main_root))
+
+    def test_main_xslt_in_thread(self):
+        XML = self.etree.XML
+        style = XML(_bytes('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*">
+    <foo><xsl:copy><xsl:value-of select="/a/b/text()" /></xsl:copy></foo>
+  </xsl:template>
+</xsl:stylesheet>'''))
+        st = etree.XSLT(style)
+
+        result = []
+
+        def run_thread():
+            root = XML(_bytes('<a><b>B</b><c>C</c></a>'))
+            result.append( st(root) )
+
+        self._run_thread(run_thread)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo><a>B</a></foo>
+''',
+                          str(result[0]))
+
+    def test_thread_xslt(self):
+        XML = self.etree.XML
+        tostring = self.etree.tostring
+        root = XML(_bytes('<a><b>B</b><c>C</c></a>'))
+
+        def run_thread():
+            style = XML(_bytes('''\
+    <xsl:stylesheet version="1.0"
+        xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+      <xsl:template match="*">
+        <foo><xsl:copy><xsl:value-of select="/a/b/text()" /></xsl:copy></foo>
+      </xsl:template>
+    </xsl:stylesheet>'''))
+            st = etree.XSLT(style)
+            root.append( st(root).getroot() )
+
+        self._run_thread(run_thread)
+        self.assertEqual(_bytes('<a><b>B</b><c>C</c><foo><a>B</a></foo></a>'),
+                          tostring(root))
+
+    def test_thread_xslt_attr_replace(self):
+        # this is the only case in XSLT where the result tree can be
+        # modified in-place
+        XML = self.etree.XML
+        tostring = self.etree.tostring
+        style = self.etree.XSLT(XML(_bytes('''\
+    <xsl:stylesheet version="1.0"
+        xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+      <xsl:template match="*">
+        <root class="abc">
+          <xsl:copy-of select="@class" />
+          <xsl:attribute name="class">xyz</xsl:attribute> 
+        </root>
+      </xsl:template>
+    </xsl:stylesheet>''')))
+
+        result = []
+        def run_thread():
+            root = XML(_bytes('<ROOT class="ABC" />'))
+            result.append( style(root).getroot() )
+
+        self._run_thread(run_thread)
+        self.assertEqual(_bytes('<root class="xyz"/>'),
+                          tostring(result[0]))
+
+    def test_thread_create_xslt(self):
+        XML = self.etree.XML
+        tostring = self.etree.tostring
+        root = XML(_bytes('<a><b>B</b><c>C</c></a>'))
+
+        stylesheets = []
+
+        def run_thread():
+            style = XML(_bytes('''\
+    <xsl:stylesheet
+        xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+        version="1.0">
+      <xsl:output method="xml" />
+      <xsl:template match="/">
+         <div id="test">
+           <xsl:apply-templates/>
+         </div>
+      </xsl:template>
+    </xsl:stylesheet>'''))
+            stylesheets.append( etree.XSLT(style) )
+
+        self._run_thread(run_thread)
+
+        st = stylesheets[0]
+        result = tostring( st(root) )
+
+        self.assertEqual(_bytes('<div id="test">BC</div>'),
+                          result)
+
+    def test_thread_error_log(self):
+        XML = self.etree.XML
+        ParseError = self.etree.ParseError
+        expected_error = [self.etree.ErrorTypes.ERR_TAG_NAME_MISMATCH]
+        children = "<a>test</a>" * 100
+
+        def parse_error_test(thread_no):
+            tag = "tag%d" % thread_no
+            xml = "<%s>%s</%s>" % (tag, children, tag.upper())
+            parser = self.etree.XMLParser()
+            for _ in range(10):
+                errors = None
+                try:
+                    XML(xml, parser)
+                except ParseError:
+                    e = sys.exc_info()[1]
+                    errors = e.error_log.filter_types(expected_error)
+                self.assertTrue(errors, "Expected error not found")
+                for error in errors:
+                    self.assertTrue(
+                        tag in error.message and tag.upper() in error.message,
+                        "%s and %s not found in '%s'" % (
+                        tag, tag.upper(), error.message))
+
+        self.etree.clear_error_log()
+        threads = []
+        for thread_no in range(1, 10):
+            # NOTE: a failing assert in a worker thread does not fail this test
+            t = threading.Thread(target=parse_error_test, args=(thread_no,))
+            threads.append(t)
+            t.start()
+
+        parse_error_test(0)
+
+        for t in threads:
+            t.join()
+
+    def test_thread_mix(self):
+        XML = self.etree.XML
+        Element = self.etree.Element
+        SubElement = self.etree.SubElement
+        tostring = self.etree.tostring
+        xml = _bytes('<a><b>B</b><c xmlns="test">C</c></a>')
+        root = XML(xml)
+        fragment = XML(_bytes("<other><tags/></other>"))
+
+        result = self.etree.Element("{myns}root", att = "someval")
+
+        def run_XML():
+            thread_root = XML(xml)
+            result.append(thread_root[0])
+            result.append(thread_root[-1])
+
+        def run_parse():
+            thread_root = self.etree.parse(BytesIO(xml)).getroot()
+            result.append(thread_root[0])
+            result.append(thread_root[-1])
+
+        def run_move_main():
+            result.append(fragment[0])
+
+        def run_build():
+            result.append(
+                Element("{myns}foo", attrib={'{test}attr':'val'}))
+            SubElement(result, "{otherns}tasty")
+
+        def run_xslt():
+            style = XML(_bytes('''\
+    <xsl:stylesheet version="1.0"
+        xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+      <xsl:template match="*">
+        <xsl:copy><foo><xsl:value-of select="/a/b/text()" /></foo></xsl:copy>
+      </xsl:template>
+    </xsl:stylesheet>'''))
+            st = etree.XSLT(style)
+            result.append( st(root).getroot() )
+
+        for test in (run_XML, run_parse, run_move_main, run_xslt, run_build):
+            tostring(result)
+            self._run_thread(test)
+
+        self.assertEqual(
+            _bytes('<ns0:root xmlns:ns0="myns" att="someval"><b>B</b>'
+                   '<c xmlns="test">C</c><b>B</b><c xmlns="test">C</c><tags/>'
+                   '<a><foo>B</foo></a>'
+                   '<ns0:foo xmlns:ns1="test" ns1:attr="val"/>'
+                   '<ns1:tasty xmlns:ns1="otherns"/></ns0:root>'),
+            tostring(result))
+
+        def strip_first():
+            root = Element("newroot")
+            root.append(result[0])
+
+        while len(result):
+            self._run_thread(strip_first)
+
+        self.assertEqual(
+            _bytes('<ns0:root xmlns:ns0="myns" att="someval"/>'),
+            tostring(result))
+
+    def test_concurrent_proxies(self):
+        XML = self.etree.XML
+        root = XML(_bytes('<root><a>A</a><b xmlns="test">B</b><c/></root>'))
+        child_count = len(root)
+        def testrun():
+            for i in range(10000):
+                el = root[i%child_count]
+                del el
+        threads = [ threading.Thread(target=testrun)
+                    for _ in range(10) ]
+        for thread in threads:
+            thread.start()
+        for thread in threads:
+            thread.join()
+
+    def test_concurrent_class_lookup(self):
+        XML = self.etree.XML
+
+        class TestElement(etree.ElementBase):
+            pass
+
+        class MyLookup(etree.CustomElementClassLookup):
+            repeat = range(100)
+            def lookup(self, t, d, ns, name):
+                count = 0
+                for i in self.repeat:
+                    # allow other threads to run
+                    count += 1
+                return TestElement
+
+        parser = self.etree.XMLParser()
+        parser.set_element_class_lookup(MyLookup())
+
+        root = XML(_bytes('<root><a>A</a><b xmlns="test">B</b><c/></root>'),
+                   parser)
+
+        child_count = len(root)
+        def testrun():
+            for i in range(1000):
+                el = root[i%child_count]
+                del el
+        threads = [ threading.Thread(target=testrun)
+                    for _ in range(10) ]
+        for thread in threads:
+            thread.start()
+        for thread in threads:
+            thread.join()
+
+
+class ThreadPipelineTestCase(HelperTestCase):
+    """Threading tests based on a thread worker pipeline.
+    """
+    etree = etree
+    item_count = 20
+
+    class Worker(threading.Thread):
+        def __init__(self, in_queue, in_count, **kwargs):
+            threading.Thread.__init__(self)
+            self.in_queue = in_queue
+            self.in_count = in_count
+            self.out_queue = Queue(in_count)
+            self.__dict__.update(kwargs)
+        def run(self):
+            get, put = self.in_queue.get, self.out_queue.put
+            handle = self.handle
+            for _ in range(self.in_count):
+                put(handle(get()))
+
+    class ParseWorker(Worker):
+        XML = etree.XML
+        def handle(self, xml):
+            return self.XML(xml)
+    class RotateWorker(Worker):
+        def handle(self, element):
+            first = element[0]
+            element[:] = element[1:]
+            element.append(first)
+            return element
+    class ReverseWorker(Worker):
+        def handle(self, element):
+            element[:] = element[::-1]
+            return element
+    class ParseAndExtendWorker(Worker):
+        XML = etree.XML
+        def handle(self, element):
+            element.extend(self.XML(self.xml))
+            return element
+    class SerialiseWorker(Worker):
+        def handle(self, element):
+            return etree.tostring(element)
+
+    xml = _bytes('''\
+<xsl:stylesheet
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    version="1.0">
+  <xsl:output method="xml" />
+  <xsl:template match="/">
+     <div id="test">
+       <xsl:apply-templates/>
+     </div>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+    def _build_pipeline(self, item_count, *classes, **kwargs):
+        in_queue = Queue(item_count)
+        start = last = classes[0](in_queue, item_count, **kwargs)
+        start.setDaemon(True)
+        for worker_class in classes[1:]:
+            last = worker_class(last.out_queue, item_count, **kwargs)
+            last.setDaemon(True)
+            last.start()
+        return (in_queue, start, last)
+
+    def test_thread_pipeline_thread_parse(self):
+        # every item takes the same route, so all results must be identical
+        item_count = self.item_count
+        # build the pipeline; all workers except the first are started here
+        in_queue, start, last = self._build_pipeline(
+            item_count,
+            self.ParseWorker,
+            self.RotateWorker,
+            self.ReverseWorker,
+            self.ParseAndExtendWorker,
+            self.SerialiseWorker,
+            xml = self.xml)
+
+        # fill the queue
+        for _ in range(item_count):
+            in_queue.put(self.xml)
+
+        # start the first thread and thus everything
+        start.start()
+        # make sure the last thread has terminated
+        last.join(60) # time out after 60 seconds
+        self.assertEqual(item_count, last.out_queue.qsize())
+        # read the results
+        get = last.out_queue.get
+        results = [ get() for _ in range(item_count) ]
+
+        comparison = results[0]
+        for result in results[1:]:
+            self.assertEqual(comparison, result)
+
+    def test_thread_pipeline_global_parse(self):
+        # the documents are parsed here, before they enter the worker pipeline
+        item_count = self.item_count
+        XML = self.etree.XML
+        # build the pipeline; all workers except the first are started here
+        in_queue, start, last = self._build_pipeline(
+            item_count,
+            self.RotateWorker,
+            self.ReverseWorker,
+            self.ParseAndExtendWorker,
+            self.SerialiseWorker,
+            xml = self.xml)
+
+        # fill the queue
+        for _ in range(item_count):
+            in_queue.put(XML(self.xml))
+
+        # start the first thread and thus everything
+        start.start()
+        # make sure the last thread has terminated
+        last.join(60) # time out after 60 seconds
+        self.assertEqual(item_count, last.out_queue.qsize())
+        # read the results
+        get = last.out_queue.get
+        results = [ get() for _ in range(item_count) ]
+
+        comparison = results[0]
+        for result in results[1:]:
+            self.assertEqual(comparison, result)
+
+
+def test_suite():
+    """Return both test cases (loaded without the removed makeSuite())."""
+    load = unittest.defaultTestLoader.loadTestsFromTestCase
+    cases = (ThreadingTestCase, ThreadPipelineTestCase)
+    return unittest.TestSuite([load(case) for case in cases])
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_unicode.py b/lib/lxml/tests/test_unicode.py
new file mode 100644
index 00000000..44f4e767
--- /dev/null
+++ b/lib/lxml/tests/test_unicode.py
@@ -0,0 +1,99 @@
+# -*- coding: utf-8 -*-
+import unittest, doctest, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import StringIO, etree, SillyFileLike, HelperTestCase
+from common_imports import _str, _bytes
+
+try:
+    unicode
+except NameError:
+    unicode = str
+
+ascii_uni = _bytes('a').decode('utf8')
+
+klingon = _bytes("\\uF8D2").decode("unicode_escape") # not valid for XML names
+
+invalid_tag = _bytes("test").decode('utf8') + klingon
+
+uni = _bytes('\\xc3\\u0680\\u3120').decode("unicode_escape") # some non-ASCII characters
+
+uxml = _bytes("<test><title>test \\xc3\\xa1\\u3120</title><h1>page \\xc3\\xa1\\u3120 title</h1></test>"
+              ).decode("unicode_escape")
+
+class UnicodeTestCase(HelperTestCase):
+    def test_unicode_xml(self):
+        tree = etree.XML('<p>%s</p>' % uni)
+        self.assertEqual(uni, tree.text)
+
+    def test_wide_unicode_xml(self):
+        if sys.maxunicode < 1114111:
+            return  # skip test
+        tree = etree.XML(_bytes('<p>\\U00026007</p>').decode('unicode_escape'))
+        self.assertEqual(1, len(tree.text))
+        self.assertEqual(_bytes('\\U00026007').decode('unicode_escape'),
+                         tree.text)
+
+    def test_unicode_xml_broken(self):
+        uxml = ('<?xml version="1.0" encoding="UTF-8"?>' +
+                '<p>%s</p>' % uni)
+        self.assertRaises(ValueError, etree.XML, uxml)
+
+    def test_unicode_tag(self):
+        el = etree.Element(uni)
+        self.assertEqual(uni, el.tag)
+
+    def test_unicode_tag_invalid(self):
+        # sadly, Klingon is not well-formed
+        self.assertRaises(ValueError, etree.Element, invalid_tag)
+
+    def test_unicode_nstag(self):
+        tag = "{http://abc/}%s" % uni
+        el = etree.Element(tag)
+        self.assertEqual(tag, el.tag)
+
+    def test_unicode_ns_invalid(self):
+        # namespace URIs must conform to RFC 3986
+        tag = "{http://%s/}abc" % uni
+        self.assertRaises(ValueError, etree.Element, tag)
+
+    def test_unicode_nstag_invalid(self):
+        # sadly, Klingon is not well-formed
+        tag = "{http://abc/}%s" % invalid_tag
+        self.assertRaises(ValueError, etree.Element, tag)
+
+    def test_unicode_qname(self):
+        qname = etree.QName(uni, uni)
+        tag = "{%s}%s" % (uni, uni)
+        self.assertEqual(qname.text, tag)
+        self.assertEqual(unicode(qname), tag)
+
+    def test_unicode_qname_invalid(self):
+        self.assertRaises(ValueError, etree.QName, invalid_tag)
+
+    def test_unicode_attr(self):
+        el = etree.Element('foo', {'bar': uni})
+        self.assertEqual(uni, el.attrib['bar'])
+
+    def test_unicode_comment(self):
+        el = etree.Comment(uni)
+        self.assertEqual(uni, el.text)
+
+    def test_unicode_parse_stringio(self):
+        el = etree.parse(StringIO('<p>%s</p>' % uni)).getroot()
+        self.assertEqual(uni, el.text)
+
+##     def test_parse_fileobject_unicode(self):
+##         # parse unicode from unnamed file object (not supported by ElementTree)
+##         f = SillyFileLike(uxml)
+##         root = etree.parse(f).getroot()
+##         self.assertEqual(unicode(etree.tostring(root, 'UTF-8'), 'UTF-8'),
+##                           uxml)
+
+def test_suite():
+    # unittest.makeSuite() was removed in Python 3.13; use the loader directly
+    load = unittest.defaultTestLoader.loadTestsFromTestCase
+    return unittest.TestSuite([load(UnicodeTestCase)])
diff --git a/lib/lxml/tests/test_xmlschema.py b/lib/lxml/tests/test_xmlschema.py
new file mode 100644
index 00000000..b29a4978
--- /dev/null
+++ b/lib/lxml/tests/test_xmlschema.py
@@ -0,0 +1,442 @@
+# -*- coding: utf-8 -*-
+
+"""
+Test cases related to XML Schema parsing and validation
+"""
+
+import unittest, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, BytesIO, HelperTestCase, fileInTestDir
+from common_imports import doctest, make_doctest
+
+
+class ETreeXMLSchemaTestCase(HelperTestCase):
+    def test_xmlschema(self):
+        tree_valid = self.parse('<a><b></b></a>')
+        tree_invalid = self.parse('<a><c></c></a>')
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema)
+        self.assertTrue(schema.validate(tree_valid))
+        self.assertFalse(schema.validate(tree_invalid))
+        self.assertTrue(schema.validate(tree_valid))     # retry valid
+        self.assertFalse(schema.validate(tree_invalid))  # retry invalid
+
+    def test_xmlschema_error_log(self):
+        tree_valid = self.parse('<a><b></b></a>')
+        tree_invalid = self.parse('<a><c></c></a>')
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema)
+        self.assertTrue(schema.validate(tree_valid))
+        self.assertFalse(schema.error_log.filter_from_errors())
+
+        self.assertFalse(schema.validate(tree_invalid))
+        self.assertTrue(schema.error_log.filter_from_errors())
+        self.assertTrue(schema.error_log.filter_types(
+            etree.ErrorTypes.SCHEMAV_ELEMENT_CONTENT))
+
+        self.assertTrue(schema.validate(tree_valid))
+        self.assertFalse(schema.error_log.filter_from_errors())
+
+        self.assertFalse(schema.validate(tree_invalid))
+        self.assertTrue(schema.error_log.filter_from_errors())
+        self.assertTrue(schema.error_log.filter_types(
+            etree.ErrorTypes.SCHEMAV_ELEMENT_CONTENT))
+
+    def test_xmlschema_default_attributes(self):
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence minOccurs="4" maxOccurs="4">
+      <xsd:element name="b" type="BType" />
+    </xsd:sequence>
+  </xsd:complexType>
+  <xsd:complexType name="BType">
+    <xsd:attribute name="hardy" type="xsd:string" default="hey" />
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema, attribute_defaults=True)
+
+        tree = self.parse('<a><b hardy="ho"/><b/><b hardy="ho"/><b/></a>')
+
+        root = tree.getroot()
+        self.assertEqual('ho', root[0].get('hardy'))
+        self.assertEqual(None, root[1].get('hardy'))
+        self.assertEqual('ho', root[2].get('hardy'))
+        self.assertEqual(None, root[3].get('hardy'))
+
+        self.assertTrue(schema(tree))
+
+        root = tree.getroot()
+        self.assertEqual('ho', root[0].get('hardy'))
+        self.assertEqual('hey', root[1].get('hardy'))
+        self.assertEqual('ho', root[2].get('hardy'))
+        self.assertEqual('hey', root[3].get('hardy'))
+
+    def test_xmlschema_parse(self):
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema)
+        parser = etree.XMLParser(schema=schema)
+
+        tree_valid = self.parse('<a><b></b></a>', parser=parser)
+        self.assertEqual('a', tree_valid.getroot().tag)
+
+        self.assertRaises(etree.XMLSyntaxError,
+                          self.parse, '<a><c></c></a>', parser=parser)
+
+    def test_xmlschema_parse_default_attributes(self):
+        # does not work as of libxml2 2.7.3
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence minOccurs="4" maxOccurs="4">
+      <xsd:element name="b" type="BType" />
+    </xsd:sequence>
+  </xsd:complexType>
+  <xsd:complexType name="BType">
+    <xsd:attribute name="hardy" type="xsd:string" default="hey" />
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema)
+        parser = etree.XMLParser(schema=schema, attribute_defaults=True)
+
+        tree_valid = self.parse('<a><b hardy="ho"/><b/><b hardy="ho"/><b/></a>',
+                                parser=parser)
+        root = tree_valid.getroot()
+        self.assertEqual('ho', root[0].get('hardy'))
+        self.assertEqual('hey', root[1].get('hardy'))
+        self.assertEqual('ho', root[2].get('hardy'))
+        self.assertEqual('hey', root[3].get('hardy'))
+
+    def test_xmlschema_parse_default_attributes_schema_config(self):
+        # does not work as of libxml2 2.7.3
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence minOccurs="4" maxOccurs="4">
+      <xsd:element name="b" type="BType" />
+    </xsd:sequence>
+  </xsd:complexType>
+  <xsd:complexType name="BType">
+    <xsd:attribute name="hardy" type="xsd:string" default="hey" />
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema, attribute_defaults=True)
+        parser = etree.XMLParser(schema=schema)
+
+        tree_valid = self.parse('<a><b hardy="ho"/><b/><b hardy="ho"/><b/></a>',
+                                parser=parser)
+        root = tree_valid.getroot()
+        self.assertEqual('ho', root[0].get('hardy'))
+        self.assertEqual('hey', root[1].get('hardy'))
+        self.assertEqual('ho', root[2].get('hardy'))
+        self.assertEqual('hey', root[3].get('hardy'))
+
+    def test_xmlschema_parse_fixed_attributes(self):
+        # does not work as of libxml2 2.7.3
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence minOccurs="3" maxOccurs="3">
+      <xsd:element name="b" type="BType" />
+    </xsd:sequence>
+  </xsd:complexType>
+  <xsd:complexType name="BType">
+    <xsd:attribute name="hardy" type="xsd:string" fixed="hey" />
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema)
+        parser = etree.XMLParser(schema=schema, attribute_defaults=True)
+
+        tree_valid = self.parse('<a><b/><b hardy="hey"/><b/></a>',
+                                parser=parser)
+        root = tree_valid.getroot()
+        self.assertEqual('hey', root[0].get('hardy'))
+        self.assertEqual('hey', root[1].get('hardy'))
+        self.assertEqual('hey', root[2].get('hardy'))
+
+    def test_xmlschema_stringio(self):
+        schema_file = BytesIO('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(file=schema_file)
+        parser = etree.XMLParser(schema=schema)
+
+        tree_valid = self.parse('<a><b></b></a>', parser=parser)
+        self.assertEqual('a', tree_valid.getroot().tag)
+
+        self.assertRaises(etree.XMLSyntaxError,
+                          self.parse, '<a><c></c></a>', parser=parser)
+
+    def test_xmlschema_iterparse(self):
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema)
+        xml = BytesIO('<a><b></b></a>')
+        events = [ (event, el.tag)
+                   for (event, el) in etree.iterparse(xml, schema=schema) ]
+
+        self.assertEqual([('end', 'b'), ('end', 'a')],
+                          events)
+
+    def test_xmlschema_iterparse_fail(self):
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema)
+        self.assertRaises(
+            etree.XMLSyntaxError,
+            list, etree.iterparse(BytesIO('<a><c></c></a>'), schema=schema))
+
+    def test_xmlschema_elementtree_error(self):
+        self.assertRaises(ValueError, etree.XMLSchema, etree.ElementTree())
+
+    def test_xmlschema_comment_error(self):
+        self.assertRaises(ValueError, etree.XMLSchema, etree.Comment('TEST'))
+
+    def test_xmlschema_illegal_validation_error(self):
+        schema = self.parse('''
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="xsd:string"/>
+</xsd:schema>
+''')
+        schema = etree.XMLSchema(schema)
+
+        root = etree.Element('a')
+        root.text = 'TEST'
+        self.assertTrue(schema(root))
+
+        self.assertRaises(ValueError, schema, etree.Comment('TEST'))
+        self.assertRaises(ValueError, schema, etree.PI('a', 'text'))
+        self.assertRaises(ValueError, schema, etree.Entity('text'))
+
+    def test_xmlschema_invalid_schema1(self):
+        schema = self.parse('''\
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
+''')
+        self.assertRaises(etree.XMLSchemaParseError,
+                          etree.XMLSchema, schema)
+
+    def test_xmlschema_invalid_schema2(self):
+        schema = self.parse('<test/>')
+        self.assertRaises(etree.XMLSchemaParseError,
+                          etree.XMLSchema, schema)
+
+    def test_xmlschema_file(self):
+        # this will only work if we access the file through path or
+        # file object..
+        f = open(fileInTestDir('test.xsd'), 'rb')
+        try:
+            schema = etree.XMLSchema(file=f)
+        finally:
+            f.close()
+        tree_valid = self.parse('<a><b></b></a>')
+        self.assertTrue(schema.validate(tree_valid))
+
+    def test_xmlschema_import_file(self):
+        # this will only work if we access the file through path or
+        # file object..
+        schema = etree.XMLSchema(file=fileInTestDir('test_import.xsd'))
+        tree_valid = self.parse(
+            '<a:x xmlns:a="http://codespeak.net/lxml/schema/ns1"><b></b></a:x>')
+        self.assertTrue(schema.validate(tree_valid))
+
+    def test_xmlschema_shortcut(self):
+        tree_valid = self.parse('<a><b></b></a>')
+        tree_invalid = self.parse('<a><c></c></a>')
+        schema = self.parse('''\
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">
+  <xsd:element name="a" type="AType"/>
+  <xsd:complexType name="AType">
+    <xsd:sequence>
+      <xsd:element name="b" type="xsd:string" />
+    </xsd:sequence>
+  </xsd:complexType>
+</xsd:schema>
+''')
+        self.assertTrue(tree_valid.xmlschema(schema))
+        self.assertFalse(tree_invalid.xmlschema(schema))
+
+
+class ETreeXMLSchemaResolversTestCase(HelperTestCase):
+    resolver_schema_int = BytesIO("""\
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema"
+    xmlns:etype="http://codespeak.net/lxml/test/external"
+    targetNamespace="http://codespeak.net/lxml/test/internal">
+        <xsd:import namespace="http://codespeak.net/lxml/test/external" schemaLocation="XXX.xsd" />
+        <xsd:element name="a" type="etype:AType"/>
+</xsd:schema>""")
+
+    resolver_schema_int2 = BytesIO("""\
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema"
+    xmlns:etype="http://codespeak.net/lxml/test/external"
+    targetNamespace="http://codespeak.net/lxml/test/internal">
+        <xsd:import namespace="http://codespeak.net/lxml/test/external" schemaLocation="YYY.xsd" />
+        <xsd:element name="a" type="etype:AType"/>
+</xsd:schema>""")
+
+    resolver_schema_ext = """\
+<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema"
+    targetNamespace="http://codespeak.net/lxml/test/external">
+    <xsd:complexType name="AType">
+      <xsd:sequence><xsd:element name="b" type="xsd:string" minOccurs="0" maxOccurs="unbounded" /></xsd:sequence>
+    </xsd:complexType>
+</xsd:schema>""" 
+
+    class simple_resolver(etree.Resolver):
+        def __init__(self, schema):
+            self.schema = schema
+
+        def resolve(self, url, id, context):
+            assert url == 'XXX.xsd'
+            return self.resolve_string(self.schema, context)
+
+    # tests:
+
+    def test_xmlschema_resolvers(self):
+        # test that resolvers work with schema.
+        parser = etree.XMLParser()
+        parser.resolvers.add(self.simple_resolver(self.resolver_schema_ext))
+        schema_doc = etree.parse(self.resolver_schema_int, parser = parser)
+        schema = etree.XMLSchema(schema_doc)
+
+    def test_xmlschema_resolvers_root(self):
+        # the default parser's resolvers are used if no specific parser is given
+        root_resolver = self.simple_resolver(self.resolver_schema_ext)
+        etree.get_default_parser().resolvers.add(root_resolver)
+        try:  # always unregister, or a failure here leaks into other tests
+            etree.XMLSchema(etree.parse(self.resolver_schema_int))
+        finally:
+            etree.get_default_parser().resolvers.remove(root_resolver)
+
+    def test_xmlschema_resolvers_noroot(self):
+        # test that the default resolver will not get called when a
+        # more specific resolver is registered.
+
+        class res_root(etree.Resolver):
+            def resolve(self, url, id, context):
+                assert False
+                return None
+
+        root_resolver = res_root()
+        etree.get_default_parser().resolvers.add(root_resolver)
+        try:  # always unregister, or a failure here leaks into other tests
+            parser = etree.XMLParser()
+            parser.resolvers.add(self.simple_resolver(self.resolver_schema_ext))
+            schema_doc = etree.parse(self.resolver_schema_int, parser = parser)
+            schema = etree.XMLSchema(schema_doc)
+        finally:
+            etree.get_default_parser().resolvers.remove(root_resolver)
+
+    def test_xmlschema_nested_resolvers(self):
+        # test that resolvers work in a nested fashion.
+
+        resolver_schema = self.resolver_schema_ext
+
+        class res_nested(etree.Resolver):
+            def __init__(self, ext_schema):
+                self.ext_schema = ext_schema
+
+            def resolve(self, url, id, context):
+                assert url == 'YYY.xsd'
+                return self.resolve_string(self.ext_schema, context)
+
+        class res(etree.Resolver):
+            def __init__(self, ext_schema_1, ext_schema_2):
+                self.ext_schema_1 = ext_schema_1
+                self.ext_schema_2 = ext_schema_2
+
+            def resolve(self, url, id, context):
+                assert url == 'XXX.xsd'
+
+                new_parser = etree.XMLParser()
+                new_parser.resolvers.add(res_nested(self.ext_schema_2))
+                new_schema_doc = etree.parse(self.ext_schema_1, parser = new_parser)
+                new_schema = etree.XMLSchema(new_schema_doc)
+
+                return self.resolve_string(resolver_schema, context)
+
+        parser = etree.XMLParser()
+        parser.resolvers.add(res(self.resolver_schema_int2, self.resolver_schema_ext))
+        schema_doc = etree.parse(self.resolver_schema_int, parser = parser)
+        schema = etree.XMLSchema(schema_doc)
+
+
+def test_suite():
+    # unittest.makeSuite() was removed in Python 3.13; use the loader directly
+    load = unittest.defaultTestLoader.loadTestsFromTestCase
+    return unittest.TestSuite([
+        load(ETreeXMLSchemaTestCase), load(ETreeXMLSchemaResolversTestCase),
+        make_doctest('../../../doc/validation.txt'),
+    ])
+
+
+if __name__ == '__main__':
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_xpathevaluator.py b/lib/lxml/tests/test_xpathevaluator.py
new file mode 100644
index 00000000..a2df6ddb
--- /dev/null
+++ b/lib/lxml/tests/test_xpathevaluator.py
@@ -0,0 +1,750 @@
+# -*- coding: utf-8 -*-
+
+"""
+Test cases related to XPath evaluation and the XPath class
+"""
+
+import unittest, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+from common_imports import etree, HelperTestCase, _bytes, BytesIO
+from common_imports import doctest, make_doctest
+
+class ETreeXPathTestCase(HelperTestCase):
+    """XPath tests etree"""
+
+    def test_xpath_boolean(self):
+        tree = self.parse('<a><b></b><b></b></a>')
+        self.assertTrue(tree.xpath('boolean(/a/b)'))
+        self.assertTrue(not tree.xpath('boolean(/a/c)'))
+
+    def test_xpath_number(self):
+        tree = self.parse('<a>1</a>')
+        self.assertEqual(1.,
+                          tree.xpath('number(/a)'))
+        tree = self.parse('<a>A</a>')
+        actual = str(tree.xpath('number(/a)'))
+        expected = ['nan', '1.#qnan', 'nanq']
+        if not actual.lower() in expected:
+            self.fail('Expected a NAN value, got %s' % actual)
+        
+    def test_xpath_string(self):
+        tree = self.parse('<a>Foo</a>')
+        self.assertEqual('Foo',
+                          tree.xpath('string(/a/text())'))
+
+    def test_xpath_document_root(self):
+        tree = self.parse('<a><b/></a>')
+        self.assertEqual([],
+                          tree.xpath('/'))
+
+    def test_xpath_namespace(self):
+        tree = self.parse('<a xmlns="test" xmlns:p="myURI"/>')
+        self.assertTrue((None, "test") in tree.xpath('namespace::*'))
+        self.assertTrue(('p', 'myURI') in tree.xpath('namespace::*'))
+
+    def test_xpath_namespace_empty(self):
+        tree = self.parse('<a/>')
+        self.assertEqual([('xml', 'http://www.w3.org/XML/1998/namespace')],
+                          tree.xpath('namespace::*'))
+
+    def test_xpath_list_elements(self):
+        tree = self.parse('<a><b>Foo</b><b>Bar</b></a>')
+        root = tree.getroot()
+        self.assertEqual([root[0], root[1]],
+                          tree.xpath('/a/b'))
+
+    def test_xpath_list_nothing(self):
+        tree = self.parse('<a><b/></a>')
+        self.assertEqual([],
+                          tree.xpath('/a/c'))
+        # this seems to pass a different code path, also should return nothing
+        self.assertEqual([],
+                          tree.xpath('/a/c/text()'))
+    
+    def test_xpath_list_text(self):
+        tree = self.parse('<a><b>Foo</b><b>Bar</b></a>')
+        root = tree.getroot()
+        self.assertEqual(['Foo', 'Bar'],
+                          tree.xpath('/a/b/text()'))
+
+    def test_xpath_list_text_parent(self):
+        tree = self.parse('<a><b>FooBar</b><b>BarFoo</b></a>')
+        root = tree.getroot()
+        self.assertEqual(['FooBar', 'BarFoo'],
+                          tree.xpath('/a/b/text()'))
+        self.assertEqual([root[0], root[1]],
+                          [r.getparent() for r in tree.xpath('/a/b/text()')])
+
+    def test_xpath_list_text_parent_no_smart_strings(self):
+        tree = self.parse('<a><b>FooBar</b><b>BarFoo</b></a>')
+        root = tree.getroot()
+        self.assertEqual(['FooBar', 'BarFoo'],
+                          tree.xpath('/a/b/text()', smart_strings=True))
+        self.assertEqual([root[0], root[1]],
+                          [r.getparent() for r in
+                           tree.xpath('/a/b/text()', smart_strings=True)])
+        self.assertEqual([None, None],
+                          [r.attrname for r in
+                           tree.xpath('/a/b/text()', smart_strings=True)])
+
+        self.assertEqual(['FooBar', 'BarFoo'],
+                          tree.xpath('/a/b/text()', smart_strings=False))
+        self.assertEqual([False, False],
+                          [hasattr(r, 'getparent') for r in
+                           tree.xpath('/a/b/text()', smart_strings=False)])
+        self.assertEqual([False, False],
+                          [hasattr(r, 'attrname') for r in
+                           tree.xpath('/a/b/text()', smart_strings=False)])
+
+    def test_xpath_list_unicode_text_parent(self):
+        xml = _bytes('<a><b>FooBar\\u0680\\u3120</b><b>BarFoo\\u0680\\u3120</b></a>').decode("unicode_escape")
+        tree = self.parse(xml.encode('utf-8'))
+        root = tree.getroot()
+        self.assertEqual([_bytes('FooBar\\u0680\\u3120').decode("unicode_escape"),
+                           _bytes('BarFoo\\u0680\\u3120').decode("unicode_escape")],
+                          tree.xpath('/a/b/text()'))
+        self.assertEqual([root[0], root[1]],
+                          [r.getparent() for r in tree.xpath('/a/b/text()')])
+
+    def test_xpath_list_attribute(self):
+        tree = self.parse('<a b="B" c="C"/>')
+        self.assertEqual(['B'],
+                          tree.xpath('/a/@b'))
+
+    def test_xpath_list_attribute_parent(self):
+        tree = self.parse('<a b="BaSdFgHjKl" c="CqWeRtZuI"/>')
+        results = tree.xpath('/a/@c')
+        self.assertEqual(1, len(results))
+        self.assertEqual('CqWeRtZuI', results[0])
+        self.assertEqual(tree.getroot().tag, results[0].getparent().tag)
+
+    def test_xpath_list_attribute_parent_no_smart_strings(self):
+        tree = self.parse('<a b="BaSdFgHjKl" c="CqWeRtZuI"/>')
+
+        results = tree.xpath('/a/@c', smart_strings=True)
+        self.assertEqual(1, len(results))
+        self.assertEqual('CqWeRtZuI', results[0])
+        self.assertEqual('c', results[0].attrname)
+        self.assertEqual(tree.getroot().tag, results[0].getparent().tag)
+
+        results = tree.xpath('/a/@c', smart_strings=False)
+        self.assertEqual(1, len(results))
+        self.assertEqual('CqWeRtZuI', results[0])
+        self.assertEqual(False, hasattr(results[0], 'getparent'))
+        self.assertEqual(False, hasattr(results[0], 'attrname'))
+
+    def test_xpath_text_from_other_document(self):
+        xml_data = '''
+        <table>
+                <item xml:id="k1"><value>v1</value></item>
+                <item xml:id="k2"><value>v2</value></item>
+        </table>
+        '''
+
+        def lookup(dummy, id):
+            return etree.XML(xml_data).xpath('id(%r)' % id)
+        functions = {(None, 'lookup') : lookup}
+
+        root = etree.XML('<dummy/>')
+        values = root.xpath("lookup('k1')/value/text()",
+                           extensions=functions)
+        self.assertEqual(['v1'], values)
+        self.assertEqual('value', values[0].getparent().tag)
+
+    def test_xpath_list_comment(self):
+        tree = self.parse('<a><!-- Foo --></a>')
+        self.assertEqual(['<!-- Foo -->'],
+                          list(map(repr, tree.xpath('/a/node()'))))
+
+    def test_rel_xpath_boolean(self):
+        root = etree.XML('<a><b><c/></b></a>')
+        el = root[0]
+        self.assertTrue(el.xpath('boolean(c)'))
+        self.assertTrue(not el.xpath('boolean(d)'))
+
+    def test_rel_xpath_list_elements(self):
+        tree = self.parse('<a><c><b>Foo</b><b>Bar</b></c><c><b>Hey</b></c></a>')
+        root = tree.getroot()
+        c = root[0]
+        self.assertEqual([c[0], c[1]],
+                          c.xpath('b'))
+        self.assertEqual([c[0], c[1], root[1][0]],
+                          c.xpath('//b'))
+
+    def test_xpath_ns(self):
+        tree = self.parse('<a xmlns="uri:a"><b></b></a>')
+        root = tree.getroot()
+        self.assertEqual(
+            [root[0]],
+            tree.xpath('//foo:b', namespaces={'foo': 'uri:a'}))
+        self.assertEqual(
+            [],
+            tree.xpath('//foo:b', namespaces={'foo': 'uri:c'}))
+        self.assertEqual(
+            [root[0]],
+            root.xpath('//baz:b', namespaces={'baz': 'uri:a'}))
+
+    def test_xpath_ns_none(self):
+        tree = self.parse('<a xmlns="uri:a"><b></b></a>')
+        root = tree.getroot()
+        self.assertRaises(
+            TypeError,
+            root.xpath, '//b', namespaces={None: 'uri:a'})
+
+    def test_xpath_ns_empty(self):
+        tree = self.parse('<a xmlns="uri:a"><b></b></a>')
+        root = tree.getroot()
+        self.assertRaises(
+            TypeError,
+            root.xpath, '//b', namespaces={'': 'uri:a'})
+
+    def test_xpath_error(self):
+        tree = self.parse('<a/>')
+        self.assertRaises(etree.XPathEvalError, tree.xpath, '\\fad')
+
+    def test_xpath_class_error(self):
+        self.assertRaises(SyntaxError, etree.XPath, '\\fad')
+        self.assertRaises(etree.XPathSyntaxError, etree.XPath, '\\fad')
+
+    def test_xpath_prefix_error(self):
+        tree = self.parse('<a/>')
+        self.assertRaises(etree.XPathEvalError, tree.xpath, '/fa:d')
+
+    def test_xpath_class_prefix_error(self):
+        tree = self.parse('<a/>')
+        xpath = etree.XPath("/fa:d")
+        self.assertRaises(etree.XPathEvalError, xpath, tree)
+
+    def test_elementtree_getpath(self):
+        a  = etree.Element("a")
+        b  = etree.SubElement(a, "b")
+        c  = etree.SubElement(a, "c")
+        d1 = etree.SubElement(c, "d")
+        d2 = etree.SubElement(c, "d")
+
+        tree = etree.ElementTree(a)
+        self.assertEqual('/a/c/d',
+                         tree.getpath(d2)[:6])
+        self.assertEqual([d2],
+                         tree.xpath(tree.getpath(d2)))
+
+    def test_elementtree_getpath_partial(self):
+        a  = etree.Element("a")
+        b  = etree.SubElement(a, "b")
+        c  = etree.SubElement(a, "c")
+        d1 = etree.SubElement(c, "d")
+        d2 = etree.SubElement(c, "d")
+
+        tree = etree.ElementTree(c)
+        self.assertEqual('/c/d',
+                         tree.getpath(d2)[:4])
+        self.assertEqual([d2],
+                         tree.xpath(tree.getpath(d2)))
+
+    def test_xpath_evaluator(self):
+        tree = self.parse('<a><b><c></c></b></a>')
+        e = etree.XPathEvaluator(tree)
+        root = tree.getroot()
+        self.assertEqual(
+            [root],
+            e('//a'))
+
+    def test_xpath_evaluator_tree(self):
+        tree = self.parse('<a><b><c></c></b></a>')
+        child_tree = etree.ElementTree(tree.getroot()[0])
+        e = etree.XPathEvaluator(child_tree)
+        self.assertEqual(
+            [],
+            e('a'))
+        root = child_tree.getroot()
+        self.assertEqual(
+            [root[0]],
+            e('c'))
+
+    def test_xpath_evaluator_tree_absolute(self):
+        tree = self.parse('<a><b><c></c></b></a>')
+        child_tree = etree.ElementTree(tree.getroot()[0])
+        e = etree.XPathEvaluator(child_tree)
+        self.assertEqual(
+            [],
+            e('/a'))
+        root = child_tree.getroot()
+        self.assertEqual(
+            [root],
+            e('/b'))
+        self.assertEqual(
+            [],
+            e('/c'))
+
+    def test_xpath_evaluator_element(self):
+        tree = self.parse('<a><b><c></c></b></a>')
+        root = tree.getroot()
+        e = etree.XPathEvaluator(root[0])
+        self.assertEqual(
+            [root[0][0]],
+            e('c'))
+        
+    def test_xpath_extensions(self):
+        def foo(evaluator, a):
+            return 'hello %s' % a
+        extension = {(None, 'foo'): foo}
+        tree = self.parse('<a><b></b></a>')
+        e = etree.XPathEvaluator(tree, extensions=[extension])
+        self.assertEqual(
+            "hello you", e("foo('you')"))
+
+    def test_xpath_extensions_wrong_args(self):
+        # foo() takes two XPath arguments but the expression passes only one
+        def two_args(evaluator, a, b):
+            return "hello %s and %s" % (a, b)
+        evaluate = etree.XPathEvaluator(self.parse('<a><b></b></a>'),
+                                        extensions=[{(None, 'foo'): two_args}])
+        self.assertRaises(TypeError, evaluate, "foo('you')")
+
+    def test_xpath_extensions_error(self):
+        # an exception raised inside the extension reaches the caller
+        def failing(evaluator, a):
+            return 1/0
+        evaluate = etree.XPathEvaluator(self.parse('<a/>'),
+                                        extensions=[{(None, 'foo'): failing}])
+        self.assertRaises(ZeroDivisionError, evaluate, "foo('test')")
+
+    def test_xpath_extensions_nodes(self):
+        # the extension returns a freshly built element and the
+        # expression then steps into its <result> children
+        def f(evaluator, arg):
+            results = etree.Element('results')
+            for text in ('Hoi', 'Dag'):
+                etree.SubElement(results, 'result').text = text
+            return results
+
+        doc = self.parse('<a/>')
+        evaluate = etree.XPathEvaluator(doc, extensions=[{(None, 'foo'): f}])
+        matches = evaluate("foo('World')/result")
+        self.assertEqual(2, len(matches))
+        self.assertEqual(['Hoi', 'Dag'],
+                         [match.text for match in matches])
+
+    def test_xpath_extensions_nodes_append(self):
+        # the extension grows the document itself: the new nodes are
+        # created below the element it receives as argument
+        def f(evaluator, nodes):
+            results = etree.SubElement(nodes[0], 'results')
+            for text in ('Hoi', 'Dag'):
+                etree.SubElement(results, 'result').text = text
+            return results
+
+        doc = self.parse('<a/>')
+        evaluate = etree.XPathEvaluator(doc, extensions=[{(None, 'foo'): f}])
+        matches = evaluate("foo(/*)/result")
+        self.assertEqual(2, len(matches))
+        self.assertEqual(['Hoi', 'Dag'],
+                         [match.text for match in matches])
+
+    def test_xpath_extensions_nodes_append2(self):
+        # opposite direction: the node handed in from the document is
+        # appended to the newly built result element
+        def f(evaluator, nodes):
+            results = etree.Element('results')
+            for text in ('Hoi', 'Dag'):
+                etree.SubElement(results, 'result').text = text
+            results.append(nodes[0])
+            return results
+
+        doc = self.parse('<result>Honk</result>')
+        evaluate = etree.XPathEvaluator(doc, extensions=[{(None, 'foo'): f}])
+        matches = evaluate("foo(/*)/result")
+        # 'Honk' is expected last, after the two nodes created before it
+        self.assertEqual(3, len(matches))
+        self.assertEqual(['Hoi', 'Dag', 'Honk'],
+                         [match.text for match in matches])
+
+    def test_xpath_context_node(self):
+        doc = self.parse('<root><a/><b><c/></b></root>')
+        seen_tags = []
+
+        def check_context(ctxt, nodes):
+            # '.' arrives as a one-element node-set that must be the
+            # same node the context object reports
+            self.assertEqual(len(nodes), 1)
+            node = nodes[0]
+            seen_tags.append(node.tag)
+            self.assertEqual(ctxt.context_node, node)
+            return True
+
+        find = etree.XPath("//*[p:foo(.)]", namespaces={'p' : 'ns'},
+                           extensions=[{('ns', 'foo') : check_context}])
+        find(doc)
+        self.assertEqual(sorted(seen_tags), ["a", "b", "c", "root"])
+
+    def test_xpath_eval_context_propagation(self):
+        doc = self.parse('<root><a/><b><c/></b></root>')
+        b_entry_seen = {}
+
+        def check_context(ctxt, nodes):
+            self.assertEqual(len(nodes), 1)
+            tag = nodes[0].tag
+            # record what is stored under "b" so far: nothing while <b>
+            # is being tested, "b" by the time <c> is tested
+            b_entry_seen[tag] = ctxt.eval_context.get("b")
+            ctxt.eval_context[tag] = tag
+            return True
+
+        find = etree.XPath("//b[p:foo(.)]/c[p:foo(.)]",
+                           namespaces={'p' : 'ns'},
+                           extensions=[{('ns', 'foo') : check_context}])
+        result = find(doc)
+        self.assertEqual(result, [doc.getroot()[1][0]])
+        self.assertEqual(b_entry_seen, {'b':None, 'c':'b'})
+
+    def test_xpath_eval_context_clear(self):
+        doc = self.parse('<root><a/><b><c/></b></root>')
+        calls = {}
+
+        def check_context(ctxt):
+            calls["done"] = True
+            # context must be empty for each new evaluation
+            self.assertEqual(len(ctxt.eval_context), 0)
+            ctxt.eval_context["test"] = True
+            return True
+
+        def evaluate_once():
+            # compile a fresh XPath object, run it and check the outcome
+            find = etree.XPath("//b[p:foo()]",
+                               namespaces={'p' : 'ns'},
+                               extensions=[{('ns', 'foo') : check_context}])
+            result = find(doc)
+            self.assertEqual(result, [doc.getroot()[1]])
+            self.assertEqual(calls["done"], True)
+
+        # the first evaluation stores a "test" entry in its
+        # evaluation context ...
+        evaluate_once()
+
+        # ... which must not be visible when the second one starts
+        calls.clear()
+        evaluate_once()
+
+    def test_xpath_variables(self):
+        # $aval is bound per call through a keyword argument
+        doc = self.parse('<a attr="true"/>')
+        evaluate = etree.XPathEvaluator(doc)
+
+        expr = "/a[@attr=$aval]"
+
+        # the number 1 does not select the element
+        self.assertEqual(0, len(evaluate(expr, aval=1)))
+
+        # the string "true" and the boolean True both select <a>
+        for value in ("true", True):
+            matches = evaluate(expr, aval=value)
+            self.assertEqual(1, len(matches))
+            self.assertEqual("true", matches[0].get('attr'))
+
+    def test_xpath_variables_nodeset(self):
+        # an element passed as variable comes back as a one-node result
+        doc = self.parse('<a attr="true"/>')
+        evaluate = etree.XPathEvaluator(doc)
+
+        element = etree.Element("test-el")
+        etree.SubElement(element, "test-sub")
+        matches = evaluate("$value", value=element)
+        self.assertEqual(1, len(matches))
+        self.assertEqual(element.tag, matches[0].tag)
+        self.assertEqual(element[0].tag, matches[0][0].tag)
+
+    def test_xpath_extensions_mix(self):
+        x = self.parse('<a attr="true"><test/></a>')
+
+        class LocalException(Exception):
+            pass
+
+        def foo(evaluator, a, varval):
+            etree.Element("DUMMY")  # created and dropped again; the return value is unused
+            if varval == 0:
+                raise LocalException
+            elif varval == 1:
+                return ()  # empty sequence
+            elif varval == 2:
+                return None  # checked below to give a zero-length result as well
+            elif varval == 3:
+                return a[0][0]  # first child of the first node in a
+            a = a[0]  # any other value is compared against the 'attr' attribute
+            if a.get("attr") == str(varval):
+                return a
+            else:
+                return etree.Element("NODE")  # element that is not part of the parsed tree
+
+        extension = {(None, 'foo'): foo}
+        e = etree.XPathEvaluator(x, extensions=[extension])
+        del x  # drop the local name; only the evaluator e is used from here on
+
+        self.assertRaises(LocalException, e, "foo(., 0)")
+        self.assertRaises(LocalException, e, "foo(., $value)", value=0)
+
+        r = e("foo(., $value)", value=1)
+        self.assertEqual(len(r), 0)
+
+        r = e("foo(.,  1)")
+        self.assertEqual(len(r), 0)
+
+        r = e("foo(., $value)", value=2)
+        self.assertEqual(len(r), 0)
+
+        r = e("foo(., $value)", value=3)
+        self.assertEqual(len(r), 1)
+        self.assertEqual(r[0].tag, "test")
+
+        r = e("foo(., $value)", value="false")
+        self.assertEqual(len(r), 1)
+        self.assertEqual(r[0].tag, "NODE")
+
+        r = e("foo(., 'false')")
+        self.assertEqual(len(r), 1)
+        self.assertEqual(r[0].tag, "NODE")
+
+        r = e("foo(., 'true')")
+        self.assertEqual(len(r), 1)
+        self.assertEqual(r[0].tag, "a")
+        self.assertEqual(r[0][0].tag, "test")
+
+        r = e("foo(., $value)", value="true")
+        self.assertEqual(len(r), 1)
+        self.assertEqual(r[0].tag, "a")
+
+        self.assertRaises(LocalException, e, "foo(., 0)")  # same two error cases as at the start, repeated after all other calls
+        self.assertRaises(LocalException, e, "foo(., $value)", value=0)
+
+
+class ETreeXPathClassTestCase(HelperTestCase):
+    "Tests for the XPath class"
+    def test_xpath_compile_doc(self):
+        # compiled expressions are called with the document to search
+        doc = self.parse('<a attr="true"/>')
+
+        unequal = etree.XPath("/a[@attr != 'true']")
+        self.assertEqual(0, len(unequal(doc)))
+
+        equal = etree.XPath("/a[@attr = 'true']")
+        self.assertEqual(1, len(equal(doc)))
+
+        # an XPath object compiled from the .path of another one
+        # finds the same single element
+        recompiled = etree.XPath( equal.path )
+        self.assertEqual(1, len(recompiled(doc)))
+
+    def test_xpath_compile_element(self):
+        # compiled expressions also accept an element; './...' is
+        # then evaluated relative to that element
+        doc = self.parse('<a><b/><c/></a>')
+        root = doc.getroot()
+
+        b_children = etree.XPath("./b")(root)
+        self.assertEqual(1, len(b_children))
+        self.assertEqual('b', b_children[0].tag)
+
+        all_children = etree.XPath("./*")(root)
+        self.assertEqual(2, len(all_children))
+
+    def test_xpath_compile_vars(self):
+        # variable values are passed as keyword arguments of the call
+        doc = self.parse('<a attr="true"/>')
+
+        find = etree.XPath("/a[@attr=$aval]")
+
+        self.assertEqual(0, len(find(doc, aval=False)))
+
+        self.assertEqual(1, len(find(doc, aval=True)))
+
+    def test_xpath_compile_error(self):
+        self.assertRaises(SyntaxError, etree.XPath, '\\fad')  # rejected at compile time
+
+    def test_xpath_elementtree_error(self):
+        self.assertRaises(ValueError, etree.XPath('*'), etree.ElementTree())  # tree has no root
+
+
+class ETreeXPathExsltTestCase(HelperTestCase):
+    "Tests for the EXSLT support in XPath (requires libxslt 1.1.25+)"
+
+    NSMAP = {
+        'date': "http://exslt.org/dates-and-times",
+        'math': "http://exslt.org/math",
+        'set':  "http://exslt.org/sets",
+        'str':  "http://exslt.org/strings",
+        }
+
+    def test_xpath_exslt_functions_date(self):
+        # only the first <b> holds a date from the year 2009
+        doc = self.parse('<a><b>2009-11-12</b><b>2008-12-11</b></a>')
+        expr = '//b[date:year(string()) = 2009]'
+        matches = doc.xpath(expr, namespaces=self.NSMAP)
+        self.assertTrue(matches, str(matches))
+        self.assertEqual(len(matches), 1, str(matches))
+        self.assertEqual(matches[0].text, '2009-11-12')
+
+    def test_xpath_exslt_functions_strings(self):
+        # str:align() is asked to centre the first date on a line
+        # of twenty dashes
+        doc = self.parse('<a><b>2009-11-12</b><b>2008-12-11</b></a>')
+        expr = 'str:align(string(//b[1]), "%s", "center")' % ('-'*20)
+        aligned = doc.xpath(expr, namespaces=self.NSMAP)
+        self.assertTrue(aligned, str(aligned))
+        self.assertEqual(aligned, '-----2009-11-12-----')
+
+
+class ETreeETXPathClassTestCase(HelperTestCase):
+    "Tests for the ETXPath class"
+    def test_xpath_compile_ns(self):
+        # ETXPath takes namespaces in the {uri}name notation; no
+        # prefix mapping is passed
+        doc = self.parse('<a><b xmlns="nsa"/><b xmlns="nsb"/></a>')
+
+        in_nsa = etree.ETXPath("/a/{nsa}b")(doc)
+        self.assertEqual(1, len(in_nsa))
+        self.assertEqual('{nsa}b', in_nsa[0].tag)
+
+        in_nsb = etree.ETXPath("/a/{nsb}b")(doc)
+        self.assertEqual(1, len(in_nsb))
+        self.assertEqual('{nsb}b', in_nsb[0].tag)
+
+    # disabled (leading underscore keeps it out of test collection):
+    # non-ASCII characters in namespace URIs are not acceptable
+    def _test_xpath_compile_unicode(self):
+        doc = self.parse(_bytes('<a><b xmlns="http://nsa/\\uf8d2"/><b xmlns="http://nsb/\\uf8d1"/></a>'
+                                ).decode("unicode_escape"))
+
+        find = etree.ETXPath(_bytes("/a/{http://nsa/\\uf8d2}b").decode("unicode_escape"))
+        matches = find(doc)
+        self.assertEqual(1, len(matches))
+        self.assertEqual(_bytes('{http://nsa/\\uf8d2}b').decode("unicode_escape"), matches[0].tag)
+
+        find = etree.ETXPath(_bytes("/a/{http://nsb/\\uf8d1}b").decode("unicode_escape"))
+        matches = find(doc)
+        self.assertEqual(1, len(matches))
+        self.assertEqual(_bytes('{http://nsb/\\uf8d1}b').decode("unicode_escape"), matches[0].tag)
+
+SAMPLE_XML = etree.parse(BytesIO("""
+<body>
+  <tag>text</tag>
+  <section>
+    <tag>subtext</tag>
+  </section>
+  <tag />
+  <tag />
+</body>
+"""))  # parsed once at import time; the xpath() doctest below uses it as its document
+
+def tag(elem):  # helper for map(): the tag name of an element
+    return elem.tag
+
+def tag_or_value(elem):  # like tag(), but objects without a .tag attribute are returned unchanged
+    return getattr(elem, 'tag', elem)
+
+def stringTest(ctxt, s1):  # extension function: prefixes its string argument
+    return "Hello "+s1
+
+def stringListTest(ctxt, s1):  # extension function: the items of s1 framed by two strings
+    return ["Hello "] + list(s1) +  ["!"]
+    
+def floatTest(ctxt, f1):  # extension function: adds 4 to its argument
+    return f1+4
+
+def booleanTest(ctxt, b1):  # extension function: logical negation of its argument
+    return not b1
+    
+def setTest(ctxt, st1):  # extension function: first item of st1
+    return st1[0]
+    
+def setTest2(ctxt, st1):  # extension function: the first two items of st1
+    return st1[0:2]
+
+def argsTest1(ctxt, s, f, b, st):  # all four arguments as one comma separated string
+    return ", ".join([str(arg) for arg in (s, f, b, [tag(node) for node in st])])
+
+def argsTest2(ctxt, st1, st2):  # extension function: st1 extended by the items of st2
+    st1.extend(st2)  # modifies the st1 argument in place
+    return st1
+
+def resultTypesTest(ctxt):  # list of None values; the xpath() doctest expects XPathResultError for it
+    return [None,None]
+
+def resultTypesTest2(ctxt):  # returns a function object; the xpath() doctest expects XPathResultError for it
+    return resultTypesTest
+    
+uri = "http://www.example.com/"  # NOTE(review): not referenced in the visible part of this module
+
+extension = {(None, 'stringTest'): stringTest,  # function table: (namespace, name) -> callable, namespace None here
+             (None, 'stringListTest'): stringListTest,
+             (None, 'floatTest'): floatTest,
+             (None, 'booleanTest'): booleanTest,
+             (None, 'setTest'): setTest,
+             (None, 'setTest2'): setTest2,
+             (None, 'argsTest1'): argsTest1,
+             (None, 'argsTest2'): argsTest2,
+             (None, 'resultTypesTest'): resultTypesTest,
+             (None, 'resultTypesTest2'): resultTypesTest2,}
+
+def xpath():  # doctest carrier: has no body besides the docstring, which doctest.DocTestSuite() in test_suite() runs
+    """
+    Test xpath extension functions.
+    
+    >>> root = SAMPLE_XML
+    >>> e = etree.XPathEvaluator(root, extensions=[extension])
+    >>> e("stringTest('you')")
+    'Hello you'
+    >>> e(_bytes("stringTest('\\\\xe9lan')").decode("unicode_escape"))
+    u'Hello \\xe9lan'
+    >>> e("stringTest('you','there')")   #doctest: +ELLIPSIS
+    Traceback (most recent call last):
+    ...
+    TypeError: stringTest() takes... 2 ...arguments ...
+    >>> e("floatTest(2)")
+    6.0
+    >>> e("booleanTest(true())")
+    False
+    >>> list(map(tag, e("setTest(/body/tag)")))
+    ['tag']
+    >>> list(map(tag, e("setTest2(/body/*)")))
+    ['tag', 'section']
+    >>> list(map(tag_or_value, e("stringListTest(/body/tag)")))
+    ['Hello ', 'tag', 'tag', 'tag', '!']
+    >>> e("argsTest1('a',1.5,true(),/body/tag)")
+    "a, 1.5, True, ['tag', 'tag', 'tag']"
+    >>> list(map(tag, e("argsTest2(/body/tag, /body/section)")))
+    ['tag', 'section', 'tag', 'tag']
+    >>> e("resultTypesTest()")
+    Traceback (most recent call last):
+    ...
+    XPathResultError: This is not a supported node-set result: None
+    >>> try:
+    ...     e("resultTypesTest2()")
+    ... except etree.XPathResultError:
+    ...     print("Got error")
+    Got error
+    """
+
+if sys.version_info[0] >= 3:  # rewrite the expected doctest output for Python 3
+    xpath.__doc__ = xpath.__doc__.replace(" u'", " '")  # no u'' prefix in the expected repr
+    xpath.__doc__ = xpath.__doc__.replace(" XPathResultError",  # exception name is expected fully qualified
+                                          " lxml.etree.XPathResultError")
+    xpath.__doc__ = xpath.__doc__.replace(" exactly 2 arguments",  # NOTE(review): this text does not occur in the docstring (it uses ELLIPSIS), so this looks like a no-op
+                                          " exactly 2 positional arguments")
+
+def test_suite():
+    """Collect all XPath test cases plus the doctests into one suite."""
+    # unittest.makeSuite() was removed in Python 3.13; the default loader
+    # collects the same test_* methods and exists in every Python version
+    load = unittest.defaultTestLoader.loadTestsFromTestCase
+    cases = [ETreeXPathTestCase, ETreeXPathClassTestCase]
+    if etree.LIBXSLT_COMPILED_VERSION >= (1,1,25):
+        cases.append(ETreeXPathExsltTestCase)  # EXSLT tests need libxslt 1.1.25+
+    cases.append(ETreeETXPathClassTestCase)
+    suite = unittest.TestSuite([load(case) for case in cases])
+    suite.addTests([doctest.DocTestSuite(), make_doctest('../../../doc/xpathxslt.txt')])
+    return suite
+
+if __name__ == '__main__':  # direct execution runs no tests, it only prints a hint
+    print('to test use test.py %s' % __file__)
diff --git a/lib/lxml/tests/test_xslt.py b/lib/lxml/tests/test_xslt.py
new file mode 100644
index 00000000..4288dc28
--- /dev/null
+++ b/lib/lxml/tests/test_xslt.py
@@ -0,0 +1,1848 @@
+# -*- coding: utf-8 -*-
+
+"""
+Test cases related to XSLT processing
+"""
+
+import unittest, copy, sys, os.path
+
+this_dir = os.path.dirname(__file__)
+if this_dir not in sys.path:
+    sys.path.insert(0, this_dir) # needed for Py3
+
+is_python3 = sys.version_info[0] >= 3
+
+try:
+    unicode  # bare name lookup; raises NameError where the builtin does not exist
+except NameError: # Python 3
+    unicode = str
+
+try:
+    basestring  # same probe for the second name
+except NameError: # Python 3
+    basestring = str
+
+from common_imports import etree, BytesIO, HelperTestCase, fileInTestDir
+from common_imports import doctest, _bytes, _str, make_doctest, skipif
+
+class ETreeXSLTTestCase(HelperTestCase):
+    """XSLT tests etree"""
+        
+    def test_xslt(self):
+        # the template for "/" emits <foo> holding the text of /a/b
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>B</foo>
+''',
+                          str(transform(tree)))
+
+    def test_xslt_elementtree_error(self):
+        self.assertRaises(ValueError, etree.XSLT, etree.ElementTree())  # ElementTree created without a root element
+
+    def test_xslt_input_none(self):
+        self.assertRaises(TypeError, etree.XSLT, None)  # None is not accepted as stylesheet input
+
+    if False and etree.LIBXSLT_VERSION >= (1,1,15):  # NOTE(review): 'False and' switches this test off unconditionally
+        # earlier versions generate no error
+        if etree.LIBXSLT_VERSION > (1,1,17):
+            def test_xslt_invalid_stylesheet(self):
+                style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:stylesheet />
+</xsl:stylesheet>''')
+
+                self.assertRaises(
+                    etree.XSLTParseError, etree.XSLT, style)  # nested <xsl:stylesheet> is expected to fail compilation
+        
+    def test_xslt_copy(self):
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        # 1) the compiled stylesheet itself
+        transform = etree.XSLT(style)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>B</foo>
+''',
+                          str(transform(tree)))
+
+        # 2) a deep copy of the compiled stylesheet
+        transform_copy = copy.deepcopy(transform)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>B</foo>
+''',
+                          str(transform_copy(tree)))
+
+        # 3) a second compilation of the same stylesheet document
+        transform = etree.XSLT(style)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>B</foo>
+''',
+                          str(transform(tree)))
+
+    def test_xslt_utf8(self):
+        tree = self.parse(_bytes('<a><b>\\uF8D2</b><c>\\uF8D2</c></a>'
+                                 ).decode("unicode_escape"))
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:output encoding="UTF-8"/>
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        res = transform(tree)
+        expected = _bytes('''\
+<?xml version="1.0" encoding="UTF-8"?>
+<foo>\\uF8D2</foo>
+''').decode("unicode_escape")
+        # decode the serialised result with the codec named in xsl:output
+        if is_python3:
+            result = str(bytes(res), 'UTF-8')
+        else:
+            result = unicode(str(res), 'UTF-8')
+        self.assertEqual(expected, result)
+
+    def test_xslt_encoding(self):
+        tree = self.parse(_bytes('<a><b>\\uF8D2</b><c>\\uF8D2</c></a>'
+                                 ).decode("unicode_escape"))
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:output encoding="UTF-16"/>
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        res = transform(tree)
+        expected = _bytes('''\
+<?xml version="1.0" encoding="UTF-16"?>
+<foo>\\uF8D2</foo>
+''').decode("unicode_escape")
+        # decode the serialised result with the codec named in xsl:output
+        if is_python3:
+            result = str(bytes(res), 'UTF-16')
+        else:
+            result = unicode(str(res), 'UTF-16')
+        self.assertEqual(expected, result)
+
+    def test_xslt_encoding_override(self):
+        tree = self.parse(_bytes('<a><b>\\uF8D2</b><c>\\uF8D2</c></a>'
+                                 ).decode("unicode_escape"))
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:output encoding="UTF-8"/>
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        res = transform(tree)
+        expected = _bytes("""\
+<?xml version='1.0' encoding='UTF-16'?>\
+<foo>\\uF8D2</foo>""").decode("unicode_escape")
+
+        # write() is given UTF-16 although xsl:output asks for UTF-8
+        output = BytesIO()
+        res.write(output, encoding='UTF-16')
+        if is_python3:
+            decoded = str(output.getvalue(), 'UTF-16')
+        else:
+            decoded = unicode(str(output.getvalue()), 'UTF-16')
+        self.assertEqual(expected, decoded.replace('\n', ''))
+
+    def test_xslt_unicode(self):
+        # the unicode form has no encoding declaration despite xsl:output
+        tree = self.parse(_bytes('<a><b>\\uF8D2</b><c>\\uF8D2</c></a>'
+                                 ).decode("unicode_escape"))
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:output encoding="UTF-16"/>
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        res = transform(tree)
+        expected = _bytes('''\
+<?xml version="1.0"?>
+<foo>\\uF8D2</foo>
+''').decode("unicode_escape")
+        self.assertEqual(expected, unicode(res))
+
+    def test_xslt_unicode_standalone(self):
+        # standalone="no" is kept in the unicode form, the encoding is not
+        tree = self.parse(_bytes('<a><b>\\uF8D2</b><c>\\uF8D2</c></a>'
+        ).decode("unicode_escape"))
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:output encoding="UTF-16" standalone="no"/>
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        res = transform(tree)
+        expected = _bytes('''\
+<?xml version="1.0" standalone="no"?>
+<foo>\\uF8D2</foo>
+''').decode("unicode_escape")
+        self.assertEqual(expected, unicode(res))
+
+    def test_xslt_input(self):
+        # XSLT() takes the parsed tree as well as its root element
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+        from_tree = etree.XSLT(style)
+        from_root = etree.XSLT(style.getroot())
+
+    def test_xslt_input_partial_doc(self):
+        style = self.parse('''\
+<otherroot>
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>
+</otherroot>''')
+        # <otherroot> fails as tree and as element, its stylesheet child works
+        self.assertRaises(etree.XSLTParseError, etree.XSLT, style)
+        wrapper = style.getroot()
+        self.assertRaises(etree.XSLTParseError, etree.XSLT, wrapper)
+        from_child = etree.XSLT(wrapper[0])
+
+    def test_xslt_broken(self):
+        # the stylesheet holds an <xsl:foo /> element and must not compile
+        tree = self.parse('<a/>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+    <xsl:foo />
+</xsl:stylesheet>''')
+        self.assertRaises(etree.XSLTParseError, etree.XSLT, style)
+
+    def test_xslt_parameters(self):
+        # the keyword argument 'bar' supplies the value of $bar
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <foo><xsl:value-of select="$bar" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>Bar</foo>
+''',
+                          str(transform(tree, bar="'Bar'")))
+
+    def test_xslt_string_parameters(self):
+        # strparam() passes a text with both quote characters unchanged
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <foo><xsl:value-of select="$bar" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>it's me, "Bar"</foo>
+''',
+                          str(transform(tree, bar=etree.XSLT.strparam('''it's me, "Bar"'''))))
+
+    def test_xslt_parameter_invalid(self):
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:param name="bar"/>
+  <xsl:template match="/">
+    <foo><xsl:value-of select="$bar" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        # both parameter values must be rejected when the transform runs
+        for bad_value in ("<test/>", "...."):
+            self.assertRaises(etree.XSLTApplyError,
+                              transform, tree, bar=bad_value)
+
+    if etree.LIBXSLT_VERSION < (1,1,18):  # the test below is only defined for libxslt before 1.1.18
+        # later versions produce no error
+        def test_xslt_parameter_missing(self):
+            # apply() without needed parameter will lead to XSLTApplyError
+            tree = self.parse('<a><b>B</b><c>C</c></a>')
+            style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <foo><xsl:value-of select="$bar" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+            st = etree.XSLT(style)
+            self.assertRaises(etree.XSLTApplyError,
+                              st.apply, tree)  # $bar is used by the template but no value is passed
+
+    def test_xslt_multiple_parameters(self):
+        # each keyword argument fills the variable of the same name
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="$bar" /></foo>
+    <foo><xsl:value-of select="$baz" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>Bar</foo><foo>Baz</foo>
+''',
+                          str(transform(tree, bar="'Bar'", baz="'Baz'")))
+        
+    def test_xslt_parameter_xpath(self):
+        # an unquoted parameter string is evaluated as an XPath expression
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="$bar" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>B</foo>
+''',
+                          str(transform(tree, bar="/a/b/text()")))
+
+    def test_xslt_parameter_xpath_object(self):
+        # a compiled XPath object is accepted as parameter value, too
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="$bar" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>B</foo>
+''',
+                          str(transform(tree, bar=etree.XPath("/a/b/text()"))))
+        
+    def test_xslt_default_parameters(self):
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:param name="bar" select="'Default'" />
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="$bar" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        # a value passed by the caller replaces the declared default ...
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>Bar</foo>
+''',
+                          str(transform(tree, bar="'Bar'")))
+        # ... and the default is used when nothing is passed
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<foo>Default</foo>
+''',
+                          str(transform(tree)))
+        
+    def test_xslt_html_output(self):
+        # with method="html" the result has no XML declaration
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:output method="html"/>
+  <xsl:strip-space elements="*"/>
+  <xsl:template match="/">
+    <html><body><xsl:value-of select="/a/b/text()" /></body></html>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        transform = etree.XSLT(style)
+        html = str(transform(tree)).strip()
+        self.assertEqual('<html><body>B</body></html>', html)
+
+    def test_xslt_include(self):
+        stylesheet = etree.parse(fileInTestDir('test1.xslt'))
+        transform = etree.XSLT(stylesheet)  # passes if compiling the file does not raise
+
+    def test_xslt_include_from_filelike(self):
+        f = open(fileInTestDir('test1.xslt'), 'rb')  # opened in binary mode
+        tree = etree.parse(f)  # parse from the open file object instead of a path
+        f.close()  # NOTE(review): not reached if etree.parse() raises
+        st = etree.XSLT(tree)
+
+    def test_xslt_multiple_transforms(self):
+        xml = '<a/>'
+        xslt = '''\
+<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
+    <xsl:template match="/">
+        <response>Some text</response>
+    </xsl:template>
+</xsl:stylesheet>
+'''
+        # round one: parse both inputs, compile, apply, serialise
+        input_doc = self.parse(xml)
+        style_doc = self.parse(xslt)
+        transform = etree.XSLT(style_doc)
+        output = transform(input_doc)
+        etree.tostring(output.getroot())
+
+        # round two: the same steps again, rebinding the same names
+        input_doc = self.parse(xml)
+        style_doc = self.parse(xslt)
+        transform = etree.XSLT(style_doc)
+        output = transform(input_doc)
+        etree.tostring(output.getroot())
+
+    def test_xslt_repeat_transform(self):
+        xml = '<a/>'
+        xslt = '''\
+<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
+    <xsl:template match="/">
+        <response>Some text</response>
+    </xsl:template>
+</xsl:stylesheet>
+'''
+        input_doc = self.parse(xml)
+        style_doc = self.parse(xslt)
+        transform = etree.XSLT(style_doc)
+        output = transform(input_doc)
+        output = transform(input_doc)
+        etree.tostring(output.getroot())
+        output = transform(input_doc)
+        etree.tostring(output.getroot())
+        str(output)
+        # two results that are alive at the same time must serialise alike
+        first = transform(input_doc)
+        second = transform(input_doc)
+        self.assertEqual(str(first), str(second))
+        output = transform(input_doc)
+        str(output)
+
+    def test_xslt_empty(self):
+        # could segfault if result contains "empty document"
+        xml = '<blah/>'
+        xslt = '''
+        <xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
+          <xsl:template match="/" />
+        </xsl:stylesheet>
+        '''
+
+        input_doc = self.parse(xml)
+        style_doc = self.parse(xslt)
+        transform = etree.XSLT(style_doc)
+        # the only template is empty, so the result serialises to ''
+        self.assertEqual('', str(transform(input_doc)))
+
+    def test_xslt_message(self):
+        xml = '<blah/>'
+        xslt = '''
+        <xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
+          <xsl:template match="/">
+            <xsl:message>TEST TEST TEST</xsl:message>
+          </xsl:template>
+        </xsl:stylesheet>
+        '''
+
+        input_doc = self.parse(xml)
+        style_doc = self.parse(xslt)
+        transform = etree.XSLT(style_doc)
+        self.assertEqual('', str(transform(input_doc)))
+        # the xsl:message text has to show up in the transform's error log
+        messages = [entry.message for entry in transform.error_log]
+        self.assertTrue("TEST TEST TEST" in messages)
+
+    def test_xslt_message_terminate(self):
+        xml = '<blah/>'
+        xslt = '''
+        <xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
+          <xsl:template match="/">
+            <xsl:message terminate="yes">TEST TEST TEST</xsl:message>
+          </xsl:template>
+        </xsl:stylesheet>
+        '''
+
+        input_doc = self.parse(xml)
+        style_doc = self.parse(xslt)
+        transform = etree.XSLT(style_doc)
+        # terminate="yes" aborts the run, yet the text is still logged
+        self.assertRaises(etree.XSLTApplyError, transform, input_doc)
+        messages = [entry.message for entry in transform.error_log]
+        self.assertTrue("TEST TEST TEST" in messages)
+
+    def test_xslt_shortcut(self):
+        """Run a stylesheet with parameters through the tree's xslt() method."""
+        document = self.parse('<a><b>B</b><c>C</c></a>')
+        stylesheet = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <doc>
+    <foo><xsl:value-of select="$bar" /></foo>
+    <foo><xsl:value-of select="$baz" /></foo>
+    </doc>
+  </xsl:template>
+</xsl:stylesheet>''')
+        # note the nested quotes: the output contains the bare strings
+        transformed = document.xslt(stylesheet, bar="'Bar'", baz="'Baz'")
+        expected = _bytes('<doc><foo>Bar</foo><foo>Baz</foo></doc>')
+        self.assertEqual(expected, etree.tostring(transformed.getroot()))
+        
+    def test_multiple_elementrees(self):
+        """Transform several trees that wrap nodes of one document."""
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="a"><A><xsl:apply-templates/></A></xsl:template>
+  <xsl:template match="b"><B><xsl:apply-templates/></B></xsl:template>
+  <xsl:template match="c"><C><xsl:apply-templates/></C></xsl:template>
+</xsl:stylesheet>''')
+
+        source_xml = _bytes('<a><b>B</b><c>C</c></a>')
+        rootstring = self._rootstring
+
+        # transforming the complete tree must leave the input untouched
+        # (the same check is repeated after each transformation below)
+        self.assertEqual(rootstring(tree), source_xml)
+        result = tree.xslt(style)
+        self.assertEqual(rootstring(tree), source_xml)
+        self.assertEqual(rootstring(result), _bytes('<A><B>B</B><C>C</C></A>'))
+
+        # a tree rooted at <b> only covers that subtree: the result has
+        # <B> as its root element
+        b_tree = etree.ElementTree(tree.getroot()[0])
+        self.assertEqual(rootstring(b_tree), _bytes('<b>B</b>'))
+        result = b_tree.xslt(style)
+        self.assertEqual(rootstring(tree), source_xml)
+        self.assertEqual(rootstring(result), _bytes('<B>B</B>'))
+
+        # and likewise for a tree rooted at <c>
+        c_tree = etree.ElementTree(tree.getroot()[1])
+        self.assertEqual(rootstring(c_tree), _bytes('<c>C</c>'))
+        result = c_tree.xslt(style)
+        self.assertEqual(rootstring(tree), source_xml)
+        self.assertEqual(rootstring(result), _bytes('<C>C</C>'))
+
+    def test_xslt_document_XML(self):
+        """Make sure document('') works for stylesheets parsed from strings."""
+        transform = etree.XSLT(etree.XML("""\
+<xsl:stylesheet version="1.0"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <test>TEXT<xsl:copy-of select="document('')//test"/></test>
+  </xsl:template>
+</xsl:stylesheet>
+"""))
+        result = transform(etree.XML('<a/>'))
+        # the <test> element of the stylesheet itself, including its
+        # xsl:copy-of child, must end up inside the generated <test>
+        outer = result.getroot()
+        self.assertEqual(outer.tag, 'test')
+        inner = outer[0]
+        self.assertEqual(inner.tag, 'test')
+        self.assertEqual(inner.text, 'TEXT')
+        copy_of_tag = '{http://www.w3.org/1999/XSL/Transform}copy-of'
+        self.assertEqual(inner[0].tag, copy_of_tag)
+
+    def test_xslt_document_parse(self):
+        """Make sure document('') works for stylesheets loaded from files."""
+        transform = etree.XSLT(etree.parse(fileInTestDir("test-document.xslt")))
+        result = transform(etree.XML('<a/>'))
+        output_root = result.getroot()
+        self.assertEqual(output_root.tag, 'test')
+        # the first child must be an xsl:stylesheet element
+        stylesheet_tag = '{http://www.w3.org/1999/XSL/Transform}stylesheet'
+        self.assertEqual(output_root[0].tag, stylesheet_tag)
+
+    def test_xslt_document_elementtree(self):
+        """Make sure document('') works for ElementTree(file=...) stylesheets."""
+        stylesheet = etree.ElementTree(file=fileInTestDir("test-document.xslt"))
+        transform = etree.XSLT(stylesheet)
+        result = transform(etree.XML('<a/>'))
+        output_root = result.getroot()
+        self.assertEqual(output_root.tag, 'test')
+        stylesheet_tag = '{http://www.w3.org/1999/XSL/Transform}stylesheet'
+        self.assertEqual(output_root[0].tag, stylesheet_tag)
+
+    def test_xslt_document_error(self):
+        transform = etree.XSLT(etree.XML("""\
+<xsl:stylesheet version="1.0"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <test>TEXT<xsl:copy-of select="document('uri:__junkfood__is__evil__')//test"/></test>
+  </xsl:template>
+</xsl:stylesheet>
+"""))  # document() is given a junk URI, so applying the stylesheet must fail
+        self.assertRaises(etree.XSLTApplyError, transform, etree.XML('<a/>'))
+
+    def test_xslt_document_XML_resolver(self):
+        """Make sure document('') works when custom resolvers are in use.
+
+        The resolver itself must be called once, for 'file://ANYTHING'.
+        """
+        check_equal = self.assertEqual
+        calls = {'count' : 0}
+
+        class TestResolver(etree.Resolver):
+            # answers the one expected URL with a dummy document
+            def resolve(self, url, id, context):
+                check_equal(url, 'file://ANYTHING')
+                calls['count'] += 1
+                return self.resolve_string('<CALLED/>', context)
+
+        parser = etree.XMLParser()
+        parser.resolvers.add(TestResolver())
+
+        transform = etree.XSLT(etree.XML(_bytes("""\
+<xsl:stylesheet version="1.0"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+   xmlns:l="local">
+  <xsl:template match="/">
+    <test>
+      <xsl:for-each select="document('')//l:data/l:entry">
+        <xsl:copy-of select="document('file://ANYTHING')"/>
+        <xsl:copy>
+          <xsl:attribute name="value">
+            <xsl:value-of select="."/>
+          </xsl:attribute>
+        </xsl:copy>
+      </xsl:for-each>
+    </test>
+  </xsl:template>
+  <l:data>
+    <l:entry>A</l:entry>
+    <l:entry>B</l:entry>
+  </l:data>
+</xsl:stylesheet>
+"""), parser))
+
+        # nothing is resolved before the stylesheet actually runs
+        self.assertEqual(calls['count'], 0)
+        result = transform(etree.XML('<a/>'))
+        self.assertEqual(calls['count'], 1)
+
+        root = result.getroot()
+        self.assertEqual(root.tag, 'test')
+        self.assertEqual(len(root), 4)
+
+        # each l:entry yields the resolver's document followed by a copy
+        # of the entry that carries its text in the "value" attribute
+        expected_values = ('A', 'B')
+        for position, value in enumerate(expected_values):
+            called_el = root[2 * position]
+            entry_el = root[2 * position + 1]
+
+            self.assertEqual(called_el.tag, 'CALLED')
+            self.assertEqual(entry_el.tag, '{local}entry')
+            self.assertEqual(entry_el.text, None)
+            self.assertEqual(entry_el.get("value"), value)
+
+    def test_xslt_resolver_url_building(self):
+        """Check the URLs that document('test.xml') hands to a resolver.
+
+        The relative reference is expected to be combined with the base
+        URL of the stylesheet if there is one, and to be passed on
+        unchanged otherwise.
+        """
+        check_equal = self.assertEqual
+        calls = {'count' : 0}
+        expected_url = None
+
+        class TestResolver(etree.Resolver):
+            # 'expected_url' is looked up in the enclosing scope on each
+            # call, so rebinding it below changes what is checked here
+            def resolve(self, url, id, context):
+                check_equal(url, expected_url)
+                calls['count'] += 1
+                return self.resolve_string('<CALLED/>', context)
+
+        stylesheet_xml = _bytes("""\
+<xsl:stylesheet version="1.0"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+   xmlns:l="local">
+  <xsl:template match="/">
+    <xsl:copy-of select="document('test.xml')"/>
+  </xsl:template>
+</xsl:stylesheet>
+""")
+
+        parser = etree.XMLParser()
+        parser.resolvers.add(TestResolver())
+
+        def check_single_call(transform):
+            # building the XSLT object must not have resolved anything;
+            # running it must resolve exactly one document
+            self.assertEqual(calls['count'], 0)
+            transform(etree.XML('<a/>'))
+            self.assertEqual(calls['count'], 1)
+
+        # test without base_url => relative path only
+        expected_url = 'test.xml'
+        check_single_call(etree.XSLT(etree.XML(stylesheet_xml, parser)))
+
+        # now the same thing with a stylesheet base URL on the filesystem
+        calls['count'] = 0
+        expected_url = 'MY/BASE/test.xml'  # seems to be the same on Windows
+        fs_base = os.path.join('MY', 'BASE', 'FILE')
+        check_single_call(
+            etree.XSLT(etree.XML(stylesheet_xml, parser, base_url=fs_base)))
+
+        # now the same thing with a stylesheet base URL
+        calls['count'] = 0
+        expected_url = 'http://server.com/BASE/DIR/test.xml'
+        http_base = 'http://server.com/BASE/DIR/FILE'
+        check_single_call(
+            etree.XSLT(etree.XML(stylesheet_xml, parser, base_url=http_base)))
+
+        # now the same thing with a stylesheet base file:// URL
+        calls['count'] = 0
+        expected_url = 'file://BASE/DIR/test.xml'
+        file_base = 'file://BASE/DIR/FILE'
+        check_single_call(
+            etree.XSLT(etree.XML(stylesheet_xml, parser, base_url=file_base)))
+
+    def test_xslt_document_parse_allow(self):
+        """Transform with file read access explicitly allowed."""
+        stylesheet = etree.parse(fileInTestDir("test-document.xslt"))
+        read_allowed = etree.XSLTAccessControl(read_file=True)
+        transform = etree.XSLT(stylesheet, access_control=read_allowed)
+        result = transform(etree.XML('<a/>'))
+        output_root = result.getroot()
+        self.assertEqual(output_root.tag, 'test')
+        stylesheet_tag = '{http://www.w3.org/1999/XSL/Transform}stylesheet'
+        self.assertEqual(output_root[0].tag, stylesheet_tag)
+
+    def test_xslt_document_parse_deny(self):
+        """Transforming must fail when file read access is denied."""
+        transform = etree.XSLT(etree.parse(fileInTestDir("test-document.xslt")),
+                               access_control=etree.XSLTAccessControl(read_file=False))
+        self.assertRaises(etree.XSLTApplyError, transform, etree.XML('<a/>'))
+
+    def test_xslt_document_parse_deny_all(self):
+        """Transforming must fail under the DENY_ALL access control."""
+        transform = etree.XSLT(etree.parse(fileInTestDir("test-document.xslt")),
+                               access_control=etree.XSLTAccessControl.DENY_ALL)
+        self.assertRaises(etree.XSLTApplyError, transform, etree.XML('<a/>'))
+
+    def test_xslt_access_control_repr(self):
+        """The repr() names the class, is stable and reflects the settings."""
+        deny_all = etree.XSLTAccessControl.DENY_ALL
+        deny_all_repr = repr(deny_all)
+        self.assertTrue(deny_all_repr.startswith(type(deny_all).__name__))
+        self.assertEqual(deny_all_repr, repr(deny_all))
+        self.assertNotEqual(deny_all_repr, repr(etree.XSLTAccessControl.DENY_WRITE))
+        self.assertNotEqual(deny_all_repr, repr(etree.XSLTAccessControl()))
+
+    def test_xslt_move_result(self):
+        """Move the children of a result tree into the source tree."""
+        source_root = etree.XML(_bytes('''\
+        <transform>
+          <widget displayType="fieldset"/>
+        </transform>'''))
+
+        transform = etree.XSLT(etree.XML(_bytes('''\
+        <xsl:stylesheet version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+          <xsl:output method="html" indent="no"/>
+          <xsl:template match="/">
+            <html>
+              <xsl:apply-templates/>
+            </html>
+          </xsl:template>
+
+          <xsl:template match="widget">
+            <xsl:element name="{@displayType}"/>
+          </xsl:template>
+
+        </xsl:stylesheet>''')))
+        transformed = transform(source_root[0])
+        source_root[:] = transformed.getroot()[:]
+        del source_root  # dropping the tree at this point used to segfault
+        
+    def test_xslt_pi(self):
+        """Load the stylesheet that an xml-stylesheet PI points to."""
+        tree = self.parse('''\
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/xsl" href="%s"?>
+<a>
+  <b>B</b>
+  <c>C</c>
+</a>''' % fileInTestDir("test1.xslt"))
+        stylesheet_pi = tree.getroot().getprevious()
+        self.assertEqual("{http://www.w3.org/1999/XSL/Transform}stylesheet",
+                         stylesheet_pi.parseXSL().getroot().tag)
+
+    def test_xslt_pi_embedded_xmlid(self):
+        """Find an embedded stylesheet through the xml:id dictionary lookup."""
+        tree = self.parse('''\
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/xsl" href="#style"?>
+<a>
+  <b>B</b>
+  <c>C</c>
+  <xsl:stylesheet version="1.0" xml:id="style"
+      xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+    <xsl:template match="*" />
+    <xsl:template match="/">
+      <foo><xsl:value-of select="/a/b/text()" /></foo>
+    </xsl:template>
+  </xsl:stylesheet>
+</a>''')
+        # href="#style" refers to the xsl:stylesheet element inside <a>
+        stylesheet_pi = tree.getroot().getprevious()
+        style_root = stylesheet_pi.parseXSL().getroot()
+        self.assertEqual("{http://www.w3.org/1999/XSL/Transform}stylesheet",
+                         style_root.tag)
+
+        transform = etree.XSLT(style_root)
+        expected = '''\
+<?xml version="1.0"?>
+<foo>B</foo>
+'''
+        self.assertEqual(expected, str(transform(tree)))
+
+    def test_xslt_pi_embedded_id(self):
+        """Find an embedded stylesheet through the XPath lookup mechanism."""
+        tree = self.parse('''\
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/xsl" href="#style"?>
+<a>
+  <b>B</b>
+  <c>C</c>
+</a>''')
+
+        style = self.parse('''\
+<xsl:stylesheet version="1.0" xml:id="style"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>
+''')
+
+        # the stylesheet is only appended after the document was parsed
+        tree.getroot().append(style.getroot())
+        stylesheet_pi = tree.getroot().getprevious()
+        style_root = stylesheet_pi.parseXSL().getroot()
+        self.assertEqual("{http://www.w3.org/1999/XSL/Transform}stylesheet",
+                         style_root.tag)
+
+        transform = etree.XSLT(style_root)
+        expected = '''\
+<?xml version="1.0"?>
+<foo>B</foo>
+'''
+        self.assertEqual(expected, str(transform(tree)))
+
+    def test_xslt_pi_get(self):
+        """Read the href pseudo-attribute of an xml-stylesheet PI."""
+        tree = self.parse('''\
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/xsl" href="TEST"?>
+<a>
+  <b>B</b>
+  <c>C</c>
+</a>''')
+        stylesheet_pi = tree.getroot().getprevious()
+        self.assertEqual("TEST", stylesheet_pi.get("href"))
+
+    def test_xslt_pi_get_all(self):
+        """Read known and unknown pseudo-attributes of an xml-stylesheet PI."""
+        tree = self.parse('''\
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/xsl" href="TEST"?>
+<a>
+  <b>B</b>
+  <c>C</c>
+</a>''')
+        stylesheet_pi = tree.getroot().getprevious()
+        expected = (("href", "TEST"), ("type", "text/xsl"), ("motz", None))
+        for name, value in expected:
+            self.assertEqual(value, stylesheet_pi.get(name))
+
+    def test_xslt_pi_get_all_reversed(self):
+        """Read the pseudo-attributes when href is written before type."""
+        tree = self.parse('''\
+<?xml version="1.0"?>
+<?xml-stylesheet href="TEST" type="text/xsl"?>
+<a>
+  <b>B</b>
+  <c>C</c>
+</a>''')
+        stylesheet_pi = tree.getroot().getprevious()
+        expected = (("href", "TEST"), ("type", "text/xsl"), ("motz", None))
+        for name, value in expected:
+            self.assertEqual(value, stylesheet_pi.get(name))
+
+    def test_xslt_pi_get_unknown(self):
+        """Asking the PI for an unknown pseudo-attribute returns None."""
+        tree = self.parse('''\
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/xsl" href="TEST"?>
+<a>
+  <b>B</b>
+  <c>C</c>
+</a>''')
+        stylesheet_pi = tree.getroot().getprevious()
+        self.assertEqual(None, stylesheet_pi.get("unknownattribute"))
+
+    def test_xslt_pi_set_replace(self):
+        """Overwrite the existing href pseudo-attribute of the PI."""
+        tree = self.parse('''\
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/xsl" href="TEST"?>
+<a>
+  <b>B</b>
+  <c>C</c>
+</a>''')
+        stylesheet_pi = tree.getroot().getprevious()
+        self.assertEqual("TEST", stylesheet_pi.get("href"))
+
+        stylesheet_pi.set("href", "TEST123")
+        self.assertEqual("TEST123", stylesheet_pi.get("href"))
+
+    def test_xslt_pi_set_new(self):
+        """Add an href pseudo-attribute to a PI that does not have one."""
+        tree = self.parse('''\
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/xsl"?>
+<a>
+  <b>B</b>
+  <c>C</c>
+</a>''')
+        stylesheet_pi = tree.getroot().getprevious()
+        self.assertEqual(None, stylesheet_pi.get("href"))
+
+        stylesheet_pi.set("href", "TEST")
+        self.assertEqual("TEST", stylesheet_pi.get("href"))
+
+class ETreeEXSLTTestCase(HelperTestCase):
+    """Tests for the EXSLT string, math and regular expression functions."""
+
+    def test_exslt_str(self):
+        """Pad the text of each node with str:align()."""
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:str="http://exslt.org/strings"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    exclude-result-prefixes="str xsl">
+  <xsl:template match="text()">
+    <xsl:value-of select="str:align(string(.), '***', 'center')" />
+  </xsl:template>
+  <xsl:template match="*">
+    <xsl:copy>
+      <xsl:apply-templates/>
+    </xsl:copy>
+  </xsl:template>
+</xsl:stylesheet>''')
+        st = etree.XSLT(style)
+        res = st(tree)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<a><b>*B*</b><c>*C*</c></a>
+''',
+                          str(res))
+
+    if etree.LIBXSLT_VERSION >= (1, 1, 21):  # test is only defined for 1.1.21+
+        def test_exslt_str_attribute_replace(self):
+            """Use str:replace() inside an attribute value template."""
+            tree = self.parse('<a><b>B</b><c>C</c></a>')
+            style = self.parse('''\
+      <xsl:stylesheet version = "1.0"
+          xmlns:xsl='http://www.w3.org/1999/XSL/Transform'
+          xmlns:str="http://exslt.org/strings"
+          extension-element-prefixes="str">
+
+          <xsl:template match="/">
+            <h1 class="{str:replace('abc', 'b', 'x')}">test</h1>
+          </xsl:template>
+
+      </xsl:stylesheet>''')
+            st = etree.XSLT(style)
+            res = st(tree)
+            self.assertEqual('''\
+<?xml version="1.0"?>
+<h1 class="axc">test</h1>
+''',
+                              str(res))
+
+    def test_exslt_math(self):
+        """Evaluate math:constant('PI', ...) with different precisions."""
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:math="http://exslt.org/math"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    exclude-result-prefixes="math xsl">
+  <xsl:template match="*">
+    <xsl:copy>
+      <xsl:attribute name="pi">
+        <xsl:value-of select="math:constant('PI', count(*)+2)"/>
+      </xsl:attribute>
+      <xsl:apply-templates/>
+    </xsl:copy>
+  </xsl:template>
+</xsl:stylesheet>''')
+        st = etree.XSLT(style)
+        res = st(tree)
+        self.assertEqual('''\
+<?xml version="1.0"?>
+<a pi="3.14"><b pi="3">B</b><c pi="3">C</c></a>
+''',
+                          str(res))
+
+    def test_exslt_regexp_test(self):
+        """Filter child elements with regexp:test()."""
+        xslt = etree.XSLT(etree.XML(_bytes("""\
+<xsl:stylesheet version="1.0"
+   xmlns:regexp="http://exslt.org/regular-expressions"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*">
+    <test><xsl:copy-of select="*[regexp:test(string(.), '8.')]"/></test>
+  </xsl:template>
+</xsl:stylesheet>
+""")))
+        result = xslt(etree.XML(_bytes('<a><b>123</b><b>098</b><b>987</b></a>')))
+        root = result.getroot()
+
+        self.assertEqual(root.tag, 'test')
+        # only '987' contains an '8' that is followed by another character
+        self.assertEqual(len(root), 1)
+        self.assertEqual(root[0].tag, 'b')
+        self.assertEqual(root[0].text, '987')
+
+    def test_exslt_regexp_replace(self):
+        """Run regexp:replace() without flags and with the 'gi' flags."""
+        xslt = etree.XSLT(etree.XML("""\
+<xsl:stylesheet version="1.0"
+   xmlns:regexp="http://exslt.org/regular-expressions"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*">
+    <test>
+      <xsl:copy-of select="regexp:replace(string(.), 'd.', '',   'XX')"/>
+      <xsl:text>-</xsl:text>
+      <xsl:copy-of select="regexp:replace(string(.), 'd.', 'gi', 'XX')"/>
+    </test>
+  </xsl:template>
+</xsl:stylesheet>
+"""))
+        result = xslt(etree.XML(_bytes('<a>abdCdEeDed</a>')))
+        root = result.getroot()
+        self.assertEqual(root.tag, 'test')
+        self.assertEqual(len(root), 0)
+        self.assertEqual(root.text, 'abXXdEeDed-abXXXXeXXd')
+
+    def test_exslt_regexp_match(self):
+        """Run regexp:match() without flags, with 'g' and with 'gi'."""
+        xslt = etree.XSLT(etree.XML("""\
+<xsl:stylesheet version="1.0"
+   xmlns:regexp="http://exslt.org/regular-expressions"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*">
+    <test>
+      <test1><xsl:copy-of  select="regexp:match(string(.), 'd.')"/></test1>
+      <test2><xsl:copy-of  select="regexp:match(string(.), 'd.', 'g')"/></test2>
+      <test2i><xsl:copy-of select="regexp:match(string(.), 'd.', 'gi')"/></test2i>
+    </test>
+  </xsl:template>
+</xsl:stylesheet>
+"""))
+        result = xslt(etree.XML(_bytes('<a>abdCdEeDed</a>')))
+        root = result.getroot()
+        self.assertEqual(root.tag,  'test')
+        self.assertEqual(len(root), 3)
+        self.assertEqual(len(root[0]), 1)
+        self.assertEqual(root[0][0].tag, 'match')
+        self.assertEqual(root[0][0].text, 'dC')
+        # 'g' is expected to return every case-sensitive match
+        self.assertEqual(len(root[1]), 2)
+        self.assertEqual(root[1][0].tag, 'match')
+        self.assertEqual(root[1][0].text, 'dC')
+        self.assertEqual(root[1][1].tag, 'match')
+        self.assertEqual(root[1][1].text, 'dE')
+        # 'gi' is expected to additionally find the upper case 'De'
+        self.assertEqual(len(root[2]), 3)
+        self.assertEqual(root[2][0].tag, 'match')
+        self.assertEqual(root[2][0].text, 'dC')
+        self.assertEqual(root[2][1].tag, 'match')
+        self.assertEqual(root[2][1].text, 'dE')
+        self.assertEqual(root[2][2].tag, 'match')
+        self.assertEqual(root[2][2].text, 'De')
+
+    def test_exslt_regexp_match_groups(self):
+        """Check that regexp:match() returns the full match and its groups."""
+        xslt = etree.XSLT(etree.XML(_bytes("""\
+<xsl:stylesheet version="1.0"
+   xmlns:regexp="http://exslt.org/regular-expressions"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <test>
+      <xsl:for-each select="regexp:match(
+            '123abc567', '([0-9]+)([a-z]+)([0-9]+)' )">
+        <test1><xsl:value-of select="."/></test1>
+      </xsl:for-each>
+    </test>
+  </xsl:template>
+</xsl:stylesheet>
+""")))
+        result = xslt(etree.XML(_bytes('<a/>')))
+        root = result.getroot()
+        self.assertEqual(root.tag,  'test')
+        self.assertEqual(len(root), 4)
+        self.assertEqual(root[0].text, "123abc567")
+        self.assertEqual(root[1].text, "123")
+        self.assertEqual(root[2].text, "abc")
+        self.assertEqual(root[3].text, "567")
+
+    def test_exslt_regexp_match1(self):
+        """Split a URL into its parts with regexp:match()."""
+        # taken from http://www.exslt.org/regexp/functions/match/index.html
+        xslt = etree.XSLT(etree.XML(_bytes("""\
+<xsl:stylesheet version="1.0"
+   xmlns:regexp="http://exslt.org/regular-expressions"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <test>
+      <xsl:for-each select="regexp:match(
+            'http://www.bayes.co.uk/xml/index.xml?/xml/utils/rechecker.xml',
+            '(\\w+):\\/\\/([^/:]+)(:\\d*)?([^# ]*)')">
+        <test1><xsl:value-of select="."/></test1>
+      </xsl:for-each>
+    </test>
+  </xsl:template>
+</xsl:stylesheet>
+""")))
+        result = xslt(etree.XML(_bytes('<a/>')))
+        root = result.getroot()
+        self.assertEqual(root.tag,  'test')
+        self.assertEqual(len(root), 5)
+
+        # the complete match comes first, followed by one node for each
+        # of the four groups of the expression
+        self.assertEqual(
+            root[0].text,
+            "http://www.bayes.co.uk/xml/index.xml?/xml/utils/rechecker.xml")
+        self.assertEqual(root[1].text, "http")
+        self.assertEqual(root[2].text, "www.bayes.co.uk")
+        # the optional port group matched nothing
+        self.assertFalse(root[3].text)
+        self.assertEqual(
+            root[4].text,
+            "/xml/index.xml?/xml/utils/rechecker.xml")
+
+    def test_exslt_regexp_match2(self):
+        """Split a sentence into words with regexp:match() and 'g'."""
+        # taken from http://www.exslt.org/regexp/functions/match/index.html
+        xslt = etree.XSLT(self.parse("""\
+<xsl:stylesheet version="1.0"
+   xmlns:regexp="http://exslt.org/regular-expressions"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <test>
+      <xsl:for-each select="regexp:match(
+            'This is a test string', '(\\w+)', 'g')">
+        <test1><xsl:value-of select="."/></test1>
+      </xsl:for-each>
+    </test>
+  </xsl:template>
+</xsl:stylesheet>
+"""))
+        result = xslt(etree.XML(_bytes('<a/>')))
+        root = result.getroot()
+        self.assertEqual(root.tag,  'test')
+        self.assertEqual(len(root), 5)
+        self.assertEqual(root[0].text, "This")
+        self.assertEqual(root[1].text, "is")
+        self.assertEqual(root[2].text, "a")
+        self.assertEqual(root[3].text, "test")
+        self.assertEqual(root[4].text, "string")
+
+    def _test_exslt_regexp_match3(self):
+        """Match a repeated group with 'g' (disabled: THIS IS NOT SUPPORTED!)."""
+        # taken from http://www.exslt.org/regexp/functions/match/index.html
+        xslt = etree.XSLT(etree.XML(_bytes("""\
+<xsl:stylesheet version="1.0"
+   xmlns:regexp="http://exslt.org/regular-expressions"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <test>
+      <xsl:for-each select="regexp:match(
+            'This is a test string', '([a-z])+ ', 'g')">
+        <test1><xsl:value-of select="."/></test1>
+      </xsl:for-each>
+    </test>
+  </xsl:template>
+</xsl:stylesheet>
+""")))
+        result = xslt(etree.XML(_bytes('<a/>')))
+        root = result.getroot()
+        self.assertEqual(root.tag,  'test')
+        self.assertEqual(len(root), 4)
+
+        self.assertEqual(root[0].text, "his")
+        self.assertEqual(root[1].text, "is")
+        self.assertEqual(root[2].text, "a")
+        self.assertEqual(root[3].text, "test")
+
+    def _test_exslt_regexp_match4(self):
+        """Match a repeated group with 'gi' (disabled: THIS IS NOT SUPPORTED!)."""
+        # taken from http://www.exslt.org/regexp/functions/match/index.html
+        xslt = etree.XSLT(etree.XML(_bytes("""\
+<xsl:stylesheet version="1.0"
+   xmlns:regexp="http://exslt.org/regular-expressions"
+   xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="/">
+    <test>
+      <xsl:for-each select="regexp:match(
+            'This is a test string', '([a-z])+ ', 'gi')">
+        <test1><xsl:value-of select="."/></test1>
+      </xsl:for-each>
+    </test>
+  </xsl:template>
+</xsl:stylesheet>
+""")))
+        result = xslt(etree.XML(_bytes('<a/>')))
+        root = result.getroot()
+        self.assertEqual(root.tag,  'test')
+        self.assertEqual(len(root), 4)
+
+        self.assertEqual(root[0].text, "This")
+        self.assertEqual(root[1].text, "is")
+        self.assertEqual(root[2].text, "a")
+        self.assertEqual(root[3].text, "test")
+
+
+class ETreeXSLTExtFuncTestCase(HelperTestCase):
+    """Tests for XPath extension functions in XSLT."""
+
+    def test_extensions1(self):
+        """Call an extension function that is passed to xslt() directly."""
+        document = self.parse('<a><b>B</b></a>')
+        stylesheet = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    exclude-result-prefixes="myns">
+  <xsl:template match="a"><A><xsl:value-of select="myns:mytext(b)"/></A></xsl:template>
+</xsl:stylesheet>''')
+        def mytext(ctxt, values):
+            return 'X' * len(values)
+
+        extensions = {('testns', 'mytext') : mytext}
+        transformed = document.xslt(stylesheet, extensions)
+        self.assertEqual(self._rootstring(transformed), _bytes('<A>X</A>'))
+
+    def test_extensions2(self):
+        """Call an extension function registered in a FunctionNamespace."""
+        document = self.parse('<a><b>B</b></a>')
+        stylesheet = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    exclude-result-prefixes="myns">
+  <xsl:template match="a"><A><xsl:value-of select="myns:mytext(b)"/></A></xsl:template>
+</xsl:stylesheet>''')
+        def mytext(ctxt, values):
+            return 'X' * len(values)
+
+        # nothing is passed to xslt() below; the function is registered here
+        registry = etree.FunctionNamespace('testns')
+        registry['mytext'] = mytext
+
+        transformed = document.xslt(stylesheet)
+        self.assertEqual(self._rootstring(transformed), _bytes('<A>X</A>'))
+
+    def test_variable_result_tree_fragment(self):
+        """Pass a result tree fragment variable to an extension function."""
+        document = self.parse('<a><b>B</b><b/></a>')
+        stylesheet = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    exclude-result-prefixes="myns">
+  <xsl:template match="a">
+    <xsl:variable name="content">
+       <xsl:apply-templates/>
+    </xsl:variable>
+    <A><xsl:value-of select="myns:mytext($content)"/></A>
+  </xsl:template>
+  <xsl:template match="b"><xsl:copy>BBB</xsl:copy></xsl:template>
+</xsl:stylesheet>''')
+
+        def mytext(ctxt, values):
+            for node in values:
+                is_element = hasattr(node, 'tag')
+                self.assertTrue(is_element, "%s is not an Element" % type(node))
+                self.assertEqual(node.tag, 'b')
+                self.assertEqual(node.text, 'BBB')
+            return 'X'.join([node.tag for node in values])
+
+        registry = etree.FunctionNamespace('testns')
+        registry['mytext'] = mytext
+
+        transformed = document.xslt(stylesheet)
+        self.assertEqual(self._rootstring(transformed), _bytes('<A>bXb</A>'))
+
+
+class ETreeXSLTExtElementTestCase(HelperTestCase):
+    """Tests for extension elements in XSLT."""
+
+    def test_extension_element(self):
+        """Let an extension element append a new element to the output."""
+        document = self.parse('<a><b>B</b></a>')
+        stylesheet = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns"
+    exclude-result-prefixes="myns">
+  <xsl:template match="a">
+    <A><myns:myext>b</myns:myext></A>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                # the text of the extension element names the new child
+                new_child = etree.Element(self_node.text)
+                new_child.text = 'X'
+                output_parent.append(new_child)
+
+        handlers = {('testns', 'myext'): MyExt()}
+        transformed = document.xslt(stylesheet, extensions=handlers)
+        self.assertEqual(self._rootstring(transformed), _bytes('<A><b>X</b></A>'))
+
+    def test_extension_element_doc_context(self):
+        """Run an extension element from a template that matches "/"."""
+        document = self.parse('<a><b>B</b></a>')
+        stylesheet = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns"
+    exclude-result-prefixes="myns">
+  <xsl:template match="/">
+    <A><myns:myext>b</myns:myext></A>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        seen_tags = []
+
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                seen_tags.append(input_node.tag)
+
+        handlers = {('testns', 'myext'): MyExt()}
+        result = document.xslt(stylesheet, extensions=handlers)
+        self.assertEqual(seen_tags, ['a'])
+
+    def test_extension_element_comment_pi_context(self):
+        """Run an extension element with comments and PIs as input nodes."""
+        document = self.parse('<?test toast?><a><!--a comment--><?another pi?></a>')
+        stylesheet = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns"
+    exclude-result-prefixes="myns">
+  <xsl:template match="/">
+    <ROOT><xsl:apply-templates /></ROOT>
+  </xsl:template>
+  <xsl:template match="comment()">
+    <A><myns:myext>b</myns:myext></A>
+  </xsl:template>
+  <xsl:template match="processing-instruction()">
+    <A><myns:myext>b</myns:myext></A>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        seen_text = []
+
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                seen_text.append(input_node.text)
+
+        handlers = {('testns', 'myext'): MyExt()}
+        result = document.xslt(stylesheet, extensions=handlers)
+        self.assertEqual(seen_text, ['toast', 'a comment', 'pi'])
+
+    def _test_extension_element_attribute_context(self):
+        """Disabled: attribute context nodes are currently not supported."""
+        document = self.parse('<a test="A"><b attr="B"/></a>')
+        stylesheet = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns"
+    exclude-result-prefixes="myns">
+  <xsl:template match="@test">
+    <A><myns:myext>b</myns:myext></A>
+  </xsl:template>
+  <xsl:template match="@attr">
+    <A><myns:myext>b</myns:myext></A>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        seen_values = []
+
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, attr_value, output_parent):
+                seen_values.append(attr_value)
+
+        handlers = {('testns', 'myext'): MyExt()}
+
+        result = document.xslt(stylesheet, extensions=handlers)
+        self.assertEqual(seen_values, ['A', 'B'])
+
+    def test_extension_element_content(self):
+        tree = self.parse('<a><b>B</b></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <A><myns:myext><x>X</x><y>Y</y><z/></myns:myext></A>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                output_parent.extend(list(self_node)[1:])
+
+        extensions = { ('testns', 'myext') : MyExt() }
+
+        result = tree.xslt(style, extensions=extensions)
+        self.assertEqual(self._rootstring(result),
+                          _bytes('<A><y>Y</y><z/></A>'))
+
+    def test_extension_element_apply_templates(self):
+        tree = self.parse('<a><b>B</b></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <A><myns:myext><x>X</x><y>Y</y><z/></myns:myext></A>
+  </xsl:template>
+  <xsl:template match="x" />
+  <xsl:template match="z">XYZ</xsl:template>
+</xsl:stylesheet>''')
+
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                for child in self_node:
+                    for result in self.apply_templates(context, child):
+                        if isinstance(result, basestring):
+                            el = etree.Element("T")
+                            el.text = result
+                        else:
+                            el = result
+                        output_parent.append(el)
+
+        extensions = { ('testns', 'myext') : MyExt() }
+
+        result = tree.xslt(style, extensions=extensions)
+        self.assertEqual(self._rootstring(result),
+                          _bytes('<A><T>Y</T><T>XYZ</T></A>'))
+
+    def test_extension_element_apply_templates_elements_only(self):
+        tree = self.parse('<a><b>B</b></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <A><myns:myext><x>X</x><y>Y</y><z/></myns:myext></A>
+  </xsl:template>
+  <xsl:template match="x"><X/></xsl:template>
+  <xsl:template match="z">XYZ</xsl:template>
+</xsl:stylesheet>''')
+
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                for child in self_node:
+                    for result in self.apply_templates(context, child,
+                                                       elements_only=True):
+                        assert not isinstance(result, basestring)
+                        output_parent.append(result)
+
+        extensions = { ('testns', 'myext') : MyExt() }
+
+        result = tree.xslt(style, extensions=extensions)
+        self.assertEqual(self._rootstring(result),
+                          _bytes('<A><X/></A>'))
+
+    def test_extension_element_apply_templates_remove_blank_text(self):
+        tree = self.parse('<a><b>B</b></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <A><myns:myext><x>X</x><y>Y</y><z/></myns:myext></A>
+  </xsl:template>
+  <xsl:template match="x"><X/></xsl:template>
+  <xsl:template match="y"><xsl:text>   </xsl:text></xsl:template>
+  <xsl:template match="z">XYZ</xsl:template>
+</xsl:stylesheet>''')
+
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                for child in self_node:
+                    for result in self.apply_templates(context, child,
+                                                       remove_blank_text=True):
+                        if isinstance(result, basestring):
+                            assert result.strip()
+                            el = etree.Element("T")
+                            el.text = result
+                        else:
+                            el = result
+                        output_parent.append(el)
+
+        extensions = { ('testns', 'myext') : MyExt() }
+
+        result = tree.xslt(style, extensions=extensions)
+        self.assertEqual(self._rootstring(result),
+                          _bytes('<A><X/><T>XYZ</T></A>'))
+
+    def test_extension_element_apply_templates_target_node(self):
+        tree = self.parse('<a><b>B</b></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <A><myns:myext><x>X</x><y>Y</y><z/></myns:myext></A>
+  </xsl:template>
+  <xsl:template match="x" />
+  <xsl:template match="z">XYZ</xsl:template>
+</xsl:stylesheet>''')
+        # apply_templates() is given output_parent here, so MyExt appends nothing itself.
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                for child in self_node:
+                    self.apply_templates(context, child, output_parent)
+
+        extensions = { ('testns', 'myext') : MyExt() }
+
+        result = tree.xslt(style, extensions=extensions)
+        self.assertEqual(self._rootstring(result),
+                          _bytes('<A>YXYZ</A>'))
+
+    def test_extension_element_apply_templates_target_node_doc(self):
+        tree = self.parse('<a><b>B</b></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <myns:myext><x>X</x><y>Y</y><z/></myns:myext>
+  </xsl:template>
+  <xsl:template match="x"><xsl:processing-instruction name="test">TEST</xsl:processing-instruction></xsl:template>
+  <xsl:template match="y"><Y>XYZ</Y></xsl:template>
+  <xsl:template match="z"><xsl:comment>TEST</xsl:comment></xsl:template>
+</xsl:stylesheet>''')
+        # myext has no wrapping element: the PI, <Y> and the comment become top-level nodes.
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                for child in self_node:
+                    self.apply_templates(context, child, output_parent)
+
+        extensions = { ('testns', 'myext') : MyExt() }
+        # The whole result tree is serialised because the siblings of <Y> matter here.
+        result = tree.xslt(style, extensions=extensions)
+        self.assertEqual(etree.tostring(result),
+                          _bytes('<?test TEST?><Y>XYZ</Y><!--TEST-->'))
+
+    def test_extension_element_process_children(self):
+        tree = self.parse('<a><b>E</b></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <xsl:variable name="testvar">yo</xsl:variable>
+    <A>
+      <myns:myext>
+        <xsl:attribute name="attr">
+          <xsl:value-of select="$testvar" />
+        </xsl:attribute>
+        <B>
+          <xsl:choose>
+            <xsl:when test="1 = 2"><C/></xsl:when>
+            <xsl:otherwise><D><xsl:value-of select="b/text()" /></D></xsl:otherwise>
+          </xsl:choose>
+        </B>
+      </myns:myext>
+    </A>
+  </xsl:template>
+</xsl:stylesheet>''')
+        # process_children() evaluates the XSLT content of <myns:myext> into the new <MY>.
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                el = etree.Element('MY')
+                self.process_children(context, el)
+                output_parent.append(el)
+
+        extensions = { ('testns', 'myext') : MyExt() }
+        # NOTE(review): 'MYattr' has no space; presumably _rootstring() strips whitespace -- confirm.
+        result = tree.xslt(style, extensions=extensions)
+        self.assertEqual(self._rootstring(result),
+                          _bytes('<A><MYattr="yo"><B><D>E</D></B></MY></A>'))
+
+    def test_extension_element_process_children_to_append_only(self):
+        tree = self.parse('<a/>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <myns:myext>
+      <A/>
+    </myns:myext>
+  </xsl:template>
+</xsl:stylesheet>''')
+        # output_parent itself is used as the target of process_children().
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                self.process_children(context, output_parent)
+
+        extensions = { ('testns', 'myext') : MyExt() }
+
+        result = tree.xslt(style, extensions=extensions)
+        self.assertEqual(self._rootstring(result),
+                          _bytes('<A/>'))
+
+    def test_extension_element_process_children_to_read_only_raise(self):
+        tree = self.parse('<a/>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <myns:myext>
+      <A/>
+    </myns:myext>
+  </xsl:template>
+</xsl:stylesheet>''')
+        # Using the stylesheet's own node (self_node) as output target must be rejected.
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                self.process_children(context, self_node)
+
+        extensions = { ('testns', 'myext') : MyExt() }
+        # The TypeError raised inside execute() is expected to surface from tree.xslt().
+        self.assertRaises(TypeError, tree.xslt, style, extensions=extensions)
+
+    def test_extension_element_process_children_with_subextension_element(self):
+        tree = self.parse('<a/>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns">
+  <xsl:template match="a">
+    <myns:myext>
+      <A><myns:myext><B/></myns:myext></A>
+    </myns:myext>
+  </xsl:template>
+</xsl:stylesheet>''')
+        # myext is nested inside itself; n numbers the calls (outer "1", inner "2").
+        class MyExt(etree.XSLTExtension):
+            callback_call_counter = 0
+            def execute(self, context, self_node, input_node, output_parent):
+                self.callback_call_counter += 1
+                el = etree.Element('MY', n=str(self.callback_call_counter))
+                self.process_children(context, el)
+                output_parent.append(el)
+
+        extensions = { ('testns', 'myext') : MyExt() }
+        # A single MyExt instance serves both elements, so the counter carries over.
+        result = tree.xslt(style, extensions=extensions)
+        self.assertEqual(self._rootstring(result),
+                          _bytes('<MYn="1"><A><MYn="2"><B/></MY></A></MY>'))
+
+    def test_extension_element_raise(self):
+        tree = self.parse('<a><b>B</b></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+    xmlns:myns="testns"
+    extension-element-prefixes="myns"
+    exclude-result-prefixes="myns">
+  <xsl:template match="a">
+    <A><myns:myext>b</myns:myext></A>
+  </xsl:template>
+</xsl:stylesheet>''')
+        # An exception raised inside execute() must reach the caller of tree.xslt() as MyError.
+        class MyError(Exception):
+            pass
+
+        class MyExt(etree.XSLTExtension):
+            def execute(self, context, self_node, input_node, output_parent):
+                raise MyError("expected!")
+
+        extensions = { ('testns', 'myext') : MyExt() }
+        self.assertRaises(MyError, tree.xslt, style, extensions=extensions)
+
+
+class Py3XSLTTestCase(HelperTestCase):
+    """XSLT tests for etree under Python 3"""
+
+    pytestmark = skipif('sys.version_info < (3,0)')
+
+    def test_xslt_result_bytes(self):
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        st = etree.XSLT(style)
+        res = st(tree)
+        self.assertEqual(_bytes('''\
+<?xml version="1.0"?>
+<foo>B</foo>
+'''),
+                          bytes(res))
+
+    def test_xslt_result_bytearray(self):
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        st = etree.XSLT(style)
+        res = st(tree)
+        self.assertEqual(_bytes('''\
+<?xml version="1.0"?>
+<foo>B</foo>
+'''),
+                          bytearray(res))
+
+    def test_xslt_result_memoryview(self):
+        tree = self.parse('<a><b>B</b><c>C</c></a>')
+        style = self.parse('''\
+<xsl:stylesheet version="1.0"
+    xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
+  <xsl:template match="*" />
+  <xsl:template match="/">
+    <foo><xsl:value-of select="/a/b/text()" /></foo>
+  </xsl:template>
+</xsl:stylesheet>''')
+
+        st = etree.XSLT(style)
+        res = st(tree)
+        self.assertEqual(_bytes('''\
+<?xml version="1.0"?>
+<foo>B</foo>
+'''),
+                          bytes(memoryview(res)))
+
+
+def test_suite():
+    suite = unittest.TestSuite()
+    suite.addTests([unittest.makeSuite(ETreeXSLTTestCase)])
+    suite.addTests([unittest.makeSuite(ETreeEXSLTTestCase)])
+    suite.addTests([unittest.makeSuite(ETreeXSLTExtFuncTestCase)])
+    suite.addTests([unittest.makeSuite(ETreeXSLTExtElementTestCase)])
+    if is_python3:
+        suite.addTests([unittest.makeSuite(Py3XSLTTestCase)])
+    suite.addTests(
+        [make_doctest('../../../doc/extensions.txt')])
+    suite.addTests(
+        [make_doctest('../../../doc/xpathxslt.txt')])
+    return suite
+
+if __name__ == '__main__':  # direct execution runs no tests
+    print('to test use test.py %s' % __file__)  # only prints a hint to use test.py
diff --git a/lib/lxml/usedoctest.py b/lib/lxml/usedoctest.py
new file mode 100644
index 00000000..f1da8cad
--- /dev/null
+++ b/lib/lxml/usedoctest.py
@@ -0,0 +1,13 @@
+"""Doctest module for XML comparison.
+
+Usage::
+
+   >>> import lxml.usedoctest
+   >>> # now do your XML doctests ...
+
+See `lxml.doctestcompare`
+"""
+
+from lxml import doctestcompare
+# Runs on import (see Usage above). NOTE(review): del_module presumably lets this module be imported again -- confirm.
+doctestcompare.temp_install(del_module=__name__)
diff --git a/lib/lxml/xinclude.pxi b/lib/lxml/xinclude.pxi
new file mode 100644
index 00000000..72e6a1c8
--- /dev/null
+++ b/lib/lxml/xinclude.pxi
@@ -0,0 +1,64 @@
+# XInclude processing
+
+from lxml.includes cimport xinclude
+
+class XIncludeError(LxmlError):
+    u"""Error during XInclude processing (raised by ``XInclude.__call__``).
+    """
+    pass
+
+cdef class XInclude:
+    u"""XInclude(self)
+    XInclude processor.
+
+    Create an instance and call it on an Element to run XInclude
+    processing.
+    """
+    cdef _ErrorLog _error_log  # messages of the latest run; connect() empties it first
+    def __init__(self):
+        self._error_log = _ErrorLog()
+
+    property error_log:
+        def __get__(self):
+            assert self._error_log is not None, "XInclude instance not initialised"
+            return self._error_log.copy()  # snapshot; callers never get the live log
+
+    def __call__(self, _Element node not None):
+        u"__call__(self, node)"
+        # We cannot pass the XML_PARSE_NOXINCNODE option as this would free
+        # the XInclude nodes - there may still be Python references to them!
+        # Therefore, we allow XInclude nodes to be converted to
+        # XML_XINCLUDE_START nodes.  XML_XINCLUDE_END nodes are added as
+        # siblings.  Tree traversal will simply ignore them as they are not
+        # typed as elements.  The included fragment is added between the two,
+        # i.e. as a sibling, which does not conflict with traversal.
+        cdef int result
+        _assertValidNode(node)
+        assert self._error_log is not None, "XInclude processor not initialised"
+        if node._doc._parser is not None:  # reuse options/context of the document's parser
+            parse_options = node._doc._parser._parse_options
+            context = node._doc._parser._getParserContext()
+            c_context = <void*>context
+        else:
+            parse_options = 0
+            context = None
+            c_context = NULL
+
+        self._error_log.connect()
+        if tree.LIBXML_VERSION < 20704 or not c_context:  # NOTE(review): presumably the data argument is unusable before 2.7.4 -- confirm
+            __GLOBAL_PARSER_CONTEXT.pushImpliedContext(context)
+        with nogil:  # the libxml2 call runs without the GIL
+            if c_context:
+                result = xinclude.xmlXIncludeProcessTreeFlagsData(
+                    node._c_node, parse_options, c_context)
+            else:
+                result = xinclude.xmlXIncludeProcessTree(node._c_node)
+        if tree.LIBXML_VERSION < 20704 or not c_context:  # must mirror the push condition above
+            __GLOBAL_PARSER_CONTEXT.popImpliedContext()
+        self._error_log.disconnect()
+
+        if result == -1:  # -1 is treated as failure; the log supplies the message
+            raise XIncludeError(
+                self._error_log._buildExceptionMessage(
+                    u"XInclude processing failed"),
+                self._error_log)
diff --git a/lib/lxml/xmlerror.pxi b/lib/lxml/xmlerror.pxi
new file mode 100644
index 00000000..5294b500
--- /dev/null
+++ b/lib/lxml/xmlerror.pxi
@@ -0,0 +1,1581 @@
+# DEBUG and error logging
+
+from lxml.includes cimport xmlerror
+from lxml cimport cvarargs
+
+# module level API functions
+
+def clear_error_log():
+    u"""clear_error_log()
+
+    Clear the global error log.  Note that this log is already bound to a
+    fixed size.
+
+    Note: since lxml 2.2, the global error log is local to a thread
+    and this function will only clear the global error log of the
+    current thread.
+    """
+    _getGlobalErrorLog().clear()  # clears whatever log _getGlobalErrorLog() returns for this call
+
+# dummy printf-style error callback: discards the message, so no debug output at all
+cdef void _nullGenericErrorFunc(void* ctxt, char* msg, ...) nogil:
+    pass
+
+# setup for global log:
+
+cdef void _initThreadLogging():
+    # disable generic error lines from libxml2 by installing the no-op callback
+    xmlerror.xmlSetGenericErrorFunc(NULL, <xmlerror.xmlGenericErrorFunc>_nullGenericErrorFunc)
+
+    # divert error messages to the global error log (NULL is passed as the log context)
+    connectErrorLog(NULL)
+
+cdef void connectErrorLog(void* log):  # installs _receiveXSLTError as libxslt's generic error callback
+    xslt.xsltSetGenericErrorFunc(log, <xmlerror.xmlGenericErrorFunc>_receiveXSLTError)  # `log` becomes the callback context
+
+# Logging classes
+
+@cython.final
+@cython.freelist(16)
+cdef class _LogEntry:
+    """A log message entry from an error log.
+
+    Attributes:
+
+    - message: the message text
+    - domain: the domain ID (see lxml.etree.ErrorDomains)
+    - type: the message type ID (see lxml.etree.ErrorTypes)
+    - level: the log level ID (see lxml.etree.ErrorLevels)
+    - line: the line at which the message originated (if applicable)
+    - column: the character column at which the message originated (if applicable)
+    - filename: the name of the file in which the message originated (if applicable)
+    """
+    cdef readonly int domain
+    cdef readonly int type
+    cdef readonly int level
+    cdef readonly int line
+    cdef readonly int column
+    cdef object _message  # decoded text, or None while only the C copy exists
+    cdef object _filename  # decoded name, or None while only the C copy exists
+    cdef char* _c_message  # private copy of the libxml2 message, decoded lazily
+    cdef xmlChar* _c_filename  # private copy of the libxml2 file name, decoded lazily
+
+    def __dealloc__(self):
+        tree.xmlFree(self._c_message)
+        tree.xmlFree(self._c_filename)
+
+    @cython.final
+    cdef _setError(self, xmlerror.xmlError* error):  # fill the entry from a libxml2 error struct
+        self.domain   = error.domain
+        self.type     = error.code
+        self.level    = <int>error.level
+        self.line     = error.line
+        self.column   = error.int2
+        self._c_message = NULL
+        self._c_filename = NULL
+        if error.message is NULL or error.message[0] in b'\n\0':
+            self._message = u"unknown error"
+        else:
+            self._message = None  # decoded on first access of .message
+            self._c_message = <char*> tree.xmlStrdup(
+                <const_xmlChar*> error.message)
+            if not self._c_message:
+                raise MemoryError()
+        if error.file is NULL:
+            self._filename = u'<string>'
+        else:
+            self._filename = None  # decoded on first access of .filename
+            self._c_filename = tree.xmlStrdup(<const_xmlChar*> error.file)
+            if not self._c_filename:
+                raise MemoryError()
+
+    @cython.final
+    cdef _setGeneric(self, int domain, int type, int level, int line,
+                     message, filename):  # fill the entry from ready-made Python values
+        self.domain  = domain
+        self.type    = type
+        self.level   = level
+        self.line    = line
+        self.column  = 0
+        self._message = message
+        self._filename = filename
+
+    def __repr__(self):
+        return u"%s:%d:%d:%s:%s:%s: %s" % (
+            self.filename, self.line, self.column, self.level_name,
+            self.domain_name, self.type_name, self.message)
+
+    property domain_name:
+        """The name of the error domain.  See lxml.etree.ErrorDomains
+        """
+        def __get__(self):
+            return ErrorDomains._getName(self.domain, u"unknown")
+
+    property type_name:
+        """The name of the error type.  See lxml.etree.ErrorTypes
+        """
+        def __get__(self):
+            if self.domain == ErrorDomains.RELAXNGV:  # RelaxNG validation has its own type names
+                getName = RelaxNGErrorTypes._getName
+            else:
+                getName = ErrorTypes._getName
+            return getName(self.type, u"unknown")
+
+    property level_name:
+        """The name of the error level.  See lxml.etree.ErrorLevels
+        """
+        def __get__(self):
+            return ErrorLevels._getName(self.level, u"unknown")
+
+    property message:
+        def __get__(self):  # decodes the C message once, caches it and frees the C copy
+            cdef size_t size
+            if self._message is not None:
+                return self._message
+            if self._c_message is NULL:
+                return None
+            size = cstring_h.strlen(self._c_message)
+            if size > 0 and self._c_message[size-1] == '\n':
+                size -= 1  # strip EOL
+            # cannot use funicode() here because the message may contain
+            # byte encoded file paths etc.
+            try:
+                self._message = self._c_message[:size].decode('utf8')
+            except UnicodeDecodeError:
+                try:
+                    self._message = self._c_message[:size].decode(  # not self.message: that property has no setter
+                        'ascii', 'backslashreplace')
+                except UnicodeDecodeError:
+                    self._message = u'<undecodable error message>'
+            if self._c_message:
+                # clean up early
+                tree.xmlFree(self._c_message)
+                self._c_message = NULL
+            return self._message
+
+    property filename:
+        def __get__(self):  # same lazy decode-and-free scheme as .message
+            if self._filename is None:
+                if self._c_filename is not NULL:
+                    self._filename = _decodeFilename(self._c_filename)
+                    # clean up early
+                    tree.xmlFree(self._c_filename)
+                    self._c_filename = NULL
+            return self._filename
+
+
+cdef class _BaseErrorLog:
+    cdef _LogEntry _first_error  # entry the exception builders below take their text from (may be None)
+    cdef readonly object last_error  # set by _receive*() to each ERROR/FATAL entry as it arrives
+    def __init__(self, first_error, last_error):
+        self._first_error = first_error
+        self.last_error = last_error
+
+    cpdef copy(self):  # new log object referring to the same two entries
+        return _BaseErrorLog(self._first_error, self.last_error)
+
+    def __repr__(self):
+        return u''
+
+    cpdef receive(self, _LogEntry entry):  # overridable hook; the base class stores nothing
+        pass
+
+    @cython.final
+    cdef void _receive(self, xmlerror.xmlError* error):  # wrap a libxml2 error and dispatch it
+        cdef bint is_error
+        cdef _LogEntry entry
+        cdef _BaseErrorLog global_log
+        entry = _LogEntry.__new__(_LogEntry)
+        entry._setError(error)
+        is_error = error.level == xmlerror.XML_ERR_ERROR or \
+                   error.level == xmlerror.XML_ERR_FATAL
+        global_log = _getGlobalErrorLog()
+        if global_log is not self:  # mirror into the global log, but never deliver twice
+            global_log.receive(entry)
+            if is_error:
+                global_log.last_error = entry
+        self.receive(entry)
+        if is_error:
+            self.last_error = entry
+
+    @cython.final
+    cdef void _receiveGeneric(self, int domain, int type, int level, int line,
+                              message, filename):  # same dispatch as _receive(), from plain values
+        cdef bint is_error
+        cdef _LogEntry entry
+        cdef _BaseErrorLog global_log
+        entry = _LogEntry.__new__(_LogEntry)
+        entry._setGeneric(domain, type, level, line, message, filename)
+        is_error = level == xmlerror.XML_ERR_ERROR or \
+                   level == xmlerror.XML_ERR_FATAL
+        global_log = _getGlobalErrorLog()
+        if global_log is not self:  # mirror into the global log, but never deliver twice
+            global_log.receive(entry)
+            if is_error:
+                global_log.last_error = entry
+        self.receive(entry)
+        if is_error:
+            self.last_error = entry
+
+    @cython.final
+    cdef _buildParseException(self, exctype, default_message):  # returns exctype(message, code, line, column)
+        code = xmlerror.XML_ERR_INTERNAL_ERROR
+        if self._first_error is None:
+            return exctype(default_message, code, 0, 0)
+        message = self._first_error.message
+        if message:
+            code = self._first_error.type  # the entry's own code is used only together with its message
+        else:
+            message = default_message
+        line = self._first_error.line
+        column = self._first_error.column
+        if line > 0:  # append the position only when it is known
+            if column > 0:
+                message = u"%s, line %d, column %d" % (message, line, column)
+            else:
+                message = u"%s, line %d" % (message, line)
+        return exctype(message, code, line, column)
+
+    @cython.final
+    cdef _buildExceptionMessage(self, default_message):  # message text only; may return None
+        if self._first_error is None:
+            return default_message
+        if self._first_error.message:
+            message = self._first_error.message
+        elif default_message is None:
+            return None
+        else:
+            message = default_message
+        if self._first_error.line > 0:  # append the position only when it is known
+            if self._first_error.column > 0:
+                message = u"%s, line %d, column %d" % (
+                    message, self._first_error.line, self._first_error.column)
+            else:
+                message = u"%s, line %d" % (message, self._first_error.line)
+        return message
+
+cdef class _ListErrorLog(_BaseErrorLog):
+    u"Immutable base version of a list based error log."
+    cdef list _entries
+    cdef int _offset  # number of leading items in _entries that are hidden from users
+    def __init__(self, entries, first_error, last_error):
+        if entries:
+            if first_error is None:
+                first_error = entries[0]
+            if last_error is None:
+                last_error = entries[-1]
+        _BaseErrorLog.__init__(self, first_error, last_error)
+        self._entries = entries
+
+    cpdef copy(self):
+        u"""Creates a shallow copy of this error log.  Reuses the list of
+        entries.
+        """
+        cdef _ListErrorLog log = _ListErrorLog(
+            self._entries, self._first_error, self.last_error)
+        log._offset = self._offset
+        return log
+
+    def __iter__(self):
+        entries = self._entries
+        if self._offset:
+            entries = islice(entries, self._offset, None)  # skip the hidden prefix, keep the rest
+        return iter(entries)
+
+    def __repr__(self):
+        return u'\n'.join([repr(entry) for entry in self])
+
+    def __getitem__(self, index):
+        if self._offset and index >= 0:  # negative indices already count from the end
+            index += self._offset
+        return self._entries[index]
+
+    def __len__(self):
+        return len(self._entries) - self._offset
+
+    def __contains__(self, error_type):
+        cdef Py_ssize_t i
+        for i, entry in enumerate(self._entries):
+            if i < self._offset:
+                continue
+            if entry.type == error_type:
+                return True
+        return False
+
+    def __nonzero__(self):
+        return len(self._entries) > self._offset
+
+    def filter_domains(self, domains):
+        u"""Filter the errors by the given domains and return a new error log
+        containing the matches.
+        """
+        cdef _LogEntry entry
+        if isinstance(domains, (int, long)):  # a single ID is accepted as well
+            domains = (domains,)
+        filtered = [entry for entry in self if entry.domain in domains]
+        return _ListErrorLog(filtered, None, None)
+
+    def filter_types(self, types):
+        u"""filter_types(self, types)
+
+        Filter the errors by the given types and return a new error
+        log containing the matches.
+        """
+        cdef _LogEntry entry
+        if isinstance(types, (int, long)):  # a single ID is accepted as well
+            types = (types,)
+        filtered = [entry for entry in self if entry.type in types]
+        return _ListErrorLog(filtered, None, None)
+
+    def filter_levels(self, levels):
+        u"""filter_levels(self, levels)
+
+        Filter the errors by the given error levels and return a new
+        error log containing the matches.
+        """
+        cdef _LogEntry entry
+        if isinstance(levels, (int, long)):  # a single ID is accepted as well
+            levels = (levels,)
+        filtered = [entry for entry in self if entry.level in levels]
+        return _ListErrorLog(filtered, None, None)
+
+    def filter_from_level(self, level):
+        u"""filter_from_level(self, level)
+
+        Return a log with all messages of the requested level or worse.
+        """
+        cdef _LogEntry entry
+        filtered = [entry for entry in self if entry.level >= level]
+        return _ListErrorLog(filtered, None, None)
+
+    def filter_from_fatals(self):
+        u"""filter_from_fatals(self)
+
+        Convenience method to get all fatal error messages.
+        """
+        return self.filter_from_level(ErrorLevels.FATAL)
+
+    def filter_from_errors(self):
+        u"""filter_from_errors(self)
+
+        Convenience method to get all error messages or worse.
+        """
+        return self.filter_from_level(ErrorLevels.ERROR)
+
+    def filter_from_warnings(self):
+        u"""filter_from_warnings(self)
+
+        Convenience method to get all warnings or worse.
+        """
+        return self.filter_from_level(ErrorLevels.WARNING)
+
+@cython.final
+@cython.internal
+cdef class _ErrorLogContext:
+    """
+    Error log context for the 'with' statement.
+    Stores a reference to the current callbacks to allow for
+    recursively stacked log contexts.
+    """
+    cdef xmlerror.xmlStructuredErrorFunc old_error_func  # handler that was active before connect()
+    cdef void* old_error_context  # context pointer that belonged to that handler
+
+cdef class _ErrorLog(_ListErrorLog):
+    cdef list _logContexts  # stack of _ErrorLogContext objects, one per active connect()
+    def __cinit__(self):
+        self._logContexts = []
+
+    def __init__(self):
+        _ListErrorLog.__init__(self, [], None, None)
+
+    @cython.final
+    cdef int __enter__(self) except -1:
+        return self.connect()
+
+    def __exit__(self, *args):
+        #  TODO: make this a cdef function when Cython supports it
+        self.disconnect()
+
+    @cython.final
+    cdef int connect(self) except -1:  # start capturing libxml2 structured errors in this log
+        self._first_error = None
+        del self._entries[:]  # empties the list in place; last_error and _offset are not reset here
+
+        cdef _ErrorLogContext context = _ErrorLogContext.__new__(_ErrorLogContext)
+        context.old_error_func = xmlerror.xmlStructuredError  # remember the current handler ...
+        context.old_error_context = xmlerror.xmlStructuredErrorContext  # ... and its context
+        self._logContexts.append(context)
+        xmlerror.xmlSetStructuredErrorFunc(
+            <void*>self, <xmlerror.xmlStructuredErrorFunc>_receiveError)
+        return 0
+
+    @cython.final
+    cdef int disconnect(self) except -1:  # restore the handler saved by the matching connect()
+        cdef _ErrorLogContext context = self._logContexts.pop()
+        xmlerror.xmlSetStructuredErrorFunc(
+            context.old_error_context, context.old_error_func)
+        return 0
+
+    cpdef clear(self):  # full reset, including last_error and the offset
+        self._first_error = None
+        self.last_error = None
+        self._offset = 0
+        del self._entries[:]
+
+    cpdef copy(self):
+        u"""Creates a shallow copy of this error log and the list of entries.
+        """
+        return _ListErrorLog(
+            self._entries[self._offset:],
+            self._first_error, self.last_error)
+
+    def __iter__(self):
+        return iter(self._entries[self._offset:])  # iterates over a copy of the visible entries
+
+    cpdef receive(self, _LogEntry entry):
+        if self._first_error is None and entry.level >= xmlerror.XML_ERR_ERROR:  # keep the first entry at ERROR level or above
+            self._first_error = entry
+        self._entries.append(entry)
+
+cdef class _DomainErrorLog(_ErrorLog):  # error log that only records entries from selected domains
+    def __init__(self, domains):
+        _ErrorLog.__init__(self)
+        self._accepted_domains = tuple(domains)  # own copy of the accepted domains
+
+    cpdef receive(self, _LogEntry entry):
+        if entry.domain in self._accepted_domains:  # entries of any other domain are dropped
+            _ErrorLog.receive(self, entry)
+
+cdef class _RotatingErrorLog(_ErrorLog):  # error log that exposes at most the max_len latest entries
+    cdef int _max_len  # limit on the number of entries visible after the offset
+    def __init__(self, max_len):
+        _ErrorLog.__init__(self)
+        self._max_len = max_len
+
+    cpdef receive(self, _LogEntry entry):
+        if self._first_error is None and entry.level >= xmlerror.XML_ERR_ERROR:
+            self._first_error = entry  # first entry at level XML_ERR_ERROR or above
+        self._entries.append(entry)
+
+        if len(self._entries) > self._max_len:
+            self._offset += 1  # hide the oldest entry instead of deleting it right away
+            if self._offset > self._max_len // 3:  # delete the hidden entries in one batch
+                offset = self._offset
+                self._offset = 0
+                del self._entries[:offset]
+
+cdef class PyErrorLog(_BaseErrorLog):
+    u"""PyErrorLog(self, logger_name=None, logger=None)
+    A global error log that connects to the Python stdlib logging package.
+
+    The constructor accepts an optional logger name or a readily instantiated
+    logger instance (which takes precedence).  The default is the root logger.
+
+    If you want to change the mapping between libxml2's ErrorLevels and Python
+    logging levels, you can modify the level_map dictionary from a subclass.
+
+    The default mapping is::
+
+            ErrorLevels.WARNING = logging.WARNING
+            ErrorLevels.ERROR   = logging.ERROR
+            ErrorLevels.FATAL   = logging.CRITICAL
+
+    You can also override the method ``receive()`` that takes a LogEntry
+    object and calls ``self.log(log_entry, format_string, arg1, arg2, ...)``
+    with appropriate data.
+    """
+    cdef readonly dict level_map  # maps libxml2 ErrorLevels to logging levels
+    cdef object _map_level  # bound level_map.get
+    cdef object _log  # bound log() method of the selected logger
+    def __init__(self, logger_name=None, logger=None):
+        _BaseErrorLog.__init__(self, None, None)
+        import logging
+        self.level_map = {
+            ErrorLevels.WARNING : logging.WARNING,
+            ErrorLevels.ERROR   : logging.ERROR,
+            ErrorLevels.FATAL   : logging.CRITICAL
+            }
+        self._map_level = self.level_map.get
+        if logger is None:
+            if logger_name:
+                logger = logging.getLogger(logger_name)
+            else:
+                logger = logging.getLogger()  # no name given: root logger
+        self._log = logger.log
+
+    cpdef copy(self):
+        u"""Dummy method that returns an empty error log.
+        """
+        return _ListErrorLog([], None, None)
+
+    def log(self, log_entry, message, *args):
+        u"""log(self, log_entry, message, *args)
+
+        Called by the .receive() method to log a _LogEntry instance to
+        the Python logging system.  This handles the error level
+        mapping.
+
+        In the default implementation, the ``message`` argument
+        receives a complete log line, and there are no further
+        ``args``.  To change the message format, it is best to
+        override the .receive() method instead of this one.
+        """
+        self._log(
+            self._map_level(log_entry.level, 0),  # levels missing from level_map are logged as 0
+            message, *args
+            )
+
+    cpdef receive(self, _LogEntry log_entry):
+        u"""receive(self, log_entry)
+
+        Receive a _LogEntry instance from the logging system.  Calls
+        the .log() method with appropriate parameters::
+
+            self.log(log_entry, repr(log_entry))
+
+        You can override this method to provide your own log output
+        format.
+        """
+        self.log(log_entry, repr(log_entry))
+
+# global list log to collect error output messages from libxml2/libxslt;
+# kept per thread where a thread dict exists, this instance is the fallback
+
+cdef _BaseErrorLog __GLOBAL_ERROR_LOG
+__GLOBAL_ERROR_LOG = _RotatingErrorLog(__MAX_LOG_SIZE)
+
+cdef _BaseErrorLog _getGlobalErrorLog():
+    u"""Retrieve the global error log of this thread, creating it on first use."""
+    cdef python.PyObject* thread_dict
+    thread_dict = python.PyThreadState_GetDict()
+    if thread_dict is NULL:  # no thread state dict available: use the module-level log
+        return __GLOBAL_ERROR_LOG
+    try:
+        return (<object>thread_dict)[u"_GlobalErrorLog"]
+    except KeyError:  # nothing stored for this thread yet: create and store a rotating log
+        log = (<object>thread_dict)[u"_GlobalErrorLog"] = \
+              _RotatingErrorLog(__MAX_LOG_SIZE)
+        return log
+
+cdef _setGlobalErrorLog(_BaseErrorLog log):
+    u"""Set the global error log of this thread (or the module-level fallback)."""
+    cdef python.PyObject* thread_dict
+    thread_dict = python.PyThreadState_GetDict()
+    if thread_dict is NULL:  # no thread state dict available: replace the module-level log
+        global __GLOBAL_ERROR_LOG
+        __GLOBAL_ERROR_LOG = log
+    else:
+        (<object>thread_dict)[u"_GlobalErrorLog"] = log  # same key that _getGlobalErrorLog() reads
+
+cdef __copyGlobalErrorLog():
+    u"Helper function for properties in exceptions: copy this thread's global log."
+    return _getGlobalErrorLog().copy()
+
+def use_global_python_log(PyErrorLog log not None):
+    u"""use_global_python_log(log)
+
+    Replace the global error log with an etree.PyErrorLog that uses the
+    standard Python logging package.
+
+    Note that this disables access to the global error log from exceptions.
+    Parsers, XSLT etc. will continue to provide their normal local error log.
+
+    Note: prior to lxml 2.2, this changed the error log globally.
+    Since lxml 2.2, the global error log is local to a thread and this
+    function will only set the global error log of the current thread.
+    """
+    _setGlobalErrorLog(log)  # 'not None' in the signature makes Cython reject a None argument
+
+
+# local log functions: acquire the GIL and forward the error to a logger object
+cdef void _forwardError(void* c_log_handler, xmlerror.xmlError* error) with gil:
+    cdef _BaseErrorLog log_handler
+    if c_log_handler is not NULL:
+        log_handler = <_BaseErrorLog>c_log_handler  # the context pointer is the log object itself
+    else:
+        log_handler = _getGlobalErrorLog()  # no specific log given: use this thread's global log
+    log_handler._receive(error)
+
+cdef void _receiveError(void* c_log_handler, xmlerror.xmlError* error) nogil:
+    # no Python objects here, may be called without thread context !
+    if __DEBUG:  # nothing is forwarded (the error is dropped) when __DEBUG is false
+        _forwardError(c_log_handler, error)
+
+cdef void _receiveXSLTError(void* c_log_handler, char* msg, ...) nogil:
+    # XSLT error callback (printf-style); no Python objects here, may be called without thread context !
+    cdef xmlerror.xmlError c_error
+    cdef cvarargs.va_list args
+    cdef char* c_text  # argument of a leading "%s" in msg
+    cdef char* c_message  # malloc'ed message buffer, NULL if none was needed
+    cdef char* c_element  # argument of an "element %s" chunk
+    cdef char* c_pos  # current read position in msg
+    cdef char* c_name_pos  # start of the word(s) in front of the next conversion
+    cdef char* c_str
+    cdef int text_size, element_size, format_count, c_int
+    if not __DEBUG or msg is NULL:
+        return
+    if msg[0] in b'\n\0':  # empty message or bare newline: nothing to report
+        return
+
+    c_text = c_element = c_error.file = NULL
+    c_error.line = 0
+
+    # parse "NAME %s" chunks from the format string, one vararg per conversion
+    cvarargs.va_start(args, msg)
+    c_name_pos = c_pos = msg
+    format_count = 0
+    while c_pos[0]:
+        if c_pos[0] == b'%':
+            c_pos += 1
+            if c_pos[0] == b's':  # "%s"
+                format_count += 1
+                c_str = cvarargs.va_charptr(args)
+                if c_pos == msg + 1:
+                    c_text = c_str  # msg == "%s..."
+                elif c_name_pos[0] == b'e':
+                    if cstring_h.strncmp(c_name_pos, 'element %s', 10) == 0:  # strncmp() == 0 means "equal"
+                        c_element = c_str
+                elif c_name_pos[0] == b'f':
+                    if cstring_h.strncmp(c_name_pos, 'file %s', 7) == 0:
+                        if cstring_h.strncmp('string://__STRING__XSLT',
+                                             c_str, 23) == 0:
+                            c_str = '<xslt>'
+                        c_error.file = c_str
+            elif c_pos[0] == b'd':  # "%d"
+                format_count += 1
+                c_int = cvarargs.va_int(args)
+                if cstring_h.strncmp(c_name_pos, 'line %d', 7) == 0:
+                    c_error.line = c_int
+            elif c_pos[0] != b'%':  # "%%" == "%"
+                format_count += 1
+                break  # unexpected format or end of string => abort
+        elif c_pos[0] == b' ':
+            if c_pos[1] != b'%':  # keep the name start when the conversion follows directly
+                c_name_pos = c_pos + 1
+        c_pos += 1
+    cvarargs.va_end(args)
+
+    c_message = NULL
+    if c_text is NULL:
+        if c_element is not NULL and format_count == 1:
+            # special case: a single occurrence of 'element %s'
+            text_size    = cstring_h.strlen(msg)
+            element_size = cstring_h.strlen(c_element)
+            c_message = <char*>stdlib.malloc(
+                (text_size + element_size + 1) * sizeof(char))
+            stdio.sprintf(c_message, msg, c_element)  # NOTE(review): malloc() result is not NULL-checked
+            c_error.message = c_message
+        else:
+            c_error.message = ''
+    elif c_element is NULL:
+        c_error.message = c_text
+    else:
+        text_size    = cstring_h.strlen(c_text)
+        element_size = cstring_h.strlen(c_element)
+        c_message = <char*>stdlib.malloc(
+            (text_size + 12 + element_size + 1) * sizeof(char))  # 12 == len(", element ''")
+        stdio.sprintf(c_message, "%s, element '%s'", c_text, c_element)  # NOTE(review): no NULL check either
+        c_error.message = c_message
+
+    c_error.domain = xmlerror.XML_FROM_XSLT
+    c_error.code   = xmlerror.XML_ERR_OK    # what else?
+    c_error.level  = xmlerror.XML_ERR_ERROR # what else?
+    c_error.int2   = 0
+
+    _forwardError(c_log_handler, &c_error)  # acquires the GIL and hands the error to the log
+
+    if c_message is not NULL:
+        stdlib.free(c_message)
+
+################################################################################
+## CONSTANTS FROM "xmlerror.h" (or rather libxml-xmlerror.html)
+################################################################################
+
+cdef __initErrorConstants():
+    u"Called at setup time to parse the constants and build the classes below."
+    global __ERROR_LEVELS, __ERROR_DOMAINS, __PARSER_ERROR_TYPES, __RELAXNG_ERROR_TYPES
+    find_constants = re.compile(ur"\s*([a-zA-Z0-9_]+)\s*=\s*([0-9]+)").findall  # yields (name, digits) pairs
+    const_defs = ((ErrorLevels,          __ERROR_LEVELS),
+                  (ErrorDomains,         __ERROR_DOMAINS),
+                  (ErrorTypes,           __PARSER_ERROR_TYPES),
+                  (RelaxNGErrorTypes,    __RELAXNG_ERROR_TYPES))
+    for cls, constant_tuple in const_defs:
+        reverse_dict = {}
+        cls._names   = reverse_dict  # value -> name mapping
+        cls._getName = reverse_dict.get
+        for constants in constant_tuple:
+            # each string holds "NAME=value" definitions, one per line
+            for name, value in find_constants(constants):
+                value = int(value)
+                setattr(cls, name, value)  # the constant becomes a class attribute
+                reverse_dict[value] = name
+
+    # discard the global tuple references after use
+    __ERROR_LEVELS = __ERROR_DOMAINS = __PARSER_ERROR_TYPES = __RELAXNG_ERROR_TYPES = None
+
+
+class ErrorLevels(object):  # constants are attached by __initErrorConstants()
+    u"Libxml2 error levels"
+
+class ErrorDomains(object):  # constants are attached by __initErrorConstants()
+    u"Libxml2 error domains"
+
+class ErrorTypes(object):  # constants are attached by __initErrorConstants()
+    u"Libxml2 error types"
+
+class RelaxNGErrorTypes(object):  # constants are attached by __initErrorConstants()
+    u"Libxml2 RelaxNG error types"
+
+# --- BEGIN: GENERATED CONSTANTS ---
+
+# This section is generated by the script 'update-error-constants.py'.
+
+# Constants are stored in tuples of strings, for which Cython generates very
+# efficient setup code.  To parse them, iterate over the tuples and parse each
+# line in each string independently.  Tuples of strings (instead of a plain
+# string) are required as some C-compilers of a certain well-known OS vendor
+# cannot handle strings that are a few thousand bytes in length.
+
+cdef object __ERROR_LEVELS = (u"""\
+NONE=0
+WARNING=1
+ERROR=2
+FATAL=3
+""",)
+
+cdef object __ERROR_DOMAINS = (u"""\
+NONE=0
+PARSER=1
+TREE=2
+NAMESPACE=3
+DTD=4
+HTML=5
+MEMORY=6
+OUTPUT=7
+IO=8
+FTP=9
+HTTP=10
+XINCLUDE=11
+XPATH=12
+XPOINTER=13
+REGEXP=14
+DATATYPE=15
+SCHEMASP=16
+SCHEMASV=17
+RELAXNGP=18
+RELAXNGV=19
+CATALOG=20
+C14N=21
+XSLT=22
+VALID=23
+CHECK=24
+WRITER=25
+MODULE=26
+I18N=27
+SCHEMATRONV=28
+BUFFER=29
+URI=30
+""",)
+
+cdef object __PARSER_ERROR_TYPES = (u"""\
+ERR_OK=0
+ERR_INTERNAL_ERROR=1
+ERR_NO_MEMORY=2
+ERR_DOCUMENT_START=3
+ERR_DOCUMENT_EMPTY=4
+ERR_DOCUMENT_END=5
+ERR_INVALID_HEX_CHARREF=6
+ERR_INVALID_DEC_CHARREF=7
+ERR_INVALID_CHARREF=8
+ERR_INVALID_CHAR=9
+ERR_CHARREF_AT_EOF=10
+ERR_CHARREF_IN_PROLOG=11
+ERR_CHARREF_IN_EPILOG=12
+ERR_CHARREF_IN_DTD=13
+ERR_ENTITYREF_AT_EOF=14
+ERR_ENTITYREF_IN_PROLOG=15
+ERR_ENTITYREF_IN_EPILOG=16
+ERR_ENTITYREF_IN_DTD=17
+ERR_PEREF_AT_EOF=18
+ERR_PEREF_IN_PROLOG=19
+ERR_PEREF_IN_EPILOG=20
+ERR_PEREF_IN_INT_SUBSET=21
+ERR_ENTITYREF_NO_NAME=22
+ERR_ENTITYREF_SEMICOL_MISSING=23
+ERR_PEREF_NO_NAME=24
+ERR_PEREF_SEMICOL_MISSING=25
+ERR_UNDECLARED_ENTITY=26
+WAR_UNDECLARED_ENTITY=27
+ERR_UNPARSED_ENTITY=28
+ERR_ENTITY_IS_EXTERNAL=29
+ERR_ENTITY_IS_PARAMETER=30
+ERR_UNKNOWN_ENCODING=31
+ERR_UNSUPPORTED_ENCODING=32
+ERR_STRING_NOT_STARTED=33
+ERR_STRING_NOT_CLOSED=34
+ERR_NS_DECL_ERROR=35
+ERR_ENTITY_NOT_STARTED=36
+ERR_ENTITY_NOT_FINISHED=37
+ERR_LT_IN_ATTRIBUTE=38
+ERR_ATTRIBUTE_NOT_STARTED=39
+ERR_ATTRIBUTE_NOT_FINISHED=40
+ERR_ATTRIBUTE_WITHOUT_VALUE=41
+ERR_ATTRIBUTE_REDEFINED=42
+ERR_LITERAL_NOT_STARTED=43
+ERR_LITERAL_NOT_FINISHED=44
+ERR_COMMENT_NOT_FINISHED=45
+ERR_PI_NOT_STARTED=46
+ERR_PI_NOT_FINISHED=47
+ERR_NOTATION_NOT_STARTED=48
+ERR_NOTATION_NOT_FINISHED=49
+ERR_ATTLIST_NOT_STARTED=50
+ERR_ATTLIST_NOT_FINISHED=51
+ERR_MIXED_NOT_STARTED=52
+ERR_MIXED_NOT_FINISHED=53
+ERR_ELEMCONTENT_NOT_STARTED=54
+ERR_ELEMCONTENT_NOT_FINISHED=55
+ERR_XMLDECL_NOT_STARTED=56
+ERR_XMLDECL_NOT_FINISHED=57
+ERR_CONDSEC_NOT_STARTED=58
+ERR_CONDSEC_NOT_FINISHED=59
+ERR_EXT_SUBSET_NOT_FINISHED=60
+ERR_DOCTYPE_NOT_FINISHED=61
+ERR_MISPLACED_CDATA_END=62
+ERR_CDATA_NOT_FINISHED=63
+ERR_RESERVED_XML_NAME=64
+ERR_SPACE_REQUIRED=65
+ERR_SEPARATOR_REQUIRED=66
+ERR_NMTOKEN_REQUIRED=67
+ERR_NAME_REQUIRED=68
+ERR_PCDATA_REQUIRED=69
+ERR_URI_REQUIRED=70
+ERR_PUBID_REQUIRED=71
+ERR_LT_REQUIRED=72
+ERR_GT_REQUIRED=73
+ERR_LTSLASH_REQUIRED=74
+ERR_EQUAL_REQUIRED=75
+ERR_TAG_NAME_MISMATCH=76
+ERR_TAG_NOT_FINISHED=77
+ERR_STANDALONE_VALUE=78
+""",
+u"""\
+ERR_ENCODING_NAME=79
+ERR_HYPHEN_IN_COMMENT=80
+ERR_INVALID_ENCODING=81
+ERR_EXT_ENTITY_STANDALONE=82
+ERR_CONDSEC_INVALID=83
+ERR_VALUE_REQUIRED=84
+ERR_NOT_WELL_BALANCED=85
+ERR_EXTRA_CONTENT=86
+ERR_ENTITY_CHAR_ERROR=87
+ERR_ENTITY_PE_INTERNAL=88
+ERR_ENTITY_LOOP=89
+ERR_ENTITY_BOUNDARY=90
+ERR_INVALID_URI=91
+ERR_URI_FRAGMENT=92
+WAR_CATALOG_PI=93
+ERR_NO_DTD=94
+ERR_CONDSEC_INVALID_KEYWORD=95
+ERR_VERSION_MISSING=96
+WAR_UNKNOWN_VERSION=97
+WAR_LANG_VALUE=98
+WAR_NS_URI=99
+WAR_NS_URI_RELATIVE=100
+ERR_MISSING_ENCODING=101
+WAR_SPACE_VALUE=102
+ERR_NOT_STANDALONE=103
+ERR_ENTITY_PROCESSING=104
+ERR_NOTATION_PROCESSING=105
+WAR_NS_COLUMN=106
+WAR_ENTITY_REDEFINED=107
+ERR_UNKNOWN_VERSION=108
+ERR_VERSION_MISMATCH=109
+ERR_NAME_TOO_LONG=110
+ERR_USER_STOP=111
+NS_ERR_XML_NAMESPACE=200
+NS_ERR_UNDEFINED_NAMESPACE=201
+NS_ERR_QNAME=202
+NS_ERR_ATTRIBUTE_REDEFINED=203
+NS_ERR_EMPTY=204
+NS_ERR_COLON=205
+DTD_ATTRIBUTE_DEFAULT=500
+DTD_ATTRIBUTE_REDEFINED=501
+DTD_ATTRIBUTE_VALUE=502
+DTD_CONTENT_ERROR=503
+DTD_CONTENT_MODEL=504
+DTD_CONTENT_NOT_DETERMINIST=505
+DTD_DIFFERENT_PREFIX=506
+DTD_ELEM_DEFAULT_NAMESPACE=507
+DTD_ELEM_NAMESPACE=508
+DTD_ELEM_REDEFINED=509
+DTD_EMPTY_NOTATION=510
+DTD_ENTITY_TYPE=511
+DTD_ID_FIXED=512
+DTD_ID_REDEFINED=513
+DTD_ID_SUBSET=514
+DTD_INVALID_CHILD=515
+DTD_INVALID_DEFAULT=516
+DTD_LOAD_ERROR=517
+DTD_MISSING_ATTRIBUTE=518
+DTD_MIXED_CORRUPT=519
+DTD_MULTIPLE_ID=520
+DTD_NO_DOC=521
+DTD_NO_DTD=522
+DTD_NO_ELEM_NAME=523
+DTD_NO_PREFIX=524
+DTD_NO_ROOT=525
+DTD_NOTATION_REDEFINED=526
+DTD_NOTATION_VALUE=527
+DTD_NOT_EMPTY=528
+DTD_NOT_PCDATA=529
+DTD_NOT_STANDALONE=530
+DTD_ROOT_NAME=531
+DTD_STANDALONE_WHITE_SPACE=532
+DTD_UNKNOWN_ATTRIBUTE=533
+DTD_UNKNOWN_ELEM=534
+DTD_UNKNOWN_ENTITY=535
+DTD_UNKNOWN_ID=536
+DTD_UNKNOWN_NOTATION=537
+DTD_STANDALONE_DEFAULTED=538
+DTD_XMLID_VALUE=539
+DTD_XMLID_TYPE=540
+DTD_DUP_TOKEN=541
+HTML_STRUCURE_ERROR=800
+HTML_UNKNOWN_TAG=801
+RNGP_ANYNAME_ATTR_ANCESTOR=1000
+RNGP_ATTR_CONFLICT=1001
+RNGP_ATTRIBUTE_CHILDREN=1002
+""",
+u"""\
+RNGP_ATTRIBUTE_CONTENT=1003
+RNGP_ATTRIBUTE_EMPTY=1004
+RNGP_ATTRIBUTE_NOOP=1005
+RNGP_CHOICE_CONTENT=1006
+RNGP_CHOICE_EMPTY=1007
+RNGP_CREATE_FAILURE=1008
+RNGP_DATA_CONTENT=1009
+RNGP_DEF_CHOICE_AND_INTERLEAVE=1010
+RNGP_DEFINE_CREATE_FAILED=1011
+RNGP_DEFINE_EMPTY=1012
+RNGP_DEFINE_MISSING=1013
+RNGP_DEFINE_NAME_MISSING=1014
+RNGP_ELEM_CONTENT_EMPTY=1015
+RNGP_ELEM_CONTENT_ERROR=1016
+RNGP_ELEMENT_EMPTY=1017
+RNGP_ELEMENT_CONTENT=1018
+RNGP_ELEMENT_NAME=1019
+RNGP_ELEMENT_NO_CONTENT=1020
+RNGP_ELEM_TEXT_CONFLICT=1021
+RNGP_EMPTY=1022
+RNGP_EMPTY_CONSTRUCT=1023
+RNGP_EMPTY_CONTENT=1024
+RNGP_EMPTY_NOT_EMPTY=1025
+RNGP_ERROR_TYPE_LIB=1026
+RNGP_EXCEPT_EMPTY=1027
+RNGP_EXCEPT_MISSING=1028
+RNGP_EXCEPT_MULTIPLE=1029
+RNGP_EXCEPT_NO_CONTENT=1030
+RNGP_EXTERNALREF_EMTPY=1031
+RNGP_EXTERNAL_REF_FAILURE=1032
+RNGP_EXTERNALREF_RECURSE=1033
+RNGP_FORBIDDEN_ATTRIBUTE=1034
+RNGP_FOREIGN_ELEMENT=1035
+RNGP_GRAMMAR_CONTENT=1036
+RNGP_GRAMMAR_EMPTY=1037
+RNGP_GRAMMAR_MISSING=1038
+RNGP_GRAMMAR_NO_START=1039
+RNGP_GROUP_ATTR_CONFLICT=1040
+RNGP_HREF_ERROR=1041
+RNGP_INCLUDE_EMPTY=1042
+RNGP_INCLUDE_FAILURE=1043
+RNGP_INCLUDE_RECURSE=1044
+RNGP_INTERLEAVE_ADD=1045
+RNGP_INTERLEAVE_CREATE_FAILED=1046
+RNGP_INTERLEAVE_EMPTY=1047
+RNGP_INTERLEAVE_NO_CONTENT=1048
+RNGP_INVALID_DEFINE_NAME=1049
+RNGP_INVALID_URI=1050
+RNGP_INVALID_VALUE=1051
+RNGP_MISSING_HREF=1052
+RNGP_NAME_MISSING=1053
+RNGP_NEED_COMBINE=1054
+RNGP_NOTALLOWED_NOT_EMPTY=1055
+RNGP_NSNAME_ATTR_ANCESTOR=1056
+RNGP_NSNAME_NO_NS=1057
+RNGP_PARAM_FORBIDDEN=1058
+RNGP_PARAM_NAME_MISSING=1059
+RNGP_PARENTREF_CREATE_FAILED=1060
+RNGP_PARENTREF_NAME_INVALID=1061
+RNGP_PARENTREF_NO_NAME=1062
+RNGP_PARENTREF_NO_PARENT=1063
+RNGP_PARENTREF_NOT_EMPTY=1064
+RNGP_PARSE_ERROR=1065
+RNGP_PAT_ANYNAME_EXCEPT_ANYNAME=1066
+RNGP_PAT_ATTR_ATTR=1067
+RNGP_PAT_ATTR_ELEM=1068
+RNGP_PAT_DATA_EXCEPT_ATTR=1069
+RNGP_PAT_DATA_EXCEPT_ELEM=1070
+RNGP_PAT_DATA_EXCEPT_EMPTY=1071
+RNGP_PAT_DATA_EXCEPT_GROUP=1072
+RNGP_PAT_DATA_EXCEPT_INTERLEAVE=1073
+RNGP_PAT_DATA_EXCEPT_LIST=1074
+""",
+u"""\
+RNGP_PAT_DATA_EXCEPT_ONEMORE=1075
+RNGP_PAT_DATA_EXCEPT_REF=1076
+RNGP_PAT_DATA_EXCEPT_TEXT=1077
+RNGP_PAT_LIST_ATTR=1078
+RNGP_PAT_LIST_ELEM=1079
+RNGP_PAT_LIST_INTERLEAVE=1080
+RNGP_PAT_LIST_LIST=1081
+RNGP_PAT_LIST_REF=1082
+RNGP_PAT_LIST_TEXT=1083
+RNGP_PAT_NSNAME_EXCEPT_ANYNAME=1084
+RNGP_PAT_NSNAME_EXCEPT_NSNAME=1085
+RNGP_PAT_ONEMORE_GROUP_ATTR=1086
+RNGP_PAT_ONEMORE_INTERLEAVE_ATTR=1087
+RNGP_PAT_START_ATTR=1088
+RNGP_PAT_START_DATA=1089
+RNGP_PAT_START_EMPTY=1090
+RNGP_PAT_START_GROUP=1091
+RNGP_PAT_START_INTERLEAVE=1092
+RNGP_PAT_START_LIST=1093
+RNGP_PAT_START_ONEMORE=1094
+RNGP_PAT_START_TEXT=1095
+RNGP_PAT_START_VALUE=1096
+RNGP_PREFIX_UNDEFINED=1097
+RNGP_REF_CREATE_FAILED=1098
+RNGP_REF_CYCLE=1099
+RNGP_REF_NAME_INVALID=1100
+RNGP_REF_NO_DEF=1101
+RNGP_REF_NO_NAME=1102
+RNGP_REF_NOT_EMPTY=1103
+RNGP_START_CHOICE_AND_INTERLEAVE=1104
+RNGP_START_CONTENT=1105
+RNGP_START_EMPTY=1106
+RNGP_START_MISSING=1107
+RNGP_TEXT_EXPECTED=1108
+RNGP_TEXT_HAS_CHILD=1109
+RNGP_TYPE_MISSING=1110
+RNGP_TYPE_NOT_FOUND=1111
+RNGP_TYPE_VALUE=1112
+RNGP_UNKNOWN_ATTRIBUTE=1113
+RNGP_UNKNOWN_COMBINE=1114
+RNGP_UNKNOWN_CONSTRUCT=1115
+RNGP_UNKNOWN_TYPE_LIB=1116
+RNGP_URI_FRAGMENT=1117
+RNGP_URI_NOT_ABSOLUTE=1118
+RNGP_VALUE_EMPTY=1119
+RNGP_VALUE_NO_CONTENT=1120
+RNGP_XMLNS_NAME=1121
+RNGP_XML_NS=1122
+XPATH_EXPRESSION_OK=1200
+XPATH_NUMBER_ERROR=1201
+XPATH_UNFINISHED_LITERAL_ERROR=1202
+XPATH_START_LITERAL_ERROR=1203
+XPATH_VARIABLE_REF_ERROR=1204
+XPATH_UNDEF_VARIABLE_ERROR=1205
+XPATH_INVALID_PREDICATE_ERROR=1206
+XPATH_EXPR_ERROR=1207
+XPATH_UNCLOSED_ERROR=1208
+XPATH_UNKNOWN_FUNC_ERROR=1209
+XPATH_INVALID_OPERAND=1210
+XPATH_INVALID_TYPE=1211
+XPATH_INVALID_ARITY=1212
+XPATH_INVALID_CTXT_SIZE=1213
+XPATH_INVALID_CTXT_POSITION=1214
+XPATH_MEMORY_ERROR=1215
+XPTR_SYNTAX_ERROR=1216
+XPTR_RESOURCE_ERROR=1217
+XPTR_SUB_RESOURCE_ERROR=1218
+XPATH_UNDEF_PREFIX_ERROR=1219
+XPATH_ENCODING_ERROR=1220
+XPATH_INVALID_CHAR_ERROR=1221
+TREE_INVALID_HEX=1300
+TREE_INVALID_DEC=1301
+TREE_UNTERMINATED_ENTITY=1302
+""",
+u"""\
+TREE_NOT_UTF8=1303
+SAVE_NOT_UTF8=1400
+SAVE_CHAR_INVALID=1401
+SAVE_NO_DOCTYPE=1402
+SAVE_UNKNOWN_ENCODING=1403
+REGEXP_COMPILE_ERROR=1450
+IO_UNKNOWN=1500
+IO_EACCES=1501
+IO_EAGAIN=1502
+IO_EBADF=1503
+IO_EBADMSG=1504
+IO_EBUSY=1505
+IO_ECANCELED=1506
+IO_ECHILD=1507
+IO_EDEADLK=1508
+IO_EDOM=1509
+IO_EEXIST=1510
+IO_EFAULT=1511
+IO_EFBIG=1512
+IO_EINPROGRESS=1513
+IO_EINTR=1514
+IO_EINVAL=1515
+IO_EIO=1516
+IO_EISDIR=1517
+IO_EMFILE=1518
+IO_EMLINK=1519
+IO_EMSGSIZE=1520
+IO_ENAMETOOLONG=1521
+IO_ENFILE=1522
+IO_ENODEV=1523
+IO_ENOENT=1524
+IO_ENOEXEC=1525
+IO_ENOLCK=1526
+IO_ENOMEM=1527
+IO_ENOSPC=1528
+IO_ENOSYS=1529
+IO_ENOTDIR=1530
+IO_ENOTEMPTY=1531
+IO_ENOTSUP=1532
+IO_ENOTTY=1533
+IO_ENXIO=1534
+IO_EPERM=1535
+IO_EPIPE=1536
+IO_ERANGE=1537
+IO_EROFS=1538
+IO_ESPIPE=1539
+IO_ESRCH=1540
+IO_ETIMEDOUT=1541
+IO_EXDEV=1542
+IO_NETWORK_ATTEMPT=1543
+IO_ENCODER=1544
+IO_FLUSH=1545
+IO_WRITE=1546
+IO_NO_INPUT=1547
+IO_BUFFER_FULL=1548
+IO_LOAD_ERROR=1549
+IO_ENOTSOCK=1550
+IO_EISCONN=1551
+IO_ECONNREFUSED=1552
+IO_ENETUNREACH=1553
+IO_EADDRINUSE=1554
+IO_EALREADY=1555
+IO_EAFNOSUPPORT=1556
+XINCLUDE_RECURSION=1600
+XINCLUDE_PARSE_VALUE=1601
+XINCLUDE_ENTITY_DEF_MISMATCH=1602
+XINCLUDE_NO_HREF=1603
+XINCLUDE_NO_FALLBACK=1604
+XINCLUDE_HREF_URI=1605
+XINCLUDE_TEXT_FRAGMENT=1606
+XINCLUDE_TEXT_DOCUMENT=1607
+XINCLUDE_INVALID_CHAR=1608
+XINCLUDE_BUILD_FAILED=1609
+XINCLUDE_UNKNOWN_ENCODING=1610
+XINCLUDE_MULTIPLE_ROOT=1611
+XINCLUDE_XPTR_FAILED=1612
+XINCLUDE_XPTR_RESULT=1613
+XINCLUDE_INCLUDE_IN_INCLUDE=1614
+XINCLUDE_FALLBACKS_IN_INCLUDE=1615
+XINCLUDE_FALLBACK_NOT_IN_INCLUDE=1616
+XINCLUDE_DEPRECATED_NS=1617
+XINCLUDE_FRAGMENT_ID=1618
+CATALOG_MISSING_ATTR=1650
+CATALOG_ENTRY_BROKEN=1651
+CATALOG_PREFER_VALUE=1652
+CATALOG_NOT_CATALOG=1653
+CATALOG_RECURSION=1654
+SCHEMAP_PREFIX_UNDEFINED=1700
+SCHEMAP_ATTRFORMDEFAULT_VALUE=1701
+SCHEMAP_ATTRGRP_NONAME_NOREF=1702
+SCHEMAP_ATTR_NONAME_NOREF=1703
+SCHEMAP_COMPLEXTYPE_NONAME_NOREF=1704
+SCHEMAP_ELEMFORMDEFAULT_VALUE=1705
+SCHEMAP_ELEM_NONAME_NOREF=1706
+""",
+u"""\
+SCHEMAP_EXTENSION_NO_BASE=1707
+SCHEMAP_FACET_NO_VALUE=1708
+SCHEMAP_FAILED_BUILD_IMPORT=1709
+SCHEMAP_GROUP_NONAME_NOREF=1710
+SCHEMAP_IMPORT_NAMESPACE_NOT_URI=1711
+SCHEMAP_IMPORT_REDEFINE_NSNAME=1712
+SCHEMAP_IMPORT_SCHEMA_NOT_URI=1713
+SCHEMAP_INVALID_BOOLEAN=1714
+SCHEMAP_INVALID_ENUM=1715
+SCHEMAP_INVALID_FACET=1716
+SCHEMAP_INVALID_FACET_VALUE=1717
+SCHEMAP_INVALID_MAXOCCURS=1718
+SCHEMAP_INVALID_MINOCCURS=1719
+SCHEMAP_INVALID_REF_AND_SUBTYPE=1720
+SCHEMAP_INVALID_WHITE_SPACE=1721
+SCHEMAP_NOATTR_NOREF=1722
+SCHEMAP_NOTATION_NO_NAME=1723
+SCHEMAP_NOTYPE_NOREF=1724
+SCHEMAP_REF_AND_SUBTYPE=1725
+SCHEMAP_RESTRICTION_NONAME_NOREF=1726
+SCHEMAP_SIMPLETYPE_NONAME=1727
+SCHEMAP_TYPE_AND_SUBTYPE=1728
+SCHEMAP_UNKNOWN_ALL_CHILD=1729
+SCHEMAP_UNKNOWN_ANYATTRIBUTE_CHILD=1730
+SCHEMAP_UNKNOWN_ATTR_CHILD=1731
+SCHEMAP_UNKNOWN_ATTRGRP_CHILD=1732
+SCHEMAP_UNKNOWN_ATTRIBUTE_GROUP=1733
+SCHEMAP_UNKNOWN_BASE_TYPE=1734
+SCHEMAP_UNKNOWN_CHOICE_CHILD=1735
+SCHEMAP_UNKNOWN_COMPLEXCONTENT_CHILD=1736
+SCHEMAP_UNKNOWN_COMPLEXTYPE_CHILD=1737
+SCHEMAP_UNKNOWN_ELEM_CHILD=1738
+SCHEMAP_UNKNOWN_EXTENSION_CHILD=1739
+SCHEMAP_UNKNOWN_FACET_CHILD=1740
+SCHEMAP_UNKNOWN_FACET_TYPE=1741
+SCHEMAP_UNKNOWN_GROUP_CHILD=1742
+SCHEMAP_UNKNOWN_IMPORT_CHILD=1743
+SCHEMAP_UNKNOWN_LIST_CHILD=1744
+SCHEMAP_UNKNOWN_NOTATION_CHILD=1745
+SCHEMAP_UNKNOWN_PROCESSCONTENT_CHILD=1746
+SCHEMAP_UNKNOWN_REF=1747
+SCHEMAP_UNKNOWN_RESTRICTION_CHILD=1748
+SCHEMAP_UNKNOWN_SCHEMAS_CHILD=1749
+SCHEMAP_UNKNOWN_SEQUENCE_CHILD=1750
+SCHEMAP_UNKNOWN_SIMPLECONTENT_CHILD=1751
+SCHEMAP_UNKNOWN_SIMPLETYPE_CHILD=1752
+SCHEMAP_UNKNOWN_TYPE=1753
+SCHEMAP_UNKNOWN_UNION_CHILD=1754
+SCHEMAP_ELEM_DEFAULT_FIXED=1755
+SCHEMAP_REGEXP_INVALID=1756
+SCHEMAP_FAILED_LOAD=1757
+SCHEMAP_NOTHING_TO_PARSE=1758
+SCHEMAP_NOROOT=1759
+SCHEMAP_REDEFINED_GROUP=1760
+SCHEMAP_REDEFINED_TYPE=1761
+SCHEMAP_REDEFINED_ELEMENT=1762
+SCHEMAP_REDEFINED_ATTRGROUP=1763
+SCHEMAP_REDEFINED_ATTR=1764
+SCHEMAP_REDEFINED_NOTATION=1765
+SCHEMAP_FAILED_PARSE=1766
+SCHEMAP_UNKNOWN_PREFIX=1767
+""",
+u"""\
+SCHEMAP_DEF_AND_PREFIX=1768
+SCHEMAP_UNKNOWN_INCLUDE_CHILD=1769
+SCHEMAP_INCLUDE_SCHEMA_NOT_URI=1770
+SCHEMAP_INCLUDE_SCHEMA_NO_URI=1771
+SCHEMAP_NOT_SCHEMA=1772
+SCHEMAP_UNKNOWN_MEMBER_TYPE=1773
+SCHEMAP_INVALID_ATTR_USE=1774
+SCHEMAP_RECURSIVE=1775
+SCHEMAP_SUPERNUMEROUS_LIST_ITEM_TYPE=1776
+SCHEMAP_INVALID_ATTR_COMBINATION=1777
+SCHEMAP_INVALID_ATTR_INLINE_COMBINATION=1778
+SCHEMAP_MISSING_SIMPLETYPE_CHILD=1779
+SCHEMAP_INVALID_ATTR_NAME=1780
+SCHEMAP_REF_AND_CONTENT=1781
+SCHEMAP_CT_PROPS_CORRECT_1=1782
+SCHEMAP_CT_PROPS_CORRECT_2=1783
+SCHEMAP_CT_PROPS_CORRECT_3=1784
+SCHEMAP_CT_PROPS_CORRECT_4=1785
+SCHEMAP_CT_PROPS_CORRECT_5=1786
+SCHEMAP_DERIVATION_OK_RESTRICTION_1=1787
+SCHEMAP_DERIVATION_OK_RESTRICTION_2_1_1=1788
+SCHEMAP_DERIVATION_OK_RESTRICTION_2_1_2=1789
+SCHEMAP_DERIVATION_OK_RESTRICTION_2_2=1790
+SCHEMAP_DERIVATION_OK_RESTRICTION_3=1791
+SCHEMAP_WILDCARD_INVALID_NS_MEMBER=1792
+SCHEMAP_INTERSECTION_NOT_EXPRESSIBLE=1793
+SCHEMAP_UNION_NOT_EXPRESSIBLE=1794
+SCHEMAP_SRC_IMPORT_3_1=1795
+SCHEMAP_SRC_IMPORT_3_2=1796
+SCHEMAP_DERIVATION_OK_RESTRICTION_4_1=1797
+SCHEMAP_DERIVATION_OK_RESTRICTION_4_2=1798
+SCHEMAP_DERIVATION_OK_RESTRICTION_4_3=1799
+SCHEMAP_COS_CT_EXTENDS_1_3=1800
+SCHEMAV_NOROOT=1801
+SCHEMAV_UNDECLAREDELEM=1802
+SCHEMAV_NOTTOPLEVEL=1803
+SCHEMAV_MISSING=1804
+SCHEMAV_WRONGELEM=1805
+SCHEMAV_NOTYPE=1806
+SCHEMAV_NOROLLBACK=1807
+SCHEMAV_ISABSTRACT=1808
+SCHEMAV_NOTEMPTY=1809
+SCHEMAV_ELEMCONT=1810
+SCHEMAV_HAVEDEFAULT=1811
+SCHEMAV_NOTNILLABLE=1812
+SCHEMAV_EXTRACONTENT=1813
+SCHEMAV_INVALIDATTR=1814
+SCHEMAV_INVALIDELEM=1815
+SCHEMAV_NOTDETERMINIST=1816
+SCHEMAV_CONSTRUCT=1817
+SCHEMAV_INTERNAL=1818
+SCHEMAV_NOTSIMPLE=1819
+SCHEMAV_ATTRUNKNOWN=1820
+SCHEMAV_ATTRINVALID=1821
+SCHEMAV_VALUE=1822
+SCHEMAV_FACET=1823
+SCHEMAV_CVC_DATATYPE_VALID_1_2_1=1824
+SCHEMAV_CVC_DATATYPE_VALID_1_2_2=1825
+SCHEMAV_CVC_DATATYPE_VALID_1_2_3=1826
+SCHEMAV_CVC_TYPE_3_1_1=1827
+SCHEMAV_CVC_TYPE_3_1_2=1828
+SCHEMAV_CVC_FACET_VALID=1829
+SCHEMAV_CVC_LENGTH_VALID=1830
+""",
+u"""\
+SCHEMAV_CVC_MINLENGTH_VALID=1831
+SCHEMAV_CVC_MAXLENGTH_VALID=1832
+SCHEMAV_CVC_MININCLUSIVE_VALID=1833
+SCHEMAV_CVC_MAXINCLUSIVE_VALID=1834
+SCHEMAV_CVC_MINEXCLUSIVE_VALID=1835
+SCHEMAV_CVC_MAXEXCLUSIVE_VALID=1836
+SCHEMAV_CVC_TOTALDIGITS_VALID=1837
+SCHEMAV_CVC_FRACTIONDIGITS_VALID=1838
+SCHEMAV_CVC_PATTERN_VALID=1839
+SCHEMAV_CVC_ENUMERATION_VALID=1840
+SCHEMAV_CVC_COMPLEX_TYPE_2_1=1841
+SCHEMAV_CVC_COMPLEX_TYPE_2_2=1842
+SCHEMAV_CVC_COMPLEX_TYPE_2_3=1843
+SCHEMAV_CVC_COMPLEX_TYPE_2_4=1844
+SCHEMAV_CVC_ELT_1=1845
+SCHEMAV_CVC_ELT_2=1846
+SCHEMAV_CVC_ELT_3_1=1847
+SCHEMAV_CVC_ELT_3_2_1=1848
+SCHEMAV_CVC_ELT_3_2_2=1849
+SCHEMAV_CVC_ELT_4_1=1850
+SCHEMAV_CVC_ELT_4_2=1851
+SCHEMAV_CVC_ELT_4_3=1852
+SCHEMAV_CVC_ELT_5_1_1=1853
+SCHEMAV_CVC_ELT_5_1_2=1854
+SCHEMAV_CVC_ELT_5_2_1=1855
+SCHEMAV_CVC_ELT_5_2_2_1=1856
+SCHEMAV_CVC_ELT_5_2_2_2_1=1857
+SCHEMAV_CVC_ELT_5_2_2_2_2=1858
+SCHEMAV_CVC_ELT_6=1859
+SCHEMAV_CVC_ELT_7=1860
+SCHEMAV_CVC_ATTRIBUTE_1=1861
+SCHEMAV_CVC_ATTRIBUTE_2=1862
+SCHEMAV_CVC_ATTRIBUTE_3=1863
+SCHEMAV_CVC_ATTRIBUTE_4=1864
+SCHEMAV_CVC_COMPLEX_TYPE_3_1=1865
+SCHEMAV_CVC_COMPLEX_TYPE_3_2_1=1866
+SCHEMAV_CVC_COMPLEX_TYPE_3_2_2=1867
+SCHEMAV_CVC_COMPLEX_TYPE_4=1868
+SCHEMAV_CVC_COMPLEX_TYPE_5_1=1869
+SCHEMAV_CVC_COMPLEX_TYPE_5_2=1870
+SCHEMAV_ELEMENT_CONTENT=1871
+SCHEMAV_DOCUMENT_ELEMENT_MISSING=1872
+SCHEMAV_CVC_COMPLEX_TYPE_1=1873
+SCHEMAV_CVC_AU=1874
+SCHEMAV_CVC_TYPE_1=1875
+SCHEMAV_CVC_TYPE_2=1876
+SCHEMAV_CVC_IDC=1877
+SCHEMAV_CVC_WILDCARD=1878
+SCHEMAV_MISC=1879
+XPTR_UNKNOWN_SCHEME=1900
+XPTR_CHILDSEQ_START=1901
+XPTR_EVAL_FAILED=1902
+XPTR_EXTRA_OBJECTS=1903
+C14N_CREATE_CTXT=1950
+C14N_REQUIRES_UTF8=1951
+C14N_CREATE_STACK=1952
+C14N_INVALID_NODE=1953
+C14N_UNKNOW_NODE=1954
+C14N_RELATIVE_NAMESPACE=1955
+FTP_PASV_ANSWER=2000
+FTP_EPSV_ANSWER=2001
+FTP_ACCNT=2002
+FTP_URL_SYNTAX=2003
+HTTP_URL_SYNTAX=2020
+HTTP_USE_IP=2021
+HTTP_UNKNOWN_HOST=2022
+SCHEMAP_SRC_SIMPLE_TYPE_1=3000
+SCHEMAP_SRC_SIMPLE_TYPE_2=3001
+SCHEMAP_SRC_SIMPLE_TYPE_3=3002
+SCHEMAP_SRC_SIMPLE_TYPE_4=3003
+""",
+u"""\
+SCHEMAP_SRC_RESOLVE=3004
+SCHEMAP_SRC_RESTRICTION_BASE_OR_SIMPLETYPE=3005
+SCHEMAP_SRC_LIST_ITEMTYPE_OR_SIMPLETYPE=3006
+SCHEMAP_SRC_UNION_MEMBERTYPES_OR_SIMPLETYPES=3007
+SCHEMAP_ST_PROPS_CORRECT_1=3008
+SCHEMAP_ST_PROPS_CORRECT_2=3009
+SCHEMAP_ST_PROPS_CORRECT_3=3010
+SCHEMAP_COS_ST_RESTRICTS_1_1=3011
+SCHEMAP_COS_ST_RESTRICTS_1_2=3012
+SCHEMAP_COS_ST_RESTRICTS_1_3_1=3013
+SCHEMAP_COS_ST_RESTRICTS_1_3_2=3014
+SCHEMAP_COS_ST_RESTRICTS_2_1=3015
+SCHEMAP_COS_ST_RESTRICTS_2_3_1_1=3016
+SCHEMAP_COS_ST_RESTRICTS_2_3_1_2=3017
+SCHEMAP_COS_ST_RESTRICTS_2_3_2_1=3018
+SCHEMAP_COS_ST_RESTRICTS_2_3_2_2=3019
+SCHEMAP_COS_ST_RESTRICTS_2_3_2_3=3020
+SCHEMAP_COS_ST_RESTRICTS_2_3_2_4=3021
+SCHEMAP_COS_ST_RESTRICTS_2_3_2_5=3022
+SCHEMAP_COS_ST_RESTRICTS_3_1=3023
+SCHEMAP_COS_ST_RESTRICTS_3_3_1=3024
+SCHEMAP_COS_ST_RESTRICTS_3_3_1_2=3025
+SCHEMAP_COS_ST_RESTRICTS_3_3_2_2=3026
+SCHEMAP_COS_ST_RESTRICTS_3_3_2_1=3027
+SCHEMAP_COS_ST_RESTRICTS_3_3_2_3=3028
+SCHEMAP_COS_ST_RESTRICTS_3_3_2_4=3029
+SCHEMAP_COS_ST_RESTRICTS_3_3_2_5=3030
+SCHEMAP_COS_ST_DERIVED_OK_2_1=3031
+SCHEMAP_COS_ST_DERIVED_OK_2_2=3032
+SCHEMAP_S4S_ELEM_NOT_ALLOWED=3033
+SCHEMAP_S4S_ELEM_MISSING=3034
+SCHEMAP_S4S_ATTR_NOT_ALLOWED=3035
+SCHEMAP_S4S_ATTR_MISSING=3036
+SCHEMAP_S4S_ATTR_INVALID_VALUE=3037
+SCHEMAP_SRC_ELEMENT_1=3038
+SCHEMAP_SRC_ELEMENT_2_1=3039
+SCHEMAP_SRC_ELEMENT_2_2=3040
+SCHEMAP_SRC_ELEMENT_3=3041
+SCHEMAP_P_PROPS_CORRECT_1=3042
+SCHEMAP_P_PROPS_CORRECT_2_1=3043
+SCHEMAP_P_PROPS_CORRECT_2_2=3044
+SCHEMAP_E_PROPS_CORRECT_2=3045
+SCHEMAP_E_PROPS_CORRECT_3=3046
+SCHEMAP_E_PROPS_CORRECT_4=3047
+SCHEMAP_E_PROPS_CORRECT_5=3048
+SCHEMAP_E_PROPS_CORRECT_6=3049
+SCHEMAP_SRC_INCLUDE=3050
+SCHEMAP_SRC_ATTRIBUTE_1=3051
+SCHEMAP_SRC_ATTRIBUTE_2=3052
+SCHEMAP_SRC_ATTRIBUTE_3_1=3053
+SCHEMAP_SRC_ATTRIBUTE_3_2=3054
+SCHEMAP_SRC_ATTRIBUTE_4=3055
+SCHEMAP_NO_XMLNS=3056
+SCHEMAP_NO_XSI=3057
+SCHEMAP_COS_VALID_DEFAULT_1=3058
+SCHEMAP_COS_VALID_DEFAULT_2_1=3059
+SCHEMAP_COS_VALID_DEFAULT_2_2_1=3060
+SCHEMAP_COS_VALID_DEFAULT_2_2_2=3061
+""",
+u"""\
+SCHEMAP_CVC_SIMPLE_TYPE=3062
+SCHEMAP_COS_CT_EXTENDS_1_1=3063
+SCHEMAP_SRC_IMPORT_1_1=3064
+SCHEMAP_SRC_IMPORT_1_2=3065
+SCHEMAP_SRC_IMPORT_2=3066
+SCHEMAP_SRC_IMPORT_2_1=3067
+SCHEMAP_SRC_IMPORT_2_2=3068
+SCHEMAP_INTERNAL=3069
+SCHEMAP_NOT_DETERMINISTIC=3070
+SCHEMAP_SRC_ATTRIBUTE_GROUP_1=3071
+SCHEMAP_SRC_ATTRIBUTE_GROUP_2=3072
+SCHEMAP_SRC_ATTRIBUTE_GROUP_3=3073
+SCHEMAP_MG_PROPS_CORRECT_1=3074
+SCHEMAP_MG_PROPS_CORRECT_2=3075
+SCHEMAP_SRC_CT_1=3076
+SCHEMAP_DERIVATION_OK_RESTRICTION_2_1_3=3077
+SCHEMAP_AU_PROPS_CORRECT_2=3078
+SCHEMAP_A_PROPS_CORRECT_2=3079
+SCHEMAP_C_PROPS_CORRECT=3080
+SCHEMAP_SRC_REDEFINE=3081
+SCHEMAP_SRC_IMPORT=3082
+SCHEMAP_WARN_SKIP_SCHEMA=3083
+SCHEMAP_WARN_UNLOCATED_SCHEMA=3084
+SCHEMAP_WARN_ATTR_REDECL_PROH=3085
+SCHEMAP_WARN_ATTR_POINTLESS_PROH=3086
+SCHEMAP_AG_PROPS_CORRECT=3087
+SCHEMAP_COS_CT_EXTENDS_1_2=3088
+SCHEMAP_AU_PROPS_CORRECT=3089
+SCHEMAP_A_PROPS_CORRECT_3=3090
+SCHEMAP_COS_ALL_LIMITED=3091
+SCHEMATRONV_ASSERT=4000
+SCHEMATRONV_REPORT=4001
+MODULE_OPEN=4900
+MODULE_CLOSE=4901
+CHECK_FOUND_ELEMENT=5000
+CHECK_FOUND_ATTRIBUTE=5001
+CHECK_FOUND_TEXT=5002
+CHECK_FOUND_CDATA=5003
+CHECK_FOUND_ENTITYREF=5004
+CHECK_FOUND_ENTITY=5005
+CHECK_FOUND_PI=5006
+CHECK_FOUND_COMMENT=5007
+CHECK_FOUND_DOCTYPE=5008
+CHECK_FOUND_FRAGMENT=5009
+CHECK_FOUND_NOTATION=5010
+CHECK_UNKNOWN_NODE=5011
+CHECK_ENTITY_TYPE=5012
+CHECK_NO_PARENT=5013
+CHECK_NO_DOC=5014
+CHECK_NO_NAME=5015
+CHECK_NO_ELEM=5016
+CHECK_WRONG_DOC=5017
+CHECK_NO_PREV=5018
+CHECK_WRONG_PREV=5019
+CHECK_NO_NEXT=5020
+CHECK_WRONG_NEXT=5021
+CHECK_NOT_DTD=5022
+CHECK_NOT_ATTR=5023
+CHECK_NOT_ATTR_DECL=5024
+CHECK_NOT_ELEM_DECL=5025
+CHECK_NOT_ENTITY_DECL=5026
+CHECK_NOT_NS_DECL=5027
+CHECK_NO_HREF=5028
+CHECK_WRONG_PARENT=5029
+CHECK_NS_SCOPE=5030
+CHECK_NS_ANCESTOR=5031
+CHECK_NOT_UTF8=5032
+CHECK_NO_DICT=5033
+CHECK_NOT_NCNAME=5034
+CHECK_OUTSIDE_DICT=5035
+CHECK_WRONG_NAME=5036
+CHECK_NAME_NOT_NULL=5037
+I18N_NO_NAME=6000
+I18N_NO_HANDLER=6001
+I18N_EXCESS_HANDLER=6002
+I18N_CONV_FAILED=6003
+""",
+u"""\
+I18N_NO_OUTPUT=6004
+BUF_OVERFLOW=7000
+""",)
+
+cdef object __RELAXNG_ERROR_TYPES = (u"""\
+RELAXNG_OK=0
+RELAXNG_ERR_MEMORY=1
+RELAXNG_ERR_TYPE=2
+RELAXNG_ERR_TYPEVAL=3
+RELAXNG_ERR_DUPID=4
+RELAXNG_ERR_TYPECMP=5
+RELAXNG_ERR_NOSTATE=6
+RELAXNG_ERR_NODEFINE=7
+RELAXNG_ERR_LISTEXTRA=8
+RELAXNG_ERR_LISTEMPTY=9
+RELAXNG_ERR_INTERNODATA=10
+RELAXNG_ERR_INTERSEQ=11
+RELAXNG_ERR_INTEREXTRA=12
+RELAXNG_ERR_ELEMNAME=13
+RELAXNG_ERR_ATTRNAME=14
+RELAXNG_ERR_ELEMNONS=15
+RELAXNG_ERR_ATTRNONS=16
+RELAXNG_ERR_ELEMWRONGNS=17
+RELAXNG_ERR_ATTRWRONGNS=18
+RELAXNG_ERR_ELEMEXTRANS=19
+RELAXNG_ERR_ATTREXTRANS=20
+RELAXNG_ERR_ELEMNOTEMPTY=21
+RELAXNG_ERR_NOELEM=22
+RELAXNG_ERR_NOTELEM=23
+RELAXNG_ERR_ATTRVALID=24
+RELAXNG_ERR_CONTENTVALID=25
+RELAXNG_ERR_EXTRACONTENT=26
+RELAXNG_ERR_INVALIDATTR=27
+RELAXNG_ERR_DATAELEM=28
+RELAXNG_ERR_VALELEM=29
+RELAXNG_ERR_LISTELEM=30
+RELAXNG_ERR_DATATYPE=31
+RELAXNG_ERR_VALUE=32
+RELAXNG_ERR_LIST=33
+RELAXNG_ERR_NOGRAMMAR=34
+RELAXNG_ERR_EXTRADATA=35
+RELAXNG_ERR_LACKDATA=36
+RELAXNG_ERR_INTERNAL=37
+RELAXNG_ERR_ELEMWRONG=38
+RELAXNG_ERR_TEXTWRONG=39
+""",)
+# --- END: GENERATED CONSTANTS ---
+
+__initErrorConstants()
diff --git a/lib/lxml/xmlid.pxi b/lib/lxml/xmlid.pxi
new file mode 100644
index 00000000..b5b5c64a
--- /dev/null
+++ b/lib/lxml/xmlid.pxi
@@ -0,0 +1,179 @@
+cdef object _find_id_attributes
+
+def XMLID(text, parser=None, *, base_url=None):
+    u"""XMLID(text, parser=None, base_url=None)
+
+    Parse ``text`` the same way XML() does and additionally collect all
+    elements that carry a non-empty 'id' attribute.
+
+    Returns a tuple (root node, ID dictionary).  The dictionary maps the
+    value of each 'id' attribute to the element that carries it.
+    """
+    cdef dict id_map = {}
+    global _find_id_attributes
+    if _find_id_attributes is None:
+        # compile the lookup expression only once, on first use
+        _find_id_attributes = XPath(u'//*[string(@id)]')
+
+    # ElementTree compatible implementation: parse and look for 'id' attributes
+    root = XML(text, parser, base_url=base_url)
+    for element in _find_id_attributes(root):
+        id_map[element.get(u'id')] = element
+    return root, id_map
+
+def XMLDTDID(text, parser=None, *, base_url=None):
+    u"""XMLDTDID(text, parser=None, base_url=None)
+
+    Parse the text and return a tuple (root node, ID dictionary).  The root
+    node is the one returned by the XML() function.  The dictionary maps the
+    values of ID attributes, as defined by the DTD, to the elements that
+    carry them.  If the parsed document has no ID table, a plain empty dict
+    is returned instead.
+
+    Note that you must not modify the XML tree if you use the ID dictionary.
+    The results are undefined.
+    """
+    cdef _Element root = XML(text, parser, base_url=base_url)
+    # xml:id spec compatible implementation: use DTD ID attributes from libxml2
+    if root._doc._c_doc.ids is not NULL:
+        return (root, _IDDict(root))
+    # libxml2 did not build an ID table for this document => no IDs
+    return (root, {})
+
+def parseid(source, parser=None, *, base_url=None):
+    u"""parseid(source, parser=None, base_url=None)
+
+    Parses the source into a tuple containing an ElementTree object and an
+    ID dictionary.  If no parser is provided as second argument, the default
+    parser is used.
+
+    Raises ValueError if the parsed document has no ID dictionary (the
+    ``_IDDict`` constructor rejects documents without an ID table).
+
+    Note that you must not modify the XML tree if you use the ID dictionary.
+    The results are undefined.
+    """
+    cdef _Document doc
+    doc = _parseDocument(source, parser, base_url)
+    return (_elementTreeFactory(doc, None), _IDDict(doc))
+
+cdef class _IDDict:
+    u"""IDDict(self, etree)
+    A dictionary-like proxy class that maps ID attributes to elements.
+
+    The dictionary must be instantiated with the root element of a parsed XML
+    document, otherwise the behaviour is undefined.  Elements and XML trees
+    that were created or modified 'by hand' are not supported.
+
+    The key and item lists are collected from the document's ID hash table
+    on first use and cached, so later changes are not reflected in them.
+    """
+    cdef _Document _doc
+    cdef object _keys   # cached list of ID names (None until first needed)
+    cdef object _items  # cached list of (ID name, element) tuples
+    def __cinit__(self, etree):
+        cdef _Document doc
+        doc = _documentOrRaise(etree)
+        if doc._c_doc.ids is NULL:
+            raise ValueError, u"No ID dictionary available."
+        self._doc = doc
+        self._keys  = None
+        self._items = None
+
+    def copy(self):
+        # a new proxy on the same document, with empty caches
+        return _IDDict(self._doc)
+
+    def __getitem__(self, id_name):
+        cdef tree.xmlHashTable* c_ids
+        cdef tree.xmlID* c_id
+        cdef xmlAttr* c_attr
+        c_ids = self._doc._c_doc.ids
+        id_utf = _utf8(id_name)
+        c_id = <tree.xmlID*>tree.xmlHashLookup(c_ids, _xcstr(id_utf))
+        if c_id is NULL:
+            raise KeyError, u"key not found."
+        c_attr = c_id.attr
+        if c_attr is NULL or c_attr.parent is NULL:
+            # the ID is registered, but no element carries it (anymore)
+            raise KeyError, u"ID attribute not found."
+        return _elementFactory(self._doc, c_attr.parent)
+
+    def get(self, id_name, default=None):
+        u"""Return the element for ``id_name``, or ``default`` if the ID is
+        not available (same contract as ``dict.get()``).
+        """
+        try:
+            return self[id_name]
+        except KeyError:
+            return default
+
+    def __contains__(self, id_name):
+        cdef tree.xmlID* c_id
+        id_utf = _utf8(id_name)
+        c_id = <tree.xmlID*>tree.xmlHashLookup(
+            self._doc._c_doc.ids, _xcstr(id_utf))
+        # apply the same conditions as __getitem__() and the key collector,
+        # so that "x in d" implies that "d[x]" succeeds
+        return (c_id is not NULL and c_id.attr is not NULL
+                and c_id.attr.parent is not NULL)
+
+    def has_key(self, id_name):
+        return id_name in self
+
+    def __repr__(self):
+        return repr(dict(self))
+
+    def keys(self):
+        if self._keys is None:
+            self._keys = self._build_keys()
+        # hand out a copy to protect the cache from modification
+        return self._keys[:]
+
+    def __iter__(self):
+        if self._keys is None:
+            self._keys = self._build_keys()
+        return iter(self._keys)
+
+    def iterkeys(self):
+        # return a real iterator; the proxy itself is only iterable
+        return iter(self)
+
+    def __len__(self):
+        if self._keys is None:
+            self._keys = self._build_keys()
+        return len(self._keys)
+
+    def items(self):
+        if self._items is None:
+            self._items = self._build_items()
+        # hand out a copy to protect the cache from modification
+        return self._items[:]
+
+    def iteritems(self):
+        if self._items is None:
+            self._items = self._build_items()
+        return iter(self._items)
+
+    def values(self):
+        if self._items is None:
+            self._items = self._build_items()
+        # items are (ID name, element) tuples
+        return [item[1] for item in self._items]
+
+    def itervalues(self):
+        return iter(self.values())
+
+    cdef object _build_keys(self):
+        # let libxml2 walk the ID hash table and collect the names
+        keys = []
+        tree.xmlHashScan(<tree.xmlHashTable*>self._doc._c_doc.ids,
+                         <tree.xmlHashScanner>_collectIdHashKeys, <python.PyObject*>keys)
+        return keys
+
+    cdef object _build_items(self):
+        # the callback needs the document to build element proxies, so pass
+        # both the result list and the document as scan context
+        items = []
+        context = (items, self._doc)
+        tree.xmlHashScan(<tree.xmlHashTable*>self._doc._c_doc.ids,
+                         <tree.xmlHashScanner>_collectIdHashItemList, <python.PyObject*>context)
+        return items
+
+cdef void _collectIdHashItemList(void* payload, void* context, xmlChar* name):
+    # collect elements from ID attribute hash table
+    #
+    # Hash scanner callback passed to tree.xmlHashScan() by
+    # _IDDict._build_items().  'payload' is the xmlID entry, 'name' its hash
+    # key and 'context' the (result list, document) tuple set up by the caller.
+    cdef list lst
+    c_id = <tree.xmlID*>payload
+    # skip entries that do not lead to an element
+    if c_id is NULL or c_id.attr is NULL or c_id.attr.parent is NULL:
+        return
+    lst, doc = <tuple>context
+    element = _elementFactory(doc, c_id.attr.parent)
+    lst.append( (funicode(name), element) )
+
+cdef void _collectIdHashKeys(void* payload, void* collect_list, xmlChar* name):
+    # Hash scanner callback passed to tree.xmlHashScan() by
+    # _IDDict._build_keys(): appends the decoded ID name to the Python list
+    # passed as 'collect_list'.  Entries that do not lead to an element are
+    # skipped, as in _collectIdHashItemList().
+    c_id = <tree.xmlID*>payload
+    if c_id is NULL or c_id.attr is NULL or c_id.attr.parent is NULL:
+        return
+    (<list>collect_list).append(funicode(name))
diff --git a/lib/lxml/xmlschema.pxi b/lib/lxml/xmlschema.pxi
new file mode 100644
index 00000000..ed61caec
--- /dev/null
+++ b/lib/lxml/xmlschema.pxi
@@ -0,0 +1,214 @@
+#  support for XMLSchema validation
+from lxml.includes cimport xmlschema
+
+class XMLSchemaError(LxmlError):
+    u"""Root of the XML Schema exception hierarchy.
+    """
+
+class XMLSchemaParseError(XMLSchemaError):
+    u"""Raised when a document cannot be parsed as XML Schema.
+    """
+
+class XMLSchemaValidateError(XMLSchemaError):
+    u"""Raised when validating an XML document with an XML Schema fails
+    with an error.
+    """
+
+################################################################################
+# XMLSchema
+
+# Compiled XPath expression that evaluates to true if the schema document
+# contains at least one xs:attribute declaration with a 'default' or 'fixed'
+# attribute.  XMLSchema.__init__() uses it to find out whether inserting
+# attribute defaults can have any effect at all.
+cdef XPath _check_for_default_attributes = XPath(
+    u"boolean(//xs:attribute[@default or @fixed][1])",
+    namespaces={u'xs': u'http://www.w3.org/2001/XMLSchema'})
+
+cdef class XMLSchema(_Validator):
+    u"""XMLSchema(self, etree=None, file=None, attribute_defaults=False)
+    Turn a document into an XML Schema validator.
+
+    Either pass a schema as Element or ElementTree, or pass a file or
+    filename through the ``file`` keyword argument.
+
+    Passing the ``attribute_defaults`` boolean option will make the
+    schema insert default/fixed attributes into validated documents.
+    """
+    cdef xmlschema.xmlSchema* _c_schema
+    # whether the schema declares any default/fixed attributes
+    cdef bint _has_default_attributes
+    # whether validation should insert default/fixed attributes
+    cdef bint _add_attribute_defaults
+    def __cinit__(self):
+        self._c_schema = NULL
+        self._has_default_attributes = True # play safe
+        self._add_attribute_defaults = False
+
+    def __init__(self, etree=None, *, file=None, attribute_defaults=False):
+        cdef _Document doc
+        cdef _Element root_node
+        cdef xmlDoc* fake_c_doc
+        cdef xmlNode* c_node
+        cdef xmlschema.xmlSchemaParserCtxt* parser_ctxt
+
+        self._add_attribute_defaults = attribute_defaults
+        _Validator.__init__(self)
+        fake_c_doc = NULL
+        if etree is not None:
+            # schema given as tree: parse it from an in-memory document
+            # NOTE(review): _fakeRootDoc() presumably provides a temporary
+            # document rooted at root_node - confirm against its definition
+            doc = _documentOrRaise(etree)
+            root_node = _rootNodeOrRaise(etree)
+            fake_c_doc = _fakeRootDoc(doc._c_doc, root_node._c_node)
+            parser_ctxt = xmlschema.xmlSchemaNewDocParserCtxt(fake_c_doc)
+        elif file is not None:
+            if _isString(file):
+                # file name: let libxml2 load the schema itself
+                doc = None
+                filename = _encodeFilename(file)
+                parser_ctxt = xmlschema.xmlSchemaNewParserCtxt(_cstr(filename))
+            else:
+                # anything else is parsed into a document first
+                doc = _parseDocument(file, None, None)
+                parser_ctxt = xmlschema.xmlSchemaNewDocParserCtxt(doc._c_doc)
+        else:
+            raise XMLSchemaParseError, u"No tree or file given"
+
+        if parser_ctxt is not NULL:
+            # collect parse errors in this validator's error log
+            xmlschema.xmlSchemaSetParserStructuredErrors(
+                parser_ctxt, _receiveError, <void*>self._error_log)
+            if doc is None:
+                with nogil:
+                    self._c_schema = xmlschema.xmlSchemaParse(parser_ctxt)
+            else:
+                # calling xmlSchemaParse on a schema with imports or
+                # includes will cause libxml2 to create an internal
+                # context for parsing, so push an implied context to route
+                # resolve requests to the document's parser
+                __GLOBAL_PARSER_CONTEXT.pushImpliedContextFromParser(doc._parser)
+                self._c_schema = xmlschema.xmlSchemaParse(parser_ctxt)
+                __GLOBAL_PARSER_CONTEXT.popImpliedContext()
+            xmlschema.xmlSchemaFreeParserCtxt(parser_ctxt)
+
+        # the temporary document is no longer needed after parsing
+        if fake_c_doc is not NULL:
+            _destroyFakeDoc(doc._c_doc, fake_c_doc)
+
+        # no schema => parsing failed (or no parser context could be created)
+        if self._c_schema is NULL:
+            raise XMLSchemaParseError(
+                self._error_log._buildExceptionMessage(
+                    u"Document is not valid XML Schema"),
+                self._error_log)
+
+        # when the schema was loaded from a file name, there is no document
+        # to inspect and the "play safe" default from __cinit__() stays active
+        if doc is not None:
+            self._has_default_attributes = _check_for_default_attributes(doc)
+        self._add_attribute_defaults = attribute_defaults and \
+                                       self._has_default_attributes
+
+    def __dealloc__(self):
+        xmlschema.xmlSchemaFree(self._c_schema)
+
+    def __call__(self, etree):
+        u"""__call__(self, etree)
+
+        Validate doc using XML Schema.
+
+        Returns true if document is valid, false if not.
+
+        Raises XMLSchemaValidateError if libxml2 reports an internal
+        validation error, and MemoryError if no validation context could
+        be created.
+        """
+        cdef xmlschema.xmlSchemaValidCtxt* valid_ctxt
+        cdef _Document doc
+        cdef _Element root_node
+        cdef xmlDoc* c_doc
+        cdef int ret
+
+        assert self._c_schema is not NULL, "Schema instance not initialised"
+        doc = _documentOrRaise(etree)
+        root_node = _rootNodeOrRaise(etree)
+
+        valid_ctxt = xmlschema.xmlSchemaNewValidCtxt(self._c_schema)
+        if valid_ctxt is NULL:
+            raise MemoryError()
+
+        # make sure the validation context is freed on all paths
+        try:
+            if self._add_attribute_defaults:
+                xmlschema.xmlSchemaSetValidOptions(
+                    valid_ctxt, xmlschema.XML_SCHEMA_VAL_VC_I_CREATE)
+
+            # start with a clean log that only holds errors of this run
+            self._error_log.clear()
+            xmlschema.xmlSchemaSetValidStructuredErrors(
+                valid_ctxt, _receiveError, <void*>self._error_log)
+
+            c_doc = _fakeRootDoc(doc._c_doc, root_node._c_node)
+            with nogil:
+                ret = xmlschema.xmlSchemaValidateDoc(valid_ctxt, c_doc)
+            _destroyFakeDoc(doc._c_doc, c_doc)
+        finally:
+            xmlschema.xmlSchemaFreeValidCtxt(valid_ctxt)
+
+        # -1: internal error, 0: valid, anything else: invalid
+        if ret == -1:
+            raise XMLSchemaValidateError(
+                u"Internal error in XML Schema validation.",
+                self._error_log)
+        if ret == 0:
+            return True
+        else:
+            return False
+
+    cdef _ParserSchemaValidationContext _newSaxValidator(
+            self, bint add_default_attributes):
+        # Create a validation context for this schema that can be plugged
+        # into a parser.  Default attributes are only requested if the schema
+        # declares any, and if either the caller or this schema asks for them.
+        cdef _ParserSchemaValidationContext context
+        context = _ParserSchemaValidationContext.__new__(_ParserSchemaValidationContext)
+        context._schema = self
+        context._add_default_attributes = (self._has_default_attributes and (
+            add_default_attributes or self._add_attribute_defaults))
+        return context
+
+@cython.final
+@cython.internal
+cdef class _ParserSchemaValidationContext:
+    # Validation state for running an XMLSchema against a parser's SAX
+    # events.  Instances are created by XMLSchema._newSaxValidator().
+    cdef XMLSchema _schema
+    cdef xmlschema.xmlSchemaValidCtxt* _valid_ctxt
+    cdef xmlschema.xmlSchemaSAXPlugStruct* _sax_plug
+    cdef bint _add_default_attributes
+    def __cinit__(self):
+        self._valid_ctxt = NULL
+        self._sax_plug = NULL
+        self._add_default_attributes = False
+
+    def __dealloc__(self):
+        # unplug from the parser before freeing the validation context
+        self.disconnect()
+        if self._valid_ctxt:
+            xmlschema.xmlSchemaFreeValidCtxt(self._valid_ctxt)
+
+    cdef _ParserSchemaValidationContext copy(self):
+        # a fresh, unconnected context for the same schema and settings
+        assert self._schema is not None, "_ParserSchemaValidationContext not initialised"
+        return self._schema._newSaxValidator(
+            self._add_default_attributes)
+
+    cdef void inject_default_attributes(self, xmlDoc* c_doc):
+        # we currently need to insert default attributes manually
+        # after parsing, as libxml2 does not support this at parse
+        # time
+        if self._add_default_attributes:
+            with nogil:
+                # the validation result is ignored here
+                xmlschema.xmlSchemaValidateDoc(self._valid_ctxt, c_doc)
+
+    cdef int connect(self, xmlparser.xmlParserCtxt* c_ctxt, _BaseErrorLog error_log) except -1:
+        # Plug schema validation into the SAX handlers of the given parser
+        # context.  The validation context is created on first use and
+        # reused afterwards.  Raises MemoryError if it cannot be created.
+        if self._valid_ctxt is NULL:
+            self._valid_ctxt = xmlschema.xmlSchemaNewValidCtxt(
+                self._schema._c_schema)
+            if self._valid_ctxt is NULL:
+                raise MemoryError()
+            if self._add_default_attributes:
+                xmlschema.xmlSchemaSetValidOptions(
+                    self._valid_ctxt, xmlschema.XML_SCHEMA_VAL_VC_I_CREATE)
+        if error_log is not None:
+            xmlschema.xmlSchemaSetValidStructuredErrors(
+                self._valid_ctxt, _receiveError, <void*>error_log)
+        self._sax_plug = xmlschema.xmlSchemaSAXPlug(
+            self._valid_ctxt, &c_ctxt.sax, &c_ctxt.userData)
+
+    cdef void disconnect(self):
+        # Undo connect(): unplug from the parser and stop reporting errors
+        # to the error log.  The validation context itself is kept.
+        if self._sax_plug is not NULL:
+            xmlschema.xmlSchemaSAXUnplug(self._sax_plug)
+            self._sax_plug = NULL
+        if self._valid_ctxt is not NULL:
+            xmlschema.xmlSchemaSetValidStructuredErrors(
+                self._valid_ctxt, NULL, NULL)
+
+    cdef bint isvalid(self):
+        # a context that was never connected has nothing to complain about
+        if self._valid_ctxt is NULL:
+            return 1 # valid
+        return xmlschema.xmlSchemaIsValid(self._valid_ctxt)
diff --git a/lib/lxml/xpath.pxi b/lib/lxml/xpath.pxi
new file mode 100644
index 00000000..8e71e28f
--- /dev/null
+++ b/lib/lxml/xpath.pxi
@@ -0,0 +1,506 @@
+# XPath evaluation
+
+class XPathSyntaxError(LxmlSyntaxError, XPathError):
+    u"""Raised when an XPath expression cannot be compiled.
+    """
+    pass
+
+################################################################################
+# XPath
+
+# libxml2 error types that are reported as XPath syntax errors; used to
+# filter the error log in _XPathEvaluatorBase._raise_parse_error()
+cdef object _XPATH_SYNTAX_ERRORS
+_XPATH_SYNTAX_ERRORS = (
+    xmlerror.XML_XPATH_NUMBER_ERROR,
+    xmlerror.XML_XPATH_UNFINISHED_LITERAL_ERROR,
+    xmlerror.XML_XPATH_VARIABLE_REF_ERROR,
+    xmlerror.XML_XPATH_INVALID_PREDICATE_ERROR,
+    xmlerror.XML_XPATH_UNCLOSED_ERROR,
+    xmlerror.XML_XPATH_INVALID_CHAR_ERROR
+)
+
+# libxml2 error types that are reported as XPath evaluation errors;
+# _XPathEvaluatorBase._raise_eval_error() looks for these first and falls
+# back to the syntax error types if none of them was logged
+cdef object _XPATH_EVAL_ERRORS
+_XPATH_EVAL_ERRORS = (
+    xmlerror.XML_XPATH_UNDEF_VARIABLE_ERROR,
+    xmlerror.XML_XPATH_UNDEF_PREFIX_ERROR,
+    xmlerror.XML_XPATH_UNKNOWN_FUNC_ERROR,
+    xmlerror.XML_XPATH_INVALID_OPERAND,
+    xmlerror.XML_XPATH_INVALID_TYPE,
+    xmlerror.XML_XPATH_INVALID_ARITY,
+    xmlerror.XML_XPATH_INVALID_CTXT_SIZE,
+    xmlerror.XML_XPATH_INVALID_CTXT_POSITION
+)
+
+cdef int _register_xpath_function(void* ctxt, name_utf, ns_utf):
+    # Register _xpath_function_call as the implementation of the function
+    # 'name_utf' in the given XPath context, optionally within the
+    # namespace 'ns_utf'.  Returns the status code of the libxml2 call.
+    cdef xpath.xmlXPathContext* c_ctxt = <xpath.xmlXPathContext*>ctxt
+    if ns_utf is not None:
+        return xpath.xmlXPathRegisterFuncNS(
+            c_ctxt, _xcstr(name_utf), _xcstr(ns_utf), _xpath_function_call)
+    return xpath.xmlXPathRegisterFunc(
+        c_ctxt, _xcstr(name_utf), _xpath_function_call)
+
+cdef int _unregister_xpath_function(void* ctxt, name_utf, ns_utf):
+    # Counterpart of _register_xpath_function(): registers NULL as the
+    # implementation of the function 'name_utf' (optionally within the
+    # namespace 'ns_utf').  Returns the status code of the libxml2 call.
+    cdef xpath.xmlXPathContext* c_ctxt = <xpath.xmlXPathContext*>ctxt
+    if ns_utf is not None:
+        return xpath.xmlXPathRegisterFuncNS(
+            c_ctxt, _xcstr(name_utf), _xcstr(ns_utf), NULL)
+    return xpath.xmlXPathRegisterFunc(
+        c_ctxt, _xcstr(name_utf), NULL)
+
+
+@cython.final
+@cython.internal
+cdef class _XPathContext(_BaseContext):
+    # Evaluation context of the XPath evaluators: adds XPath variables and
+    # the (un-)registration of functions and namespaces to _BaseContext.
+    cdef object _variables
+    def __init__(self, namespaces, extensions, error_log, enable_regexp, variables,
+                 build_smart_strings):
+        self._variables = variables
+        _BaseContext.__init__(self, namespaces, extensions, error_log, enable_regexp,
+                              build_smart_strings)
+
+    cdef set_context(self, xpath.xmlXPathContext* xpathCtxt):
+        # Bind this context to a libxml2 XPath context and register the
+        # namespaces and functions that are local to it.
+        self._set_xpath_context(xpathCtxt)
+        # This would be a good place to set up the XPath parser dict, but
+        # we cannot use the current thread dict as we do not know which
+        # thread will execute the XPath evaluator - so, no dict for now.
+        self.registerLocalNamespaces()
+        self.registerLocalFunctions(xpathCtxt, _register_xpath_function)
+
+    cdef register_context(self, _Document doc):
+        # Per-evaluation setup; undone by unregister_context().
+        self._register_context(doc)
+        self.registerGlobalNamespaces()
+        self.registerGlobalFunctions(self._xpathCtxt, _register_xpath_function)
+        self.registerExsltFunctions()
+        if self._variables is not None:
+            self.registerVariables(self._variables)
+
+    cdef unregister_context(self):
+        # Per-evaluation cleanup: drop global functions, global namespaces
+        # and all registered variables again.
+        self.unregisterGlobalFunctions(
+            self._xpathCtxt, _unregister_xpath_function)
+        self.unregisterGlobalNamespaces()
+        xpath.xmlXPathRegisteredVariablesCleanup(self._xpathCtxt)
+        self._cleanup_context()
+
+    cdef void registerExsltFunctions(self):
+        # with older libxslt versions, we'd only execute dummy functions
+        if xslt.LIBXSLT_VERSION >= 10125:
+            tree.xmlHashScan(
+                self._xpathCtxt.nsHash, _registerExsltFunctionsForNamespaces,
+                self._xpathCtxt)
+
+    cdef registerVariables(self, variable_dict):
+        # register each name/value pair as an XPath variable
+        for var_name, var_value in variable_dict.items():
+            self.registerVariable(var_name, var_value)
+
+    cdef registerVariable(self, name, value):
+        # register a single Python value as XPath variable
+        encoded_name = self._to_utf(name)
+        xpath.xmlXPathRegisterVariable(
+            self._xpathCtxt, _xcstr(encoded_name),
+            _wrapXPathObject(value, None, None))
+
+
+cdef void _registerExsltFunctionsForNamespaces(
+        void* _c_href, void* _ctxt, xmlChar* c_prefix):
+    # Hash scanner callback that _XPathContext.registerExsltFunctions() runs
+    # over the namespace hash table of the XPath context.  '_c_href' is the
+    # namespace URI stored for 'c_prefix', '_ctxt' is the XPath context.
+    # If the URI is one of the EXSLT date/sets/math/strings namespaces, the
+    # corresponding EXSLT functions get registered under that prefix.
+    c_href = <const_xmlChar*> _c_href
+    ctxt = <xpath.xmlXPathContext*> _ctxt
+
+    if tree.xmlStrcmp(c_href, xslt.EXSLT_DATE_NAMESPACE) == 0:
+        xslt.exsltDateXpathCtxtRegister(ctxt, c_prefix)
+    elif tree.xmlStrcmp(c_href, xslt.EXSLT_SETS_NAMESPACE) == 0:
+        xslt.exsltSetsXpathCtxtRegister(ctxt, c_prefix)
+    elif tree.xmlStrcmp(c_href, xslt.EXSLT_MATH_NAMESPACE) == 0:
+        xslt.exsltMathXpathCtxtRegister(ctxt, c_prefix)
+    elif tree.xmlStrcmp(c_href, xslt.EXSLT_STRINGS_NAMESPACE) == 0:
+        xslt.exsltStrXpathCtxtRegister(ctxt, c_prefix)
+
+
+cdef class _XPathEvaluatorBase:
+    # Common base class of the XPath evaluators.  Owns the libxml2 XPath
+    # context, the evaluation lock and the error log, and provides the
+    # result/error handling shared by the subclasses.
+    cdef xpath.xmlXPathContext* _xpathCtxt
+    cdef _XPathContext _context
+    cdef python.PyThread_type_lock _eval_lock
+    cdef _ErrorLog _error_log
+    def __cinit__(self):
+        self._xpathCtxt = NULL
+        if config.ENABLE_THREADING:
+            self._eval_lock = python.PyThread_allocate_lock()
+            if self._eval_lock is NULL:
+                raise MemoryError()
+        self._error_log = _ErrorLog()
+
+    def __init__(self, namespaces, extensions, enable_regexp,
+                 smart_strings):
+        # no variables are set at construction time, they are passed
+        # with each evaluation call
+        self._context = _XPathContext(namespaces, extensions, self._error_log,
+                                      enable_regexp, None, smart_strings)
+
+    property error_log:
+        # a copy of the evaluator's error log
+        def __get__(self):
+            assert self._error_log is not None, "XPath evaluator not initialised"
+            return self._error_log.copy()
+
+    def __dealloc__(self):
+        if self._xpathCtxt is not NULL:
+            xpath.xmlXPathFreeContext(self._xpathCtxt)
+        if config.ENABLE_THREADING:
+            if self._eval_lock is not NULL:
+                python.PyThread_free_lock(self._eval_lock)
+
+    cdef set_context(self, xpath.xmlXPathContext* xpathCtxt):
+        # take over the XPath context (it is freed in __dealloc__) and
+        # bind the Python level context to it
+        self._xpathCtxt = xpathCtxt
+        self._context.set_context(xpathCtxt)
+
+    def evaluate(self, _eval_arg, **_variables):
+        u"""evaluate(self, _eval_arg, **_variables)
+
+        Evaluate an XPath expression.
+
+        Instead of calling this method, you can also call the evaluator object
+        itself.
+
+        Variables may be provided as keyword arguments.  Note that namespaces
+        are currently not supported for variables.
+
+        :deprecated: call the object, not its method.
+        """
+        return self(_eval_arg, **_variables)
+
+    cdef bint _checkAbsolutePath(self, char* path):
+        # true if the first character after leading spaces and tabs is '/'
+        cdef char c
+        if path is NULL:
+            return 0
+        c = path[0]
+        while c == c' ' or c == c'\t':
+            path = path + 1
+            c = path[0]
+        return c == c'/'
+
+    @cython.final
+    cdef int _lock(self) except -1:
+        # Acquire the evaluation lock (waiting for it without holding the
+        # GIL).  Does nothing if threading is disabled.  Raises XPathError
+        # if the lock cannot be acquired.
+        cdef int result
+        if config.ENABLE_THREADING and self._eval_lock != NULL:
+            with nogil:
+                result = python.PyThread_acquire_lock(
+                    self._eval_lock, python.WAIT_LOCK)
+            if result == 0:
+                raise XPathError, u"XPath evaluator locking failed"
+        return 0
+
+    @cython.final
+    cdef void _unlock(self):
+        # release the lock taken by _lock()
+        if config.ENABLE_THREADING and self._eval_lock != NULL:
+            python.PyThread_release_lock(self._eval_lock)
+
+    cdef _raise_parse_error(self):
+        # Always raises XPathSyntaxError.  The message is built from the
+        # logged syntax errors if there are any, otherwise from the complete
+        # error log with a generic default message.
+        cdef _BaseErrorLog entries
+        entries = self._error_log.filter_types(_XPATH_SYNTAX_ERRORS)
+        if entries:
+            message = entries._buildExceptionMessage(None)
+            if message is not None:
+                raise XPathSyntaxError(message, self._error_log)
+        raise XPathSyntaxError(self._error_log._buildExceptionMessage(
+                u"Error in xpath expression"),
+                               self._error_log)
+
+    cdef _raise_eval_error(self):
+        # Always raises XPathEvalError.  Logged evaluation errors are
+        # preferred for the message, then logged syntax errors, then the
+        # complete error log with a generic default message.
+        cdef _BaseErrorLog entries
+        entries = self._error_log.filter_types(_XPATH_EVAL_ERRORS)
+        if not entries:
+            entries = self._error_log.filter_types(_XPATH_SYNTAX_ERRORS)
+        if entries:
+            message = entries._buildExceptionMessage(None)
+            if message is not None:
+                raise XPathEvalError(message, self._error_log)
+        raise XPathEvalError(self._error_log._buildExceptionMessage(
+                u"Error in xpath expression"),
+                             self._error_log)
+
+    cdef object _handle_result(self, xpathObj, _Document doc):
+        # Convert the result of an XPath evaluation into a Python object.
+        # The XPath object is always freed and the temporary references of
+        # the context are always released, on success as well as on errors.
+        #
+        # an exception stored by the context takes precedence over any result
+        if self._context._exc._has_raised():
+            if xpathObj is not NULL:
+                _freeXPathObject(xpathObj)
+                xpathObj = NULL
+            self._context._release_temp_refs()
+            self._context._exc._raise_if_stored()
+
+        # no result and no stored exception => libxml2 reported an error
+        if xpathObj is NULL:
+            self._context._release_temp_refs()
+            self._raise_eval_error()
+
+        try:
+            result = _unwrapXPathObject(xpathObj, doc, self._context)
+        finally:
+            _freeXPathObject(xpathObj)
+            self._context._release_temp_refs()
+
+        return result
+
+
+cdef class XPathElementEvaluator(_XPathEvaluatorBase):
+    u"""XPathElementEvaluator(self, element, namespaces=None, extensions=None, regexp=True, smart_strings=True)
+    Create an XPath evaluator for an element.
+
+    Absolute XPath expressions (starting with '/') will be evaluated against
+    the ElementTree as returned by getroottree().
+
+    Additional namespace declarations can be passed with the
+    'namespaces' keyword argument.  EXSLT regular expression support
+    can be disabled with the 'regexp' boolean keyword (defaults to
+    True).  Smart strings will be returned for string results unless
+    you pass ``smart_strings=False``.
+    """
+    cdef _Element _element
+    def __init__(self, _Element element not None, *, namespaces=None,
+                 extensions=None, regexp=True, smart_strings=True):
+        cdef xpath.xmlXPathContext* xpathCtxt
+        cdef _Document doc
+        _assertValidNode(element)
+        _assertValidDoc(element._doc)
+        self._element = element
+        doc = element._doc
+        _XPathEvaluatorBase.__init__(self, namespaces, extensions,
+                                     regexp, smart_strings)
+        xpathCtxt = xpath.xmlXPathNewContext(doc._c_doc)
+        if xpathCtxt is NULL:
+            raise MemoryError()
+        # the base class takes over the context and frees it on deallocation
+        self.set_context(xpathCtxt)
+
+    def register_namespace(self, prefix, uri):
+        u"""Register a namespace with the XPath context.
+        """
+        assert self._xpathCtxt is not NULL, "XPath context not initialised"
+        self._context.addNamespace(prefix, uri)
+
+    def register_namespaces(self, namespaces):
+        u"""Register a prefix -> uri dict.
+        """
+        assert self._xpathCtxt is not NULL, "XPath context not initialised"
+        for prefix, uri in namespaces.items():
+            self._context.addNamespace(prefix, uri)
+
+    def __call__(self, _path, **_variables):
+        u"""__call__(self, _path, **_variables)
+
+        Evaluate an XPath expression on the document.
+
+        Variables may be provided as keyword arguments.  Note that namespaces
+        are currently not supported for variables.
+
+        Absolute XPath expressions (starting with '/') will be evaluated
+        against the ElementTree as returned by getroottree().
+        """
+        cdef xpath.xmlXPathObject*  xpathObj
+        cdef _Document doc
+        assert self._xpathCtxt is not NULL, "XPath context not initialised"
+        path = _utf8(_path)
+        doc = self._element._doc
+
+        # the XPath context is shared state, so evaluations are serialised
+        self._lock()
+        self._xpathCtxt.node = self._element._c_node
+        try:
+            self._context.register_context(doc)
+            self._context.registerVariables(_variables)
+            c_path = _xcstr(path)
+            with nogil:
+                xpathObj = xpath.xmlXPathEvalExpression(
+                    c_path, self._xpathCtxt)
+            result = self._handle_result(xpathObj, doc)
+        finally:
+            # always undo the per-call registrations before unlocking
+            self._context.unregister_context()
+            self._unlock()
+
+        return result
+
+
+cdef class XPathDocumentEvaluator(XPathElementEvaluator):
+    u"""XPathDocumentEvaluator(self, etree, namespaces=None, extensions=None, regexp=True, smart_strings=True)
+    Create an XPath evaluator for an ElementTree.
+
+    Additional namespace declarations can be passed with the
+    'namespaces' keyword argument.  EXSLT regular expression support
+    can be disabled with the 'regexp' boolean keyword (defaults to
+    True).  Smart strings will be returned for string results unless
+    you pass ``smart_strings=False``.
+    """
+    def __init__(self, _ElementTree etree not None, *, namespaces=None,
+                 extensions=None, regexp=True, smart_strings=True):
+        # evaluation is set up on the context node of the ElementTree
+        XPathElementEvaluator.__init__(
+            self, etree._context_node, namespaces=namespaces, 
+            extensions=extensions, regexp=regexp,
+            smart_strings=smart_strings)
+
+    def __call__(self, _path, **_variables):
+        u"""__call__(self, _path, **_variables)
+
+        Evaluate an XPath expression on the document.
+
+        Variables may be provided as keyword arguments.  Note that namespaces
+        are currently not supported for variables.
+        """
+        cdef xpath.xmlXPathObject*  xpathObj
+        cdef xmlDoc* c_doc
+        cdef _Document doc
+        assert self._xpathCtxt is not NULL, "XPath context not initialised"
+        path = _utf8(_path)
+        doc = self._element._doc
+
+        self._lock()
+        try:
+            self._context.register_context(doc)
+            # NOTE(review): _fakeRootDoc() presumably provides a temporary
+            # document rooted at the context node - confirm against its
+            # definition.  It is destroyed again in the finally block below.
+            c_doc = _fakeRootDoc(doc._c_doc, self._element._c_node)
+            try:
+                self._context.registerVariables(_variables)
+                c_path = _xcstr(path)
+                with nogil:
+                    # evaluate against the document returned by _fakeRootDoc()
+                    self._xpathCtxt.doc  = c_doc
+                    self._xpathCtxt.node = tree.xmlDocGetRootElement(c_doc)
+                    xpathObj = xpath.xmlXPathEvalExpression(
+                        c_path, self._xpathCtxt)
+                result = self._handle_result(xpathObj, doc)
+            finally:
+                _destroyFakeDoc(doc._c_doc, c_doc)
+                self._context.unregister_context()
+        finally:
+            self._unlock()
+
+        return result
+
+
+def XPathEvaluator(etree_or_element, *, namespaces=None, extensions=None,
+                   regexp=True, smart_strings=True):
+    u"""XPathEvaluator(etree_or_element, namespaces=None, extensions=None, regexp=True, smart_strings=True)
+
+    Creates an XPath evaluator for an ElementTree or an Element.
+
+    An ElementTree argument yields an XPathDocumentEvaluator, anything else
+    is passed on to XPathElementEvaluator.  The resulting object can be
+    called with an XPath expression as argument and XPath variables provided
+    as keyword arguments.
+
+    Additional namespace declarations can be passed with the
+    'namespaces' keyword argument.  EXSLT regular expression support
+    can be disabled with the 'regexp' boolean keyword (defaults to
+    True).  Smart strings will be returned for string results unless
+    you pass ``smart_strings=False``.
+    """
+    if isinstance(etree_or_element, _ElementTree):
+        evaluator_class = XPathDocumentEvaluator
+    else:
+        evaluator_class = XPathElementEvaluator
+    return evaluator_class(
+        etree_or_element, namespaces=namespaces,
+        extensions=extensions, regexp=regexp, smart_strings=smart_strings)
+
+
+cdef class XPath(_XPathEvaluatorBase):
+    u"""XPath(self, path, namespaces=None, extensions=None, regexp=True, smart_strings=True)
+    A compiled XPath expression that can be called on Elements and ElementTrees.
+
+    Besides the XPath expression, you can pass prefix-namespace
+    mappings and extension functions to the constructor through the
+    keyword arguments ``namespaces`` and ``extensions``.  EXSLT
+    regular expression support can be disabled with the 'regexp'
+    boolean keyword (defaults to True).  Smart strings will be
+    returned for string results unless you pass
+    ``smart_strings=False``.
+
+    Raises XPathSyntaxError if the expression cannot be compiled.
+    """
+    cdef xpath.xmlXPathCompExpr* _xpath  # the compiled expression
+    cdef bytes _path                     # the UTF-8 encoded expression
+    def __cinit__(self):
+        self._xpath = NULL
+
+    def __init__(self, path, *, namespaces=None, extensions=None,
+                 regexp=True, smart_strings=True):
+        cdef xpath.xmlXPathContext* xpathCtxt
+        _XPathEvaluatorBase.__init__(self, namespaces, extensions,
+                                     regexp, smart_strings)
+        self._path = _utf8(path)
+        # the context is created without a document, the document and
+        # context node are set for each call
+        xpathCtxt = xpath.xmlXPathNewContext(NULL)
+        if xpathCtxt is NULL:
+            raise MemoryError()
+        self.set_context(xpathCtxt)
+        self._xpath = xpath.xmlXPathCtxtCompile(xpathCtxt, _xcstr(self._path))
+        if self._xpath is NULL:
+            self._raise_parse_error()
+
+    def __call__(self, _etree_or_element, **_variables):
+        u"__call__(self, _etree_or_element, **_variables)"
+        cdef xpath.xmlXPathObject*  xpathObj
+        cdef _Document document
+        cdef _Element element
+
+        assert self._xpathCtxt is not NULL, "XPath context not initialised"
+        document = _documentOrRaise(_etree_or_element)
+        element  = _rootNodeOrRaise(_etree_or_element)
+
+        # the XPath context is shared state, so evaluations are serialised
+        self._lock()
+        self._xpathCtxt.doc  = document._c_doc
+        self._xpathCtxt.node = element._c_node
+
+        try:
+            self._context.register_context(document)
+            self._context.registerVariables(_variables)
+            with nogil:
+                xpathObj = xpath.xmlXPathCompiledEval(
+                    self._xpath, self._xpathCtxt)
+            result = self._handle_result(xpathObj, document)
+        finally:
+            # always undo the per-call registrations before unlocking
+            self._context.unregister_context()
+            self._unlock()
+        return result
+
+    property path:
+        u"""The literal XPath expression.
+        """
+        def __get__(self):
+            return self._path.decode(u'UTF-8')
+
+    def __dealloc__(self):
+        if self._xpath is not NULL:
+            xpath.xmlXPathFreeCompExpr(self._xpath)
+
+    def __repr__(self):
+        # the representation is the plain expression text
+        return self.path
+
+
+# Regular expression helpers that work on byte strings:
+# _replace_strings(repl, s) substitutes all double or single quoted string
+# literals in s; _find_namespaces(s) returns all '{...}' sections found in s.
+cdef object _replace_strings
+cdef object _find_namespaces
+_replace_strings = re.compile(b'("[^"]*")|(\'[^\']*\')').sub
+_find_namespaces = re.compile(b'({[^}]+})').findall
+
+cdef class ETXPath(XPath):
+    u"""ETXPath(self, path, extensions=None, regexp=True, smart_strings=True)
+    Special XPath class that supports the ElementTree {uri} notation for namespaces.
+
+    Note that this class does not accept the ``namespace`` keyword
+    argument. All namespaces must be passed as part of the path
+    string.  Smart strings will be returned for string results unless
+    you pass ``smart_strings=False``.
+    """
+    def __init__(self, path, *, extensions=None, regexp=True,
+                 smart_strings=True):
+        path, namespaces = self._nsextract_path(path)
+        XPath.__init__(self, path, namespaces=namespaces,
+                       extensions=extensions, regexp=regexp,
+                       smart_strings=smart_strings)
+
+    cdef _nsextract_path(self, path):
+        # Replace {namespaces} by generated prefixes.
+        #
+        # Returns a tuple (rewritten path, prefix->namespace dict).  Each
+        # distinct '{uri}' is mapped to a prefix '__xppNN', numbered in order
+        # of first appearance.  Quoted string literals are left untouched,
+        # so a '{...}' inside a string literal is not rewritten.
+        cdef dict namespaces = {}
+        cdef dict prefixes = {}  # '{uri}' -> b'__xppNN:'
+        cdef list segments
+        cdef int i, pos
+        path_utf = _utf8(path)
+        # Split at string literals.  The pattern has exactly one capturing
+        # group, so the literals end up at the odd positions of the result
+        # and the text between them at the even positions.
+        segments = re.split(b'("[^"]*"|\'[^\']*\')', path_utf)
+        i = 1
+        for pos in range(0, len(segments), 2):
+            segment = segments[pos]
+            for namespace_def in _find_namespaces(segment):
+                if namespace_def not in prefixes:
+                    prefix = python.PyBytes_FromFormat("__xpp%02d", i)
+                    i += 1
+                    namespace = namespace_def[1:-1] # remove '{}'
+                    namespace = (<bytes>namespace).decode('utf8')
+                    namespaces[prefix.decode('utf8')] = namespace
+                    prefixes[namespace_def] = prefix + b':'
+                segment = segment.replace(
+                    namespace_def, prefixes[namespace_def])
+            segments[pos] = segment
+        path = b''.join(segments).decode('utf8')
+        return path, namespaces
diff --git a/lib/lxml/xslt.pxi b/lib/lxml/xslt.pxi
new file mode 100644
index 00000000..7fa2d231
--- /dev/null
+++ b/lib/lxml/xslt.pxi
@@ -0,0 +1,926 @@
+
+# XSLT
+from lxml.includes cimport xslt
+
+class XSLTError(LxmlError):
+    u"""Base class of all XSLT errors."""
+
+class XSLTParseError(XSLTError):
+    u"""Error parsing a stylesheet document."""
+
+class XSLTApplyError(XSLTError):
+    u"""Error running an XSL transformation."""
+
+class XSLTSaveError(XSLTError):
+    u"""Error serialising an XSLT result."""
+
+class XSLTExtensionError(XSLTError):
+    u"""Error registering an XSLT extension."""
+
+# version information
+# Both values are unpacked by __unpackIntVersion() from libxslt's integer
+# version numbers: LIBXSLT_COMPILED_VERSION from the xslt.LIBXSLT_VERSION
+# constant, LIBXSLT_VERSION from xslt.xsltLibxsltVersion (presumably the
+# version of the library in use at runtime -- TODO confirm).
+LIBXSLT_COMPILED_VERSION = __unpackIntVersion(xslt.LIBXSLT_VERSION)
+LIBXSLT_VERSION = __unpackIntVersion(xslt.xsltLibxsltVersion)
+
+
+################################################################################
+# Where do we store what?
+#
+# xsltStylesheet->doc->_private
+#    == _XSLTResolverContext for XSL stylesheet
+#
+# xsltTransformContext->_private
+#    == _XSLTResolverContext for transformed document
+#
+################################################################################
+
+
+################################################################################
+# XSLT document loaders
+
+@cython.final
+@cython.internal
+cdef class _XSLTResolverContext(_ResolverContext):
+    # Resolver context used by the XSLT document loader.  On top of the
+    # inherited resolver state it keeps the parser that is used for
+    # resolved documents and a pointer to a copy of the stylesheet document.
+    cdef xmlDoc* _c_style_doc
+    cdef _BaseParser _parser
+
+    cdef _XSLTResolverContext _copy(self):
+        # Return a new context initialised for the same parser.  The
+        # '_c_style_doc' pointer is shared with this context, not duplicated.
+        cdef _XSLTResolverContext context
+        context = _XSLTResolverContext()
+        _initXSLTResolverContext(context, self._parser)
+        context._c_style_doc = self._c_style_doc
+        return context
+
+cdef _initXSLTResolverContext(_XSLTResolverContext context,
+                              _BaseParser parser):
+    # Initialise 'context' with the resolvers of 'parser', remember the
+    # parser itself and reset the stylesheet document pointer to NULL.
+    _initResolverContext(context, parser.resolvers)
+    context._parser = parser
+    context._c_style_doc = NULL
+
+# Resolve 'c_uri' through the Python-level resolvers of the given context.
+#
+# Returns the resolved document, or NULL if no resolver provided one.
+# 'error[0]' is set to 1 if an exception was raised on the way (it is then
+# stored in the context) and to 0 otherwise.  No exception ever leaves this
+# function.  'parse_options' is accepted but not used here.
+cdef xmlDoc* _xslt_resolve_from_python(const_xmlChar* c_uri, void* c_context,
+                                       int parse_options, int* error) with gil:
+    # call the Python document loaders
+    cdef _XSLTResolverContext context
+    cdef _ResolverRegistry resolvers
+    cdef _InputDocument doc_ref
+    cdef xmlDoc* c_doc
+    cdef xmlDoc* c_return_doc = NULL
+
+    error[0] = 0
+    context = <_XSLTResolverContext>c_context
+
+    # shortcut if we resolve the stylesheet itself
+    c_doc = context._c_style_doc
+    try:
+        if c_doc is not NULL and c_doc.URL is not NULL:
+            if tree.xmlStrcmp(c_uri, c_doc.URL) == 0:
+                # hand out a copy of the stored stylesheet document
+                c_return_doc = _copyDoc(c_doc, 1)
+                return c_return_doc  # 'goto', see 'finally' below
+
+        # delegate to the Python resolvers
+        resolvers = context._resolvers
+        # strip the 26 character fake URL prefix that XSLT() assigns to
+        # stylesheets without a URL before passing the URI to the resolvers
+        if tree.xmlStrncmp(<unsigned char*>'string://__STRING__XSLT__/', c_uri, 26) == 0:
+            c_uri += 26
+        uri = _decodeFilename(c_uri)
+        doc_ref = resolvers.resolve(uri, None, context)
+
+        if doc_ref is not None:
+            # parse the resolver result according to the kind of input it
+            # refers to
+            if doc_ref._type == PARSER_DATA_STRING:
+                c_return_doc = _parseDoc(
+                    doc_ref._data_bytes, doc_ref._filename, context._parser)
+            elif doc_ref._type == PARSER_DATA_FILENAME:
+                c_return_doc = _parseDocFromFile(
+                    doc_ref._filename, context._parser)
+            elif doc_ref._type == PARSER_DATA_FILE:
+                c_return_doc = _parseDocFromFilelike(
+                    doc_ref._file, doc_ref._filename, context._parser)
+            elif doc_ref._type == PARSER_DATA_EMPTY:
+                c_return_doc = _newXMLDoc()
+            # make sure the resolved document carries a URL
+            if c_return_doc is not NULL and c_return_doc.URL is NULL:
+                c_return_doc.URL = tree.xmlStrdup(c_uri)
+    except:
+        # remember the exception in the context and signal the failure
+        error[0] = 1
+        context._store_raised()
+    finally:
+        return c_return_doc  # and swallow any further exceptions
+
+# Store a "Cannot resolve URI" exception in the resolver context:
+# an XSLTApplyError for XSLT_LOAD_DOCUMENT, an XSLTParseError otherwise.
+# If building that exception fails, the failure itself is stored instead.
+cdef void _xslt_store_resolver_exception(const_xmlChar* c_uri, void* context,
+                                         xslt.xsltLoadType c_type) with gil:
+    try:
+        message = u"Cannot resolve URI %s" % _decodeFilename(c_uri)
+        if c_type == xslt.XSLT_LOAD_DOCUMENT:
+            exception = XSLTApplyError(message)
+        else:
+            exception = XSLTParseError(message)
+        (<_XSLTResolverContext>context)._store_exception(exception)
+    except BaseException as e:
+        (<_XSLTResolverContext>context)._store_exception(e)
+
+# Document loader callback that gets registered with libxslt (see the
+# xsltSetLoaderFunc() call in this file).
+#
+# Looks up the resolver context that belongs to the load request, tries the
+# Python resolvers first and falls back to the default libxslt loader if
+# they did not provide a document.  Returns the loaded document or NULL.
+cdef xmlDoc* _xslt_doc_loader(const_xmlChar* c_uri, tree.xmlDict* c_dict,
+                              int parse_options, void* c_ctxt,
+                              xslt.xsltLoadType c_type) nogil:
+    # nogil => no Python objects here, may be called without thread context !
+    cdef xmlDoc* c_doc
+    cdef xmlDoc* result
+    cdef void* c_pcontext
+    cdef int error = 0
+    # find resolver contexts of stylesheet and transformed doc
+    if c_type == xslt.XSLT_LOAD_DOCUMENT:
+        # transformation time
+        c_pcontext = (<xslt.xsltTransformContext*>c_ctxt)._private
+    elif c_type == xslt.XSLT_LOAD_STYLESHEET:
+        # include/import resolution while parsing
+        c_pcontext = (<xslt.xsltStylesheet*>c_ctxt).doc._private
+    else:
+        c_pcontext = NULL
+
+    if c_pcontext is NULL:
+        # can't call Python without context, fall back to default loader
+        return XSLT_DOC_DEFAULT_LOADER(
+            c_uri, c_dict, parse_options, c_ctxt, c_type)
+
+    c_doc = _xslt_resolve_from_python(c_uri, c_pcontext, parse_options, &error)
+    if c_doc is NULL and not error:
+        # the resolvers returned nothing and did not fail => try the default
+        # loader and record an exception if that cannot load the URI either
+        c_doc = XSLT_DOC_DEFAULT_LOADER(
+            c_uri, c_dict, parse_options, c_ctxt, c_type)
+        if c_doc is NULL:
+            _xslt_store_resolver_exception(c_uri, c_pcontext, c_type)
+
+    if c_doc is not NULL and c_type == xslt.XSLT_LOAD_STYLESHEET:
+        # pass the resolver context on to the loaded stylesheet document so
+        # that its own includes/imports find it in 'doc._private' above
+        c_doc._private = c_pcontext
+    return c_doc
+
+# keep a reference to libxslt's default loader as fallback, then install our
+# own loader function (this runs once, when the module is initialised)
+cdef xslt.xsltDocLoaderFunc XSLT_DOC_DEFAULT_LOADER = xslt.xsltDocDefaultLoader
+xslt.xsltSetLoaderFunc(<xslt.xsltDocLoaderFunc>_xslt_doc_loader)
+
+################################################################################
+# XSLT file/network access control
+
+cdef class XSLTAccessControl:
+    u"""XSLTAccessControl(self, read_file=True, write_file=True, create_dir=True, read_network=True, write_network=True)
+
+    Access control for XSLT: reading/writing files, directories and
+    network I/O.  Access to a type of resource is granted or denied by
+    passing any of the following boolean keyword arguments.  All of
+    them default to True to allow access.
+
+    - read_file
+    - write_file
+    - create_dir
+    - read_network
+    - write_network
+
+    For convenience, there is also a class member `DENY_ALL` that
+    provides an XSLTAccessControl instance that is readily configured
+    to deny everything, and a `DENY_WRITE` member that denies all
+    write access but allows read access.
+
+    See `XSLT`.
+    """
+    # the libxslt security preferences, owned by this object
+    cdef xslt.xsltSecurityPrefs* _prefs
+    def __cinit__(self):
+        # allocate the preferences up-front so that '_prefs' is non-NULL
+        # whenever __cinit__ succeeded
+        self._prefs = xslt.xsltNewSecurityPrefs()
+        if self._prefs is NULL:
+            raise MemoryError()
+
+    def __init__(self, *, bint read_file=True, bint write_file=True, bint create_dir=True,
+                 bint read_network=True, bint write_network=True):
+        # map each keyword argument to its libxslt security option
+        self._setAccess(xslt.XSLT_SECPREF_READ_FILE, read_file)
+        self._setAccess(xslt.XSLT_SECPREF_WRITE_FILE, write_file)
+        self._setAccess(xslt.XSLT_SECPREF_CREATE_DIRECTORY, create_dir)
+        self._setAccess(xslt.XSLT_SECPREF_READ_NETWORK, read_network)
+        self._setAccess(xslt.XSLT_SECPREF_WRITE_NETWORK, write_network)
+
+    # preconfigured instance that denies all five kinds of access
+    DENY_ALL = XSLTAccessControl(
+        read_file=False, write_file=False, create_dir=False,
+        read_network=False, write_network=False)
+
+    # preconfigured instance that allows reading but denies writing files,
+    # creating directories and writing to the network
+    DENY_WRITE = XSLTAccessControl(
+        read_file=True, write_file=False, create_dir=False,
+        read_network=True, write_network=False)
+
+    def __dealloc__(self):
+        if self._prefs is not NULL:
+            xslt.xsltFreeSecurityPrefs(self._prefs)
+
+    @cython.final
+    cdef _setAccess(self, xslt.xsltSecurityOption option, bint allow):
+        # Install libxslt's 'allow' or 'forbid' check function for 'option'.
+        cdef xslt.xsltSecurityCheck function
+        if allow:
+            function = xslt.xsltSecurityAllow
+        else:
+            function = xslt.xsltSecurityForbid
+        xslt.xsltSetSecurityPrefs(self._prefs, option, function)
+
+    @cython.final
+    cdef void _register_in_context(self, xslt.xsltTransformContext* ctxt):
+        # Apply these security preferences to a transformation context.
+        xslt.xsltSetCtxtSecurityPrefs(self._prefs, ctxt)
+
+    property options:
+        u"The access control configuration as a map of options."
+        def __get__(self):
+            return {
+                u'read_file': self._optval(xslt.XSLT_SECPREF_READ_FILE),
+                u'write_file': self._optval(xslt.XSLT_SECPREF_WRITE_FILE),
+                u'create_dir': self._optval(xslt.XSLT_SECPREF_CREATE_DIRECTORY),
+                u'read_network': self._optval(xslt.XSLT_SECPREF_READ_NETWORK),
+                u'write_network': self._optval(xslt.XSLT_SECPREF_WRITE_NETWORK),
+                }
+
+    @cython.final
+    cdef _optval(self, xslt.xsltSecurityOption option):
+        # Return True/False if the check function configured for 'option' is
+        # libxslt's allow/forbid function, and None for anything else.
+        cdef xslt.xsltSecurityCheck function
+        function = xslt.xsltGetSecurityPrefs(self._prefs, option)
+        if function is <xslt.xsltSecurityCheck>xslt.xsltSecurityAllow:
+            return True
+        elif function is <xslt.xsltSecurityCheck>xslt.xsltSecurityForbid:
+            return False
+        else:
+            return None
+
+    def __repr__(self):
+        # renders as "ClassName(option=value, ...)" with the options sorted
+        # by name; only the last part of the qualified type name is used
+        items = sorted(self.options.items())
+        return u"%s(%s)" % (
+            python._fqtypename(self).decode('UTF-8').split(u'.')[-1],
+            u', '.join([u"%s=%r" % item for item in items]))
+
+################################################################################
+# XSLT
+
+# Register the extension function 'name_utf' in namespace 'ns_utf' with the
+# XSLT transform context 'ctxt', dispatching calls to _xpath_function_call.
+# Functions without a namespace are skipped (returns 0); otherwise the
+# result of xsltRegisterExtFunction() is returned.
+cdef int _register_xslt_function(void* ctxt, name_utf, ns_utf):
+    if ns_utf is None:
+        return 0
+    # libxml2 internalises the strings if ctxt has a dict
+    return xslt.xsltRegisterExtFunction(
+        <xslt.xsltTransformContext*>ctxt, _xcstr(name_utf), _xcstr(ns_utf),
+        <xslt.xmlXPathFunction>_xpath_function_call)
+
+# shared placeholder for "no extension elements"; _XSLTContext compares
+# against it by identity and replaces it with a fresh dict before adding
+# entries, so it stays empty
+cdef dict EMPTY_DICT = {}
+
+@cython.final
+@cython.internal
+cdef class _XSLTContext(_BaseContext):
+    # Evaluation context of an XSLT run.  Extends the base context with the
+    # libxslt transform context and the registered XSLT extension elements.
+    cdef xslt.xsltTransformContext* _xsltCtxt
+    cdef _ReadOnlyElementProxy _extension_element_proxy
+    # maps (namespace, name) byte string pairs to XSLTExtension instances
+    cdef dict _extension_elements
+    def __cinit__(self):
+        self._xsltCtxt = NULL
+        self._extension_elements = EMPTY_DICT
+
+    def __init__(self, namespaces, extensions, error_log, enable_regexp,
+                 build_smart_strings):
+        # Split the extensions: XSLTExtension instances (extension elements)
+        # are stored in this context, everything else is passed on to the
+        # base class.  Raises XSLTExtensionError for a None namespace.
+        if extensions is not None and extensions:
+            for ns_name_tuple, extension in extensions.items():
+                if ns_name_tuple[0] is None:
+                    raise XSLTExtensionError, \
+                        u"extensions must not have empty namespaces"
+                if isinstance(extension, XSLTExtension):
+                    if self._extension_elements is EMPTY_DICT:
+                        # first extension element found: create our own dict
+                        # and work on a copy of the user provided mapping so
+                        # that the deletions below do not modify the original
+                        self._extension_elements = {}
+                        extensions = extensions.copy()
+                    ns_utf   = _utf8(ns_name_tuple[0])
+                    name_utf = _utf8(ns_name_tuple[1])
+                    self._extension_elements[(ns_utf, name_utf)] = extension
+                    del extensions[ns_name_tuple]
+        _BaseContext.__init__(self, namespaces, extensions, error_log, enable_regexp,
+                              build_smart_strings)
+
+    cdef _BaseContext _copy(self):
+        # Copy the base context state; the extension element dict is shared
+        # with the original, not duplicated.
+        cdef _XSLTContext context
+        context = <_XSLTContext>_BaseContext._copy(self)
+        context._extension_elements = self._extension_elements
+        return context
+
+    cdef register_context(self, xslt.xsltTransformContext* xsltCtxt,
+                               _Document doc):
+        # Bind this context to a libxslt transform context and register the
+        # extension functions and extension elements with it.
+        self._xsltCtxt = xsltCtxt
+        self._set_xpath_context(xsltCtxt.xpathCtxt)
+        self._register_context(doc)
+        self.registerLocalFunctions(xsltCtxt, _register_xslt_function)
+        self.registerGlobalFunctions(xsltCtxt, _register_xslt_function)
+        _registerXSLTExtensions(xsltCtxt, self._extension_elements)
+
+    cdef free_context(self):
+        # Clean up after a run.  This also frees the libxslt transform
+        # context that was passed to register_context().
+        self._cleanup_context()
+        self._release_context()
+        if self._xsltCtxt is not NULL:
+            xslt.xsltFreeTransformContext(self._xsltCtxt)
+            self._xsltCtxt = NULL
+        self._release_temp_refs()
+
+
+@cython.final
+@cython.internal
+@cython.freelist(8)
+cdef class _XSLTQuotedStringParam:
+    u"""A wrapper class for literal XSLT string parameters that require
+    quote escaping.
+    """
+    # the parameter value as converted by _utf8()
+    cdef bytes strval
+    def __cinit__(self, strval):
+        self.strval = _utf8(strval)
+
+
+@cython.no_gc_clear
+cdef class XSLT:
+    u"""XSLT(self, xslt_input, extensions=None, regexp=True, access_control=None)
+
+    Turn an XSL document into an XSLT object.
+
+    Calling this object on a tree or Element will execute the XSLT::
+
+        transform = etree.XSLT(xsl_tree)
+        result = transform(xml_tree)
+
+    Keyword arguments of the constructor:
+
+    - extensions: a dict mapping ``(namespace, name)`` pairs to
+      extension functions or extension elements
+    - regexp: enable exslt regular expression support in XPath
+      (default: True)
+    - access_control: access restrictions for network or file
+      system (see `XSLTAccessControl`)
+
+    Keyword arguments of the XSLT call:
+
+    - profile_run: enable XSLT profiling (default: False)
+
+    Other keyword arguments of the call are passed to the stylesheet
+    as parameters.
+    """
+    # template context that gets copied for each transformation run
+    cdef _XSLTContext _context
+    # the compiled stylesheet, owned by this object (freed in __dealloc__)
+    cdef xslt.xsltStylesheet* _c_style
+    # template resolver context; its '_c_style_doc' holds a private copy of
+    # the stylesheet document that is also freed in __dealloc__
+    cdef _XSLTResolverContext _xslt_resolver_context
+    cdef XSLTAccessControl _access_control
+    cdef _ErrorLog _error_log
+
+    def __cinit__(self):
+        self._c_style = NULL
+
+    def __init__(self, xslt_input, *, extensions=None, regexp=True,
+                 access_control=None):
+        cdef xslt.xsltStylesheet* c_style
+        cdef xmlDoc* c_doc
+        cdef _Document doc
+        cdef _Element root_node
+
+        doc = _documentOrRaise(xslt_input)
+        root_node = _rootNodeOrRaise(xslt_input)
+
+        # set access control or raise TypeError
+        self._access_control = access_control
+
+        # make a copy of the document as stylesheet parsing modifies it
+        c_doc = _copyDocRoot(doc._c_doc, root_node._c_node)
+
+        # make sure we always have a stylesheet URL
+        if c_doc.URL is NULL:
+            doc_url_utf = python.PyUnicode_AsASCIIString(
+                u"string://__STRING__XSLT__/%d.xslt" % id(self))
+            c_doc.URL = tree.xmlStrdup(_xcstr(doc_url_utf))
+
+        self._error_log = _ErrorLog()
+        self._xslt_resolver_context = _XSLTResolverContext()
+        _initXSLTResolverContext(self._xslt_resolver_context, doc._parser)
+        # keep a copy in case we need to access the stylesheet via 'document()'
+        self._xslt_resolver_context._c_style_doc = _copyDoc(c_doc, 1)
+        # make the resolver context available to the document loader
+        c_doc._private = <python.PyObject*>self._xslt_resolver_context
+
+        with self._error_log:
+            c_style = xslt.xsltParseStylesheetDoc(c_doc)
+
+        if c_style is NULL or c_style.errors:
+            tree.xmlFreeDoc(c_doc)
+            if c_style is not NULL:
+                # freeing the stylesheet also frees its document, which is
+                # 'c_doc' and was already freed above
+                # => detach it first to avoid a double free
+                c_style.doc = NULL
+                xslt.xsltFreeStylesheet(c_style)
+            # errors raised by the Python resolvers take precedence
+            self._xslt_resolver_context._raise_if_stored()
+            # last error seems to be the most accurate here
+            if self._error_log.last_error is not None and \
+                    self._error_log.last_error.message:
+                raise XSLTParseError(self._error_log.last_error.message,
+                                     self._error_log)
+            else:
+                raise XSLTParseError(
+                    self._error_log._buildExceptionMessage(
+                        u"Cannot parse stylesheet"),
+                    self._error_log)
+
+        c_doc._private = NULL # no longer used!
+        self._c_style = c_style
+        self._context = _XSLTContext(None, extensions, self._error_log, regexp, True)
+
+    def __dealloc__(self):
+        if self._xslt_resolver_context is not None and \
+               self._xslt_resolver_context._c_style_doc is not NULL:
+            tree.xmlFreeDoc(self._xslt_resolver_context._c_style_doc)
+        # this cleans up the doc copy as well
+        if self._c_style is not NULL:
+            xslt.xsltFreeStylesheet(self._c_style)
+
+    property error_log:
+        u"The log of errors and warnings of an XSLT execution."
+        def __get__(self):
+            return self._error_log.copy()
+
+    @staticmethod
+    def strparam(strval):
+        u"""strparam(strval)
+
+        Mark an XSLT string parameter that requires quote escaping
+        before passing it into the transformation.  Use it like this::
+
+            result = transform(doc, some_strval = XSLT.strparam(
+                '''it's \"Monty Python's\" ...'''))
+
+        Escaped string parameters can be reused without restriction.
+        """
+        return _XSLTQuotedStringParam(strval)
+
+    @staticmethod
+    def set_global_max_depth(int max_depth):
+        u"""set_global_max_depth(max_depth)
+
+        The maximum traversal depth that the stylesheet engine will allow.
+        This does not only count the template recursion depth but also takes
+        the number of variables/parameters into account.  The required setting
+        for a run depends on both the stylesheet and the input data.
+
+        Example::
+
+            XSLT.set_global_max_depth(5000)
+
+        Note that this is currently a global, module-wide setting because
+        libxslt does not support it at a per-stylesheet level.
+        """
+        if max_depth < 0:
+            raise ValueError("cannot set a maximum stylesheet traversal depth < 0")
+        xslt.xsltMaxDepth = max_depth
+
+    def apply(self, _input, *, profile_run=False, **kw):
+        u"""apply(self, _input,  profile_run=False, **kw)
+
+        :deprecated: call the object, not this method."""
+        return self(_input, profile_run=profile_run, **kw)
+
+    def tostring(self, _ElementTree result_tree):
+        u"""tostring(self, result_tree)
+
+        Save result doc to string based on stylesheet output method.
+
+        :deprecated: use str(result_tree) instead.
+        """
+        return str(result_tree)
+
+    def __deepcopy__(self, memo):
+        # shallow and deep copies are the same: both build a new stylesheet
+        return self.__copy__()
+
+    def __copy__(self):
+        return _copyXSLT(self)
+
+    def __call__(self, _input, *, profile_run=False, **kw):
+        u"""__call__(self, _input, profile_run=False, **kw)
+
+        Execute the XSL transformation on a tree or Element.
+
+        Pass the ``profile_run`` option to get profile information
+        about the XSLT.  The result of the XSLT will have a property
+        xslt_profile that holds an XML tree with profiling data.
+
+        Raises `XSLTApplyError` if the transformation produced no result.
+        Exceptions stored by document resolvers or extensions during the
+        run are re-raised instead.
+        """
+        cdef _XSLTContext context = None
+        cdef _XSLTResolverContext resolver_context
+        cdef _Document input_doc
+        cdef _Element root_node
+        cdef _Document result_doc
+        cdef _Document profile_doc = None
+        cdef xmlDoc* c_profile_doc
+        cdef xslt.xsltTransformContext* transform_ctxt
+        cdef xmlDoc* c_result = NULL
+        cdef xmlDoc* c_doc
+        cdef tree.xmlDict* c_dict
+        cdef const_char** params = NULL
+
+        assert self._c_style is not NULL, "XSLT stylesheet not initialised"
+        input_doc = _documentOrRaise(_input)
+        root_node = _rootNodeOrRaise(_input)
+
+        # from here on, every exit path must call _destroyFakeDoc()
+        c_doc = _fakeRootDoc(input_doc._c_doc, root_node._c_node)
+
+        transform_ctxt = xslt.xsltNewTransformContext(self._c_style, c_doc)
+        if transform_ctxt is NULL:
+            _destroyFakeDoc(input_doc._c_doc, c_doc)
+            raise MemoryError()
+
+        # using the stylesheet dict is safer than using a possibly
+        # unrelated dict from the current thread.  Almost all
+        # non-input tag/attr names will come from the stylesheet
+        # anyway.
+        if transform_ctxt.dict is not NULL:
+            xmlparser.xmlDictFree(transform_ctxt.dict)
+        if kw:
+            # parameter values are stored in the dict
+            # => avoid unnecessarily cluttering the global dict
+            transform_ctxt.dict = xmlparser.xmlDictCreateSub(self._c_style.doc.dict)
+            if transform_ctxt.dict is NULL:
+                xslt.xsltFreeTransformContext(transform_ctxt)
+                # clean up the fake document as on the failure path above
+                _destroyFakeDoc(input_doc._c_doc, c_doc)
+                raise MemoryError()
+        else:
+            transform_ctxt.dict = self._c_style.doc.dict
+            xmlparser.xmlDictReference(transform_ctxt.dict)
+
+        xslt.xsltSetCtxtParseOptions(
+            transform_ctxt, input_doc._parser._parse_options)
+
+        if profile_run:
+            transform_ctxt.profile = 1
+
+        try:
+            # each run works on its own copies of the template contexts
+            context = self._context._copy()
+            context.register_context(transform_ctxt, input_doc)
+
+            resolver_context = self._xslt_resolver_context._copy()
+            transform_ctxt._private = <python.PyObject*>resolver_context
+
+            _convert_xslt_parameters(transform_ctxt, kw, &params)
+            c_result = self._run_transform(
+                c_doc, params, context, transform_ctxt)
+            if params is not NULL:
+                # deallocate space for parameters
+                python.PyMem_Free(params)
+
+            # discard the result of a run that did not end in the OK state
+            if transform_ctxt.state != xslt.XSLT_STATE_OK:
+                if c_result is not NULL:
+                    tree.xmlFreeDoc(c_result)
+                    c_result = NULL
+
+            if transform_ctxt.profile:
+                c_profile_doc = xslt.xsltGetProfileInformation(transform_ctxt)
+                if c_profile_doc is not NULL:
+                    profile_doc = _documentFactory(
+                        c_profile_doc, input_doc._parser)
+        finally:
+            # free_context() also frees the transform context
+            if context is not None:
+                context.free_context()
+            _destroyFakeDoc(input_doc._c_doc, c_doc)
+
+        try:
+            # exceptions from document resolvers come first, then those of
+            # the evaluation context, then generic transformation errors
+            if resolver_context is not None and resolver_context._has_raised():
+                if c_result is not NULL:
+                    tree.xmlFreeDoc(c_result)
+                    c_result = NULL
+                resolver_context._raise_if_stored()
+
+            if context._exc._has_raised():
+                if c_result is not NULL:
+                    tree.xmlFreeDoc(c_result)
+                    c_result = NULL
+                context._exc._raise_if_stored()
+
+            if c_result is NULL:
+                # last error seems to be the most accurate here
+                error = self._error_log.last_error
+                if error is not None and error.message:
+                    if error.line > 0:
+                        message = u"%s, line %d" % (error.message, error.line)
+                    else:
+                        message = error.message
+                elif error is not None and error.line > 0:
+                    message = u"Error applying stylesheet, line %d" % error.line
+                else:
+                    message = u"Error applying stylesheet"
+                raise XSLTApplyError(message, self._error_log)
+        finally:
+            if resolver_context is not None:
+                resolver_context.clear()
+
+        result_doc = _documentFactory(c_result, input_doc._parser)
+
+        # The result document gets the dict of the current thread assigned.
+        # Names in the result may still come from its previous dict, from
+        # the stylesheet dict or from the input document dict, so fix them
+        # up for each of those dicts that differs from the new one.  The
+        # extra reference keeps the old dict alive until that is done.
+        c_dict = c_result.dict
+        xmlparser.xmlDictReference(c_dict)
+        __GLOBAL_PARSER_CONTEXT.initThreadDictRef(&c_result.dict)
+        if c_dict is not c_result.dict or \
+                self._c_style.doc.dict is not c_result.dict or \
+                input_doc._c_doc.dict is not c_result.dict:
+            with nogil:
+                if c_dict is not c_result.dict:
+                    fixThreadDictNames(<xmlNode*>c_result,
+                                       c_dict, c_result.dict)
+                if self._c_style.doc.dict is not c_result.dict:
+                    fixThreadDictNames(<xmlNode*>c_result,
+                                       self._c_style.doc.dict, c_result.dict)
+                if input_doc._c_doc.dict is not c_result.dict:
+                    fixThreadDictNames(<xmlNode*>c_result,
+                                       input_doc._c_doc.dict, c_result.dict)
+        xmlparser.xmlDictFree(c_dict)
+
+        return _xsltResultTreeFactory(result_doc, self, profile_doc)
+
+    cdef xmlDoc* _run_transform(self, xmlDoc* c_input_doc,
+                                const_char** params, _XSLTContext context,
+                                xslt.xsltTransformContext* transform_ctxt):
+        # Run the stylesheet on 'c_input_doc' with the GIL released and
+        # return the result document (NULL on failure).  Errors are reported
+        # to this object's error log, and the access control settings, if
+        # any, are applied to the transform context before the run.
+        cdef xmlDoc* c_result
+        xslt.xsltSetTransformErrorFunc(transform_ctxt, <void*>self._error_log,
+                                       <xmlerror.xmlGenericErrorFunc>_receiveXSLTError)
+        if self._access_control is not None:
+            self._access_control._register_in_context(transform_ctxt)
+        with nogil:
+            c_result = xslt.xsltApplyStylesheetUser(
+                self._c_style, c_input_doc, params, NULL, NULL, transform_ctxt)
+        return c_result
+
+# Convert the keyword arguments of an XSLT call into the NULL terminated
+# array of alternating name/value C strings that libxslt expects.
+#
+# Values wrapped by XSLT.strparam() are registered directly with the
+# transform context (with quote escaping) and do not appear in the array.
+# XPath objects contribute their path expression, all other values are
+# converted with _utf8().  The strings are stored in the dict of the
+# transform context.
+#
+# On return, 'params_ptr[0]' is NULL if there are no parameters, otherwise
+# it points to the array, which the caller must release with PyMem_Free().
+# Raises MemoryError if the array cannot be allocated.
+cdef _convert_xslt_parameters(xslt.xsltTransformContext* transform_ctxt,
+                              dict parameters, const_char*** params_ptr):
+    cdef Py_ssize_t i, parameter_count
+    cdef const_char** params
+    cdef tree.xmlDict* c_dict = transform_ctxt.dict
+    params_ptr[0] = NULL
+    parameter_count = len(parameters)
+    if parameter_count == 0:
+        return
+    # allocate space for parameters
+    # * 2 as we want an entry for both key and value,
+    # and + 1 as array is NULL terminated
+    params = <const_char**>python.PyMem_Malloc(
+        sizeof(const_char*) * (parameter_count * 2 + 1))
+    if params is NULL:
+        # never write through a failed allocation
+        raise MemoryError()
+    try:
+        i = 0
+        for key, value in parameters.iteritems():
+            k = _utf8(key)
+            if isinstance(value, _XSLTQuotedStringParam):
+                v = (<_XSLTQuotedStringParam>value).strval
+                xslt.xsltQuoteOneUserParam(
+                    transform_ctxt, _xcstr(k), _xcstr(v))
+            else:
+                if isinstance(value, XPath):
+                    v = (<XPath>value)._path
+                else:
+                    v = _utf8(value)
+                params[i] = <const_char*>tree.xmlDictLookup(c_dict, _xcstr(k), len(k))
+                i += 1
+                params[i] = <const_char*>tree.xmlDictLookup(c_dict, _xcstr(v), len(v))
+                i += 1
+    except:
+        # don't leak the array if a conversion fails
+        python.PyMem_Free(params)
+        raise
+    params[i] = NULL
+    params_ptr[0] = params
+
+# Create an independent copy of an XSLT object.
+#
+# The copy shares the access control object, gets a fresh error log and its
+# own copies of the evaluation context, the resolver context (including the
+# stored stylesheet document) and the stylesheet itself, which is re-parsed
+# from a copy of the original stylesheet document.
+# Raises MemoryError if the stylesheet copy cannot be parsed.
+cdef XSLT _copyXSLT(XSLT stylesheet):
+    cdef XSLT new_xslt
+    cdef xmlDoc* c_doc
+    assert stylesheet._c_style is not NULL, "XSLT stylesheet not initialised"
+    # bypass XSLT.__init__(), all attributes are set up by hand below
+    new_xslt = XSLT.__new__(XSLT)
+    new_xslt._access_control = stylesheet._access_control
+    new_xslt._error_log = _ErrorLog()
+    new_xslt._context = stylesheet._context._copy()
+
+    # _copy() shares the '_c_style_doc' pointer, so replace it with a real
+    # copy of the document that the new object owns itself
+    new_xslt._xslt_resolver_context = stylesheet._xslt_resolver_context._copy()
+    new_xslt._xslt_resolver_context._c_style_doc = _copyDoc(
+        stylesheet._xslt_resolver_context._c_style_doc, 1)
+
+    c_doc = _copyDoc(stylesheet._c_style.doc, 1)
+    new_xslt._c_style = xslt.xsltParseStylesheetDoc(c_doc)
+    if new_xslt._c_style is NULL:
+        tree.xmlFreeDoc(c_doc)
+        raise MemoryError()
+
+    return new_xslt
+
+@cython.final
+cdef class _XSLTResultTree(_ElementTree):
+    # ElementTree holding the result of an XSLT run.  Serialisation goes
+    # through the stylesheet that created it, and the serialised result is
+    # also available through the buffer protocol.
+    cdef XSLT _xslt
+    cdef _Document _profile
+    # serialised result that is shared between read-only buffer exports,
+    # together with its length and the number of exports currently using it
+    cdef xmlChar* _buffer
+    cdef Py_ssize_t _buffer_len
+    cdef Py_ssize_t _buffer_refcnt
+    def __cinit__(self):
+        self._buffer = NULL
+        self._buffer_len = 0
+        self._buffer_refcnt = 0
+
+    cdef _saveToStringAndSize(self, xmlChar** s, int* l):
+        # Serialise the result document using the stylesheet and store the
+        # string and its length in 's[0]' and 'l[0]'.  The document of the
+        # context node is used if there is one, the tree's own document
+        # otherwise; without any document, 's[0]' is set to NULL.
+        # Raises MemoryError if the serialisation fails.
+        cdef _Document doc
+        cdef int r
+        if self._context_node is not None:
+            doc = self._context_node._doc
+        else:
+            doc = None
+        if doc is None:
+            doc = self._doc
+            if doc is None:
+                s[0] = NULL
+                return
+        with nogil:
+            r = xslt.xsltSaveResultToString(s, l, doc._c_doc,
+                                            self._xslt._c_style)
+        if r == -1:
+            raise MemoryError()
+
+    def __str__(self):
+        # returns the unicode string when python.IS_PYTHON3 is set and the
+        # serialised byte string otherwise
+        cdef xmlChar* s = NULL
+        cdef int l = 0
+        if python.IS_PYTHON3:
+            return self.__unicode__()
+        self._saveToStringAndSize(&s, &l)
+        if s is NULL:
+            return ''
+        # we must not use 'funicode' here as this is not always UTF-8
+        try:
+            result = <bytes>s[:l]
+        finally:
+            tree.xmlFree(s)
+        return result
+
+    def __unicode__(self):
+        # decodes the serialised result using the stylesheet's encoding
+        # (UTF-8 if it has none) and passes it through
+        # _stripEncodingDeclaration()
+        cdef xmlChar* encoding
+        cdef xmlChar* s = NULL
+        cdef int l = 0
+        self._saveToStringAndSize(&s, &l)
+        if s is NULL:
+            return u''
+        encoding = self._xslt._c_style.encoding
+        try:
+            if encoding is NULL:
+                result = s[:l].decode('UTF-8')
+            else:
+                result = s[:l].decode(encoding)
+        finally:
+            tree.xmlFree(s)
+        return _stripEncodingDeclaration(result)
+
+    def __getbuffer__(self, Py_buffer* buffer, int flags):
+        # Export the serialised result as a byte buffer.  Read-only exports
+        # share one cached serialisation that is reference counted; a
+        # writable export always gets a freshly serialised buffer of its own.
+        cdef int l = 0
+        if buffer is NULL:
+            return
+        if self._buffer is NULL or flags & python.PyBUF_WRITABLE:
+            self._saveToStringAndSize(<xmlChar**>&buffer.buf, &l)
+            buffer.len = l
+            if self._buffer is NULL and not flags & python.PyBUF_WRITABLE:
+                # first read-only export: keep the buffer for sharing
+                self._buffer = <xmlChar*>buffer.buf
+                self._buffer_len = l
+                self._buffer_refcnt = 1
+        else:
+            buffer.buf = self._buffer
+            buffer.len = self._buffer_len
+            self._buffer_refcnt += 1
+        if flags & python.PyBUF_WRITABLE:
+            buffer.readonly = 0
+        else:
+            buffer.readonly = 1
+        if flags & python.PyBUF_FORMAT:
+            buffer.format = "B"
+        else:
+            buffer.format = NULL
+        buffer.ndim = 0
+        buffer.shape = NULL
+        buffer.strides = NULL
+        buffer.suboffsets = NULL
+        buffer.itemsize = 1
+        buffer.internal = NULL
+        if buffer.obj is not self: # set by Cython?
+            buffer.obj = self
+
+    def __releasebuffer__(self, Py_buffer* buffer):
+        # Release an export created by __getbuffer__().  The shared buffer is
+        # freed when its last user releases it, any other buffer right away.
+        if buffer is NULL:
+            return
+        if <xmlChar*>buffer.buf is self._buffer:
+            self._buffer_refcnt -= 1
+            if self._buffer_refcnt == 0:
+                tree.xmlFree(<char*>self._buffer)
+                self._buffer = NULL
+        else:
+            tree.xmlFree(<char*>buffer.buf)
+        buffer.buf = NULL
+
+    property xslt_profile:
+        u"""Return an ElementTree with profiling data for the stylesheet run.
+        """
+        def __get__(self):
+            # None if there is no profile document or it has no root element
+            cdef object root
+            if self._profile is None:
+                return None
+            root = self._profile.getroot()
+            if root is None:
+                return None
+            return ElementTree(root)
+
+        def __del__(self):
+            # deleting the property drops the reference to the profile data
+            self._profile = None
+
+# Create the _XSLTResultTree for a result document and attach the
+# stylesheet that produced it and the profile document (may be None).
+cdef _xsltResultTreeFactory(_Document doc, XSLT xslt, _Document profile):
+    cdef _XSLTResultTree result
+    result = <_XSLTResultTree>_newElementTree(doc, None, _XSLTResultTree)
+    result._xslt = xslt
+    result._profile = profile
+    return result
+
+# The following registrations are executed once, at module initialisation.
+
+# functions like "output" and "write" are a potential security risk, but we
+# rely on the user to configure XSLTAccessControl as needed
+xslt.xsltRegisterAllExtras()
+
+# enable EXSLT support for XSLT
+xslt.exsltRegisterAll()
+
+
+################################################################################
+# XSLT PI support
+
+# Matches the 'href' pseudo-attribute in the text of a processing
+# instruction.  The value is captured in group 1 (single quoted) or group 2
+# (double quoted).  The pattern requires leading whitespace, which is why
+# the callers below prepend a space to the PI text before matching.
+cdef object _RE_PI_HREF = re.compile(ur'\s+href\s*=\s*(?:\'([^\']*)\'|"([^"]*)")')
+cdef object _FIND_PI_HREF = _RE_PI_HREF.findall
+cdef object _REPLACE_PI_HREF = _RE_PI_HREF.sub
+# lazily created by _findStylesheetByID() on first use
+cdef XPath __findStylesheetByID = None
+
+# Return the result of searching 'doc' for xsl:stylesheet elements whose
+# xml:id attribute equals 'id'.  The XPath object is compiled on the first
+# call and reused afterwards.
+cdef _findStylesheetByID(_Document doc, id):
+    global __findStylesheetByID
+    if __findStylesheetByID is None:
+        __findStylesheetByID = XPath(
+            u"//xsl:stylesheet[@xml:id = $id]",
+            namespaces={u"xsl" : u"http://www.w3.org/1999/XSL/Transform"})
+    return __findStylesheetByID(doc, id=id)
+
+cdef class _XSLTProcessingInstruction(PIBase):
+    def parseXSL(self, parser=None):
+        u"""parseXSL(self, parser=None)
+
+        Try to parse the stylesheet referenced by this PI and return
+        an ElementTree for it.  If the stylesheet is embedded in the
+        same document (referenced via xml:id), find and return an
+        ElementTree for the stylesheet Element.
+
+        The optional ``parser`` keyword argument can be passed to specify the
+        parser used to read from external stylesheet URLs.
+
+        Raises ValueError if the PI has no content, if it does not have
+        exactly one ``href`` pseudo-attribute, or if an embedded stylesheet
+        reference cannot be resolved to exactly one element.
+        """
+        cdef _Document result_doc
+        cdef _Element  result_node
+        cdef bytes href_utf
+        cdef const_xmlChar* c_href
+        cdef const_xmlChar* c_base
+        cdef xmlAttr* c_attr
+        _assertValidNode(self)
+        if self._c_node.content is NULL:
+            raise ValueError, u"PI lacks content"
+        # the regex requires whitespace before 'href' => prepend a space
+        hrefs = _FIND_PI_HREF(u' ' + (<unsigned char*>self._c_node.content).decode('UTF-8'))
+        if len(hrefs) != 1:
+            raise ValueError, u"malformed PI attributes"
+        hrefs = hrefs[0]
+        # one group per quoting style, only one of them is non-empty
+        href_utf = utf8(hrefs[0] or hrefs[1])
+        c_href = _xcstr(href_utf)
+
+        if c_href[0] != c'#':
+            # normal URL, try to parse from it
+            # xmlNodeGetBase() returns a newly allocated string (or NULL)
+            # that we have to free ourselves after resolving the URL
+            c_base = tree.xmlNodeGetBase(self._c_node.doc, self._c_node)
+            c_href = tree.xmlBuildURI(c_href, c_base)
+            if c_base is not NULL:
+                tree.xmlFree(<char*>c_base)
+            if c_href is not NULL:
+                try:
+                    href_utf = <unsigned char*>c_href
+                finally:
+                    tree.xmlFree(<char*>c_href)
+            # if the URL could not be resolved, the plain href is used
+            result_doc = _parseDocumentFromURL(href_utf, parser)
+            return _elementTreeFactory(result_doc, None)
+
+        # ID reference to embedded stylesheet
+        # try XML:ID lookup
+        _assertValidDoc(self._doc)
+        c_href += 1 # skip leading '#'
+        c_attr = tree.xmlGetID(self._c_node.doc, c_href)
+        if c_attr is not NULL and c_attr.doc is self._c_node.doc:
+            result_node = _elementFactory(self._doc, c_attr.parent)
+            return _elementTreeFactory(result_node._doc, result_node)
+
+        # try XPath search
+        root = _findStylesheetByID(self._doc, funicode(c_href))
+        if not root:
+            raise ValueError, u"reference to non-existing embedded stylesheet"
+        elif len(root) > 1:
+            raise ValueError, u"ambiguous reference to embedded stylesheet"
+        result_node = root[0]
+        return _elementTreeFactory(result_node._doc, result_node)
+
+    def set(self, key, value):
+        u"""set(self, key, value)
+
+        Supports setting the 'href' pseudo-attribute in the text of
+        the processing instruction.
+
+        Passing None as value removes an existing 'href'.  Raises
+        AttributeError for any other key and ValueError if the value
+        contains '"' or '>'.
+        """
+        if key != u"href":
+            raise AttributeError, \
+                u"only setting the 'href' attribute is supported on XSLT-PIs"
+        if value is None:
+            attrib = u""
+        elif u'"' in value or u'>' in value:
+            raise ValueError, u"Invalid URL, must not contain '\"' or '>'"
+        else:
+            attrib = u' href="%s"' % value
+        # the regex requires whitespace before 'href' => prepend a space
+        text = u' ' + self.text
+        if _FIND_PI_HREF(text):
+            # 'attrib' is used as a regex replacement template here, so
+            # escape backslashes to have the value inserted literally
+            self.text = _REPLACE_PI_HREF(attrib.replace(u'\\', u'\\\\'), text)
+        else:
+            self.text = text + attrib
diff --git a/lib/lxml/xsltext.pxi b/lib/lxml/xsltext.pxi
new file mode 100644
index 00000000..87fbb58f
--- /dev/null
+++ b/lib/lxml/xsltext.pxi
@@ -0,0 +1,243 @@
+# XSLT extension elements
+
+cdef class XSLTExtension:
+    u"""Base class of an XSLT extension element.
+
+    Subclasses implement `execute()`.  The helper methods
+    `apply_templates()` and `process_children()` expect the `context`
+    object that is passed into `execute()`.
+    """
+    def execute(self, context, self_node, input_node, output_parent):
+        u"""execute(self, context, self_node, input_node, output_parent)
+        Execute this extension element.
+
+        Subclasses must override this method.  They may append
+        elements to the `output_parent` element here, or set its text
+        content.  To this end, the `input_node` provides read-only
+        access to the current node in the input document, and the
+        `self_node` points to the extension element in the stylesheet.
+
+        Note that the `output_parent` parameter may be `None` if there
+        is no parent element in the current context (e.g. no content
+        was added to the output tree yet).
+        """
+        pass
+
+    def apply_templates(self, _XSLTContext context not None, node, output_parent=None,
+                        *, elements_only=False, remove_blank_text=False):
+        u"""apply_templates(self, context, node, output_parent=None, elements_only=False, remove_blank_text=False)
+
+        Call this method to retrieve the result of applying templates
+        to an element.
+
+        The return value is a list of elements or text strings that
+        were generated by the XSLT processor.  If you pass
+        ``elements_only=True``, strings will be discarded from the result
+        list.  The option ``remove_blank_text=True`` will only discard
+        strings that consist entirely of whitespace (e.g. formatting).
+        These options do not apply to Elements, only to bare string results.
+
+        If you pass an Element as `output_parent` parameter, the result
+        will instead be appended to the element (including attributes
+        etc.) and the return value will be `None`.  This is a safe way
+        to generate content into the output document directly, without
+        having to take care of special values like text or attributes.
+        Note that the string discarding options will be ignored in this
+        case.
+        """
+        cdef xmlNode* c_parent
+        cdef xmlNode* c_node
+        cdef xmlNode* c_context_node
+        assert context._xsltCtxt is not NULL, "XSLT context not initialised"
+        c_context_node = _roNodeOf(node)
+        #assert c_context_node.doc is context._xsltContext.node.doc, \
+        #    "switching input documents during transformation is not currently supported"
+
+        if output_parent is not None:
+            c_parent = _nonRoNodeOf(output_parent)
+        else:
+            # no target given: collect the output below a temporary node
+            # that gets freed again before returning
+            c_parent = tree.xmlNewDocNode(
+                context._xsltCtxt.output, NULL, <unsigned char*>"fake-parent", NULL)
+
+        # temporarily redirect the insertion point of the transformation
+        c_node = context._xsltCtxt.insert
+        context._xsltCtxt.insert = c_parent
+        xslt.xsltProcessOneNode(
+            context._xsltCtxt, c_context_node, NULL)
+        context._xsltCtxt.insert = c_node
+
+        if output_parent is not None:
+            return None
+
+        try:
+            return self._collectXSLTResultContent(
+                context, c_parent, elements_only, remove_blank_text)
+        finally:
+            # free all intermediate nodes that will not be freed by proxies
+            tree.xmlFreeNode(c_parent)
+
+    def process_children(self, _XSLTContext context not None, output_parent=None,
+                         *, elements_only=False, remove_blank_text=False):
+        u"""process_children(self, context, output_parent=None, elements_only=False, remove_blank_text=False)
+
+        Call this method to process the XSLT content of the extension
+        element itself.
+
+        The return value is a list of elements or text strings that
+        were generated by the XSLT processor.  If you pass
+        ``elements_only=True``, strings will be discarded from the result
+        list.  The option ``remove_blank_text=True`` will only discard
+        strings that consist entirely of whitespace (e.g. formatting).
+        These options do not apply to Elements, only to bare string results.
+
+        If you pass an Element as `output_parent` parameter, the result
+        will instead be appended to the element (including attributes
+        etc.) and the return value will be `None`.  This is a safe way
+        to generate content into the output document directly, without
+        having to take care of special values like text or attributes.
+        Note that the string discarding options will be ignored in this
+        case.
+        """
+        cdef xmlNode* c_parent
+        cdef xmlNode* c_old_output_parent
+        cdef xslt.xsltTransformContext* c_ctxt = context._xsltCtxt
+        # check the context pointer before reading any of its fields
+        assert c_ctxt is not NULL, "XSLT context not initialised"
+        c_old_output_parent = c_ctxt.insert
+
+        # output_parent node is used for adding results instead of
+        # elements list used in apply_templates, that's easier and allows to
+        # use attributes added to extension element with <xsl:attribute>.
+
+        if output_parent is not None:
+            c_parent = _nonRoNodeOf(output_parent)
+        else:
+            # no target given: collect the output below a temporary node
+            # that gets freed again before returning
+            c_parent = tree.xmlNewDocNode(
+                c_ctxt.output, NULL, <unsigned char*>"fake-parent", NULL)
+
+        # Insert into the node selected above.  This must be c_parent and
+        # not a second lookup of output_parent, which is None by default
+        # and would bypass the temporary node.
+        c_ctxt.insert = c_parent
+        xslt.xsltApplyOneTemplate(c_ctxt,
+            c_ctxt.node, c_ctxt.inst.children, NULL, NULL)
+        c_ctxt.insert = c_old_output_parent
+
+        if output_parent is not None:
+            return None
+
+        try:
+            return self._collectXSLTResultContent(
+                context, c_parent, elements_only, remove_blank_text)
+        finally:
+            # free all intermediate nodes that will not be freed by proxies
+            tree.xmlFreeNode(c_parent)
+
+    cdef _collectXSLTResultContent(self, _XSLTContext context, xmlNode* c_parent,
+                                   bint elements_only, bint remove_blank_text):
+        # Convert the direct children of c_parent into a Python list:
+        # text nodes become strings (subject to the two filter flags),
+        # element nodes become read-only proxies.  Any other node type
+        # raises TypeError.
+        cdef xmlNode* c_node
+        cdef xmlNode* c_next
+        cdef _ReadOnlyProxy proxy
+        cdef list results = [] # or maybe _collectAttributes(c_parent, 2) ?
+        c_node = c_parent.children
+        while c_node is not NULL:
+            # remember the sibling first, the node may get unlinked below
+            c_next = c_node.next
+            if c_node.type == tree.XML_TEXT_NODE:
+                if not elements_only:
+                    s = funicode(c_node.content)
+                    if not remove_blank_text or s.strip():
+                        results.append(s)
+                    s = None
+            elif c_node.type == tree.XML_ELEMENT_NODE:
+                proxy = _newReadOnlyProxy(
+                    context._extension_element_proxy, c_node)
+                results.append(proxy)
+                # unlink node and make sure it will be freed later on
+                tree.xmlUnlinkNode(c_node)
+                proxy.free_after_use()
+            else:
+                raise TypeError, \
+                    u"unsupported XSLT result type: %d" % c_node.type
+            c_node = c_next
+        return results
+
+
+cdef _registerXSLTExtensions(xslt.xsltTransformContext* c_ctxt,
+                             extension_dict):
+    # Register _callExtensionElement() as the libxslt handler for every
+    # (namespace, name) key found when iterating over extension_dict.
+    for element_key in extension_dict:
+        namespace_utf, tag_utf = element_key
+        xslt.xsltRegisterExtElement(
+            c_ctxt,
+            _xcstr(tag_utf),
+            _xcstr(namespace_utf),
+            <xslt.xsltTransformFunction>_callExtensionElement)
+
+cdef void _callExtensionElement(xslt.xsltTransformContext* c_ctxt,
+                                xmlNode* c_context_node,
+                                xmlNode* c_inst_node,
+                                void* dummy) with gil:
+    # Callback that _registerXSLTExtensions() registers with libxslt via
+    # xsltRegisterExtElement().  It acquires the GIL, looks up the
+    # extension object for the (namespace, name) of c_inst_node in
+    # context._extension_elements, wraps the involved nodes in proxies and
+    # calls extension.execute().
+    #
+    # c_ctxt:         the running transformation context
+    # c_context_node: the current node of the input document
+    # c_inst_node:    the extension element in the stylesheet
+    # dummy:          not used by this function
+    #
+    # No exception leaves this function: errors are reported through
+    # xsltTransformError() and recorded with context._exc._store_raised().
+    cdef _XSLTContext context
+    cdef XSLTExtension extension
+    cdef python.PyObject* dict_result
+    cdef xmlNode* c_node
+    cdef _ReadOnlyProxy context_node = None, self_node = None
+    cdef object output_parent # not restricted to ro-nodes
+    c_uri = _getNs(c_inst_node)
+    if c_uri is NULL:
+        # not allowed, and should never happen
+        return
+    if c_ctxt.xpathCtxt.userData is NULL:
+        # just for safety, should never happen
+        return
+    # the XPath context's user data is interpreted as the _XSLTContext object
+    context = <_XSLTContext>c_ctxt.xpathCtxt.userData
+    try:
+        try:
+            # extensions are keyed by (namespace URI, element name);
+            # a NULL result means that there is no entry for this key
+            dict_result = python.PyDict_GetItem(
+                context._extension_elements, (<unsigned char*>c_uri, <unsigned char*>c_inst_node.name))
+            if dict_result is NULL:
+                raise KeyError, \
+                    u"extension element %s not found" % funicode(c_inst_node.name)
+            extension = <object>dict_result
+
+            try:
+                # build the context proxy nodes
+                self_node = _newReadOnlyProxy(None, c_inst_node)
+                if _isElement(c_ctxt.insert):
+                    output_parent = _newAppendOnlyProxy(self_node, c_ctxt.insert)
+                else:
+                    # may be the document node or other stuff
+                    output_parent = _newOpaqueAppendOnlyNodeWrapper(c_ctxt.insert)
+                if c_context_node.type in (tree.XML_DOCUMENT_NODE,
+                                           tree.XML_HTML_DOCUMENT_NODE):
+                    # for a document node, pass its root element instead,
+                    # or None if the document has no root element
+                    c_node = tree.xmlDocGetRootElement(<xmlDoc*>c_context_node)
+                    if c_node is not NULL:
+                        context_node = _newReadOnlyProxy(self_node, c_node)
+                    else:
+                        context_node = None
+                elif c_context_node.type in (tree.XML_ATTRIBUTE_NODE,
+                                             tree.XML_TEXT_NODE,
+                                             tree.XML_CDATA_SECTION_NODE):
+                    # this isn't easy to support using read-only
+                    # nodes, as the smart-string factory must
+                    # instantiate the parent proxy somehow...
+                    raise TypeError("Unsupported element type: %d" % c_context_node.type)
+                else:
+                    context_node  = _newReadOnlyProxy(self_node, c_context_node)
+
+                # run the XSLT extension
+                context._extension_element_proxy = self_node
+                extension.execute(context, self_node, context_node, output_parent)
+            finally:
+                # always reset the context's proxy reference and hand the
+                # proxies of this call to _freeReadOnlyProxies()
+                context._extension_element_proxy = None
+                if self_node is not None:
+                    _freeReadOnlyProxies(self_node)
+        except Exception, e:
+            # report the error to libxslt with as much detail as can be
+            # encoded, then record the exception in context._exc
+            try:
+                e = unicode(e).encode(u"UTF-8")
+            except:
+                e = repr(e).encode(u"UTF-8")
+            message = python.PyBytes_FromFormat(
+                "Error executing extension element '%s': %s",
+                c_inst_node.name, _cstr(e))
+            xslt.xsltTransformError(c_ctxt, NULL, c_inst_node, message)
+            context._exc._store_raised()
+        except:
+            # just in case
+            message = python.PyBytes_FromFormat(
+                "Error executing extension element '%s'", c_inst_node.name)
+            xslt.xsltTransformError(c_ctxt, NULL, c_inst_node, message)
+            context._exc._store_raised()
+    except:
+        # reached when the error reporting above failed itself
+        # no Python functions here - everything can fail...
+        xslt.xsltTransformError(c_ctxt, NULL, c_inst_node,
+                                "Error during XSLT extension element evaluation")
+        context._exc._store_raised()
+    finally:
+        return  # swallow any further exceptions