20
19
# "XML is like violence: if it doesn't solve your problem, you aren't
21
20
# using enough of it." -- various
22
# importing this module is fairly slow because it has to load several
24
__copyright__ = "Copyright (C) 2005 Canonical Ltd."
25
__author__ = "Martin Pool <mbp@canonical.com>"
25
from bzrlib import registry
26
from bzrlib.trace import mutter, warning
28
from cElementTree import Element, ElementTree, SubElement
30
# it's in this package in python2.5
31
from xml.etree.cElementTree import (ElementTree, SubElement, Element,
32
XMLTreeBuilder, fromstring, tostring)
33
import xml.etree as elementtree
35
from cElementTree import (ElementTree, SubElement, Element,
36
XMLTreeBuilder, fromstring, tostring)
38
ParseError = SyntaxError
29
39
except ImportError:
30
from elementtree.ElementTree import Element, ElementTree, SubElement
33
from trace import mutter
37
raise Exception("XMLMixin.to_element must be overridden in concrete classes")
39
def write_xml(self, f):
40
ElementTree(self.to_element()).write(f, 'utf-8')
40
mutter('WARNING: using slower ElementTree; consider installing cElementTree'
41
" and make sure it's on your PYTHONPATH")
42
# this copy is shipped with bzr
43
from util.elementtree.ElementTree import (ElementTree, SubElement,
44
Element, XMLTreeBuilder,
46
import util.elementtree as elementtree
47
from xml.parsers.expat import ExpatError as ParseError
49
from bzrlib import errors
52
class Serializer(object):
53
"""Abstract object serialize/deserialize"""
55
def write_inventory(self, inv, f):
56
"""Write inventory to a file"""
57
raise NotImplementedError(self.write_inventory)
59
def write_inventory_to_string(self, inv):
60
raise NotImplementedError(self.write_inventory_to_string)
62
def read_inventory_from_string(self, xml_string, revision_id=None):
63
"""Read xml_string into an inventory object.
65
:param xml_string: The xml to read.
66
:param revision_id: If not-None, the expected revision id of the
67
inventory. Some serialisers use this to set the results' root
71
return self._unpack_inventory(fromstring(xml_string), revision_id)
73
raise errors.UnexpectedInventoryFormat(e)
75
def read_inventory(self, f, revision_id=None):
77
return self._unpack_inventory(self._read_element(f),
80
raise errors.UnexpectedInventoryFormat(e)
82
def write_revision(self, rev, f):
83
self._write_element(self._pack_revision(rev), f)
85
def write_revision_to_string(self, rev):
86
return tostring(self._pack_revision(rev)) + '\n'
88
def read_revision(self, f):
89
return self._unpack_revision(self._read_element(f))
91
def read_revision_from_string(self, xml_string):
92
return self._unpack_revision(fromstring(xml_string))
94
def _write_element(self, elt, f):
95
ElementTree(elt).write(f, 'utf-8')
44
return cls.from_element(ElementTree().parse(f))
46
read_xml = classmethod(read_xml)
98
def _read_element(self, f):
99
return ElementTree().parse(f)
102
# performance tuning for elementree's serialiser. This should be
103
# sent upstream - RBC 20060523.
104
# the functions here are patched into elementtree at runtime.
106
escape_re = re.compile("[&'\"<>]")
109
"'":"'", # FIXME: overkill
114
def _escape_replace(match, map=escape_map):
115
return map[match.group()]
117
def _escape_attrib(text, encoding=None, replace=None):
118
# escape attribute value
122
text = elementtree.ElementTree._encode(text, encoding)
124
return elementtree.ElementTree._encode_entity(text)
126
return escape_re.sub(_escape_replace, text)
128
text = replace(text, "&", "&")
129
text = replace(text, "'", "'") # FIXME: overkill
130
text = replace(text, "\"", """)
131
text = replace(text, "<", "<")
132
text = replace(text, ">", ">")
134
except (TypeError, AttributeError):
135
elementtree.ElementTree._raise_serialization_error(text)
137
elementtree.ElementTree._escape_attrib = _escape_attrib
139
escape_cdata_re = re.compile("[&<>]")
145
def _escape_cdata_replace(match, map=escape_cdata_map):
146
return map[match.group()]
148
def _escape_cdata(text, encoding=None, replace=None):
149
# escape character data
153
text = elementtree.ElementTree._encode(text, encoding)
155
return elementtree.ElementTree._encode_entity(text)
157
return escape_cdata_re.sub(_escape_cdata_replace, text)
159
text = replace(text, "&", "&")
160
text = replace(text, "<", "<")
161
text = replace(text, ">", ">")
163
except (TypeError, AttributeError):
164
elementtree.ElementTree._raise_serialization_error(text)
166
elementtree.ElementTree._escape_cdata = _escape_cdata
169
class SerializerRegistry(registry.Registry):
170
"""Registry for serializer objects"""
173
format_registry = SerializerRegistry()
174
format_registry.register_lazy('4', 'bzrlib.xml4', 'serializer_v4')
175
format_registry.register_lazy('5', 'bzrlib.xml5', 'serializer_v5')
176
format_registry.register_lazy('6', 'bzrlib.xml6', 'serializer_v6')
177
format_registry.register_lazy('7', 'bzrlib.xml7', 'serializer_v7')