~bzr-pqm/bzr/bzr.dev

1 by mbp at sourcefrog
import from baz patch-364
1
#! /usr/bin/env python
2
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
17
"""XML externalization support."""
18
48 by Martin Pool
witty comment
19
# "XML is like violence: if it doesn't solve your problem, you aren't
20
# using enough of it." -- various
21
1180 by Martin Pool
- start splitting code for xml (de)serialization away from objects
22
# importing this module is fairly slow because it has to load several
23
# ElementTree bits
24
1248 by Martin Pool
- new weave based cleanup [broken]
25
from bzrlib.trace import mutter, warning
26
802 by Martin Pool
- Remove XMLMixin class in favour of simple pack_xml, unpack_xml functions
27
try:
1283 by Martin Pool
- cElementTree is typically not installed in util
28
    from cElementTree import (ElementTree, SubElement, Element,
29
                              XMLTreeBuilder, fromstring, tostring)
802 by Martin Pool
- Remove XMLMixin class in favour of simple pack_xml, unpack_xml functions
30
except ImportError:
1282 by Martin Pool
- use regular python warnings for warning about cElementTree
31
    from warnings import warn
32
    warn('using slower ElementTree; consider installing cElementTree')
1227 by Martin Pool
- methods to deserialize objects from strings
33
    from util.elementtree.ElementTree import (ElementTree, SubElement,
1248 by Martin Pool
- new weave based cleanup [broken]
34
                                              Element, XMLTreeBuilder,
35
                                              fromstring, tostring)
802 by Martin Pool
- Remove XMLMixin class in favour of simple pack_xml, unpack_xml functions
36
1180 by Martin Pool
- start splitting code for xml (de)serialization away from objects
37
from bzrlib.inventory import ROOT_ID, Inventory, InventoryEntry
1182 by Martin Pool
- more disentangling of xml storage format from objects
38
from bzrlib.revision import Revision, RevisionReference        
1183 by Martin Pool
- implement version 5 xml storage, and tests
39
from bzrlib.errors import BzrError
1180 by Martin Pool
- start splitting code for xml (de)serialization away from objects
40
41
42
class Serializer(object):
    """Abstract object serialize/deserialize.

    This base class only moves XML elements to and from files and
    strings.  The conversions between objects and elements are done by
    ``_pack_inventory``, ``_unpack_inventory``, ``_pack_revision`` and
    ``_unpack_revision``, which are not defined here and must be
    supplied by a concrete subclass.
    """

    def write_inventory(self, inv, f):
        """Write inventory `inv` as XML to the file-like object `f`."""
        elt = self._pack_inventory(inv)
        self._write_element(elt, f)

    def write_inventory_to_string(self, inv):
        """Return inventory `inv` serialized as an XML string."""
        return tostring(self._pack_inventory(inv))

    def read_inventory_from_string(self, xml_string):
        """Parse `xml_string` and return the inventory it describes."""
        return self._unpack_inventory(fromstring(xml_string))

    def read_inventory(self, f):
        """Read XML from the file-like object `f` and return an inventory."""
        return self._unpack_inventory(self._read_element(f))

    def write_revision(self, rev, f):
        """Write revision `rev` as XML to the file-like object `f`."""
        self._write_element(self._pack_revision(rev), f)

    def write_revision_to_string(self, rev):
        """Return revision `rev` serialized as an XML string."""
        # There is no file involved here: this mirrors
        # write_inventory_to_string and passes only the element.  (An
        # earlier version also passed an undefined name `f`, which
        # raised NameError on every call.)
        return tostring(self._pack_revision(rev))

    def read_revision(self, f):
        """Read XML from the file-like object `f` and return a revision."""
        return self._unpack_revision(self._read_element(f))

    def read_revision_from_string(self, xml_string):
        """Parse `xml_string` and return the revision it describes."""
        return self._unpack_revision(fromstring(xml_string))

    def _write_element(self, elt, f):
        """Write element `elt` to `f` as utf-8 XML plus a trailing newline."""
        ElementTree(elt).write(f, 'utf-8')
        f.write('\n')

    def _read_element(self, f):
        """Parse the XML document in `f` and return the parse result."""
        return ElementTree().parse(f)
76
77
78
class _Serializer_v4(Serializer):
    """Version 0.0.4 serializer

    Implements the object <-> XML element conversions that the
    Serializer base class expects.

    You should use the serializer_v4 singleton."""

    __slots__ = []

    def _pack_inventory(self, inv):
        """Convert to XML Element"""
        e = Element('inventory')
        e.text = '\n'
        # Only record the root id when it differs from the default.
        if inv.root.file_id not in (None, ROOT_ID):
            e.set('file_id', inv.root.file_id)
        for path, ie in inv.iter_entries():
            e.append(self._pack_entry(ie))
        return e

    def _pack_entry(self, ie):
        """Convert InventoryEntry to XML element"""
        e = Element('entry')
        e.set('name', ie.name)
        e.set('file_id', ie.file_id)
        e.set('kind', ie.kind)

        if ie.text_size is not None:
            e.set('text_size', '%d' % ie.text_size)

        # Optional attributes are written only when they have a value.
        for f in ['text_id', 'text_sha1']:
            v = getattr(ie, f)
            if v is not None:
                e.set(f, v)

        # to be conservative, we don't externalize the root pointers
        # for now, leaving them as null in the xml form.  in a future
        # version it will be implied by nested elements.
        if ie.parent_id != ROOT_ID:
            assert isinstance(ie.parent_id, basestring)
            e.set('parent_id', ie.parent_id)

        e.tail = '\n'

        return e

    def _unpack_inventory(self, elt):
        """Construct an Inventory from an <inventory> XML Element."""
        assert elt.tag == 'inventory'
        root_id = elt.get('file_id') or ROOT_ID
        inv = Inventory(root_id)
        for e in elt:
            ie = self._unpack_entry(e)
            # Entries without a stored parent are unpacked with ROOT_ID;
            # re-point them at this inventory's actual root id.
            if ie.parent_id == ROOT_ID:
                ie.parent_id = root_id
            inv.add(ie)
        return inv

    def _unpack_entry(self, elt):
        """Construct an InventoryEntry from an <entry> XML Element."""
        assert elt.tag == 'entry'

        ## original format inventories don't have a parent_id for
        ## nodes in the root directory, but it's cleaner to use one
        ## internally.
        parent_id = elt.get('parent_id')
        if parent_id is None:
            parent_id = ROOT_ID

        ie = InventoryEntry(elt.get('file_id'),
                            elt.get('name'),
                            elt.get('kind'),
                            parent_id)
        ie.text_id = elt.get('text_id')
        ie.text_sha1 = elt.get('text_sha1')

        ## mutter("read inventoryentry: %r" % (elt.attrib))

        # A missing text_size attribute stays None; otherwise it is
        # converted to an int.
        v = elt.get('text_size')
        ie.text_size = v and int(v)

        return ie

    def _pack_revision(self, rev):
        """Revision object -> xml tree"""
        root = Element('revision',
                       committer=rev.committer,
                       timestamp='%.9f' % rev.timestamp,
                       revision_id=rev.revision_id,
                       inventory_id=rev.inventory_id,
                       inventory_sha1=rev.inventory_sha1,
                       )
        # A false timezone (None or 0) is not written out.
        if rev.timezone:
            root.set('timezone', str(rev.timezone))
        root.text = '\n'

        msg = SubElement(root, 'message')
        msg.text = rev.message
        msg.tail = '\n'

        if rev.parents:
            pelts = SubElement(root, 'parents')
            pelts.tail = pelts.text = '\n'
            for rr in rev.parents:
                assert isinstance(rr, RevisionReference)
                p = SubElement(pelts, 'revision_ref')
                p.tail = '\n'
                assert rr.revision_id
                p.set('revision_id', rr.revision_id)
                if rr.revision_sha1:
                    p.set('revision_sha1', rr.revision_sha1)

        return root

    def _unpack_revision(self, elt):
        """XML Element -> Revision object

        Raises BzrError if the element's tag is neither 'revision' nor
        the deprecated 'changeset'.
        """
        # <changeset> is deprecated...
        if elt.tag not in ('revision', 'changeset'):
            raise BzrError("unexpected tag in revision file: %r" % elt)

        rev = Revision(committer=elt.get('committer'),
                       timestamp=float(elt.get('timestamp')),
                       revision_id=elt.get('revision_id'),
                       inventory_id=elt.get('inventory_id'),
                       inventory_sha1=elt.get('inventory_sha1')
                       )

        precursor = elt.get('precursor')
        precursor_sha1 = elt.get('precursor_sha1')

        pelts = elt.find('parents')

        # Test explicitly for "present and has children" instead of
        # relying on the truth value of an Element, which ElementTree
        # deprecates.  An absent or empty <parents> still falls through
        # to the precursor handling below, exactly as before.
        if pelts is not None and len(pelts):
            for p in pelts:
                assert p.tag == 'revision_ref', \
                       "bad parent node tag %r" % p.tag
                rev_ref = RevisionReference(p.get('revision_id'),
                                            p.get('revision_sha1'))
                rev.parents.append(rev_ref)

            if precursor:
                # must be consistent
                prec_parent = rev.parents[0].revision_id
                assert prec_parent == precursor
        elif precursor:
            # revisions written prior to 0.0.5 have a single precursor
            # given as an attribute
            rev_ref = RevisionReference(precursor, precursor_sha1)
            rev.parents.append(rev_ref)

        # A missing timezone attribute stays None.
        v = elt.get('timezone')
        rev.timezone = v and int(v)

        rev.message = elt.findtext('message') # text of <message>
        return rev
236
237
238
1183 by Martin Pool
- implement version 5 xml storage, and tests
239
1180 by Martin Pool
- start splitting code for xml (de)serialization away from objects
240
"""singleton instance"""
241
# Shared module-level instance of the version 0.0.4 serializer; the
# _Serializer_v4 docstring directs callers to use this object rather
# than constructing their own.
serializer_v4 = _Serializer_v4()
1183 by Martin Pool
- implement version 5 xml storage, and tests
242