~bzr-pqm/bzr/bzr.dev

184 by mbp at sourcefrog
pychecker fixups
1
# (C) 2005 Canonical
1 by mbp at sourcefrog
import from baz patch-364
2
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
1185.16.40 by Martin Pool
todo
17
# TODO: Some kind of command-line display of revision properties: 
18
# perhaps show them in log -v and allow them as options to the commit command.
1 by mbp at sourcefrog
import from baz patch-364
19
1590.1.1 by Robert Collins
Improve common_ancestor performance.
20
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
21
import bzrlib.errors
1590.1.1 by Robert Collins
Improve common_ancestor performance.
22
import bzrlib.errors as errors
1594.2.15 by Robert Collins
Unfuck performance.
23
from bzrlib.graph import node_distances, select_farthest, all_descendants, Graph
1185.16.39 by Martin Pool
- constraints on revprops
24
from bzrlib.osutils import contains_whitespace
1534.9.1 by Aaron Bentley
Added progress bars to merge
25
from bzrlib.progress import DummyProgress
8 by mbp at sourcefrog
store committer's timezone in revision and show
26
974.1.90 by Aaron Bentley
Switched NULL revision ID to 'null:' per robertc's suggestion
27
# Revision id of the synthetic root node: the graph helpers in this module
# give every parentless revision this id as its parent, so that all
# ancestry graphs share a single root.
NULL_REVISION="null:"
974.1.89 by Aaron Bentley
Fixed merging with multiple roots, by using null as graph root.
28
802 by Martin Pool
- Remove XMLMixin class in favour of simple pack_xml, unpack_xml functions
29
class Revision(object):
    """Single revision on a branch.

    Revisions may know their revision_hash, but only once they've been
    written out.  This is not stored because you cannot write the hash
    into the file it describes.

    After bzr 0.0.5 revisions are allowed to have multiple parents.

    parent_ids
        List of parent revision_ids

    properties
        Dictionary of revision properties.  These are attached to the
        revision as extra metadata.  The name must be a single
        word; the value can be an arbitrary string.
    """

    def __init__(self, revision_id, properties=None, **args):
        """Create a revision.

        :param revision_id: identifier of this revision.
        :param properties: optional dictionary of revision properties; it
            is validated by _check_properties.
        :param args: any further attributes (for instance parent_ids or
            message); they are copied directly onto the instance.
        :raises ValueError: if a property name or value is invalid.
        """
        self.revision_id = revision_id
        self.properties = properties or {}
        self._check_properties()
        # Install the defaults first so that values given in args win.
        self.parent_ids = []
        self.parent_sha1s = []
        self.__dict__.update(args)

    def __repr__(self):
        return "<Revision id %s>" % self.revision_id

    def __eq__(self, other):
        """Compare the metadata of two revisions.

        Anything that is not a Revision compares unequal.
        """
        if not isinstance(other, Revision):
            return False
        # FIXME: rbc 20050930 parent_ids are not being compared
        return (
                self.inventory_sha1 == other.inventory_sha1
                and self.revision_id == other.revision_id
                and self.timestamp == other.timestamp
                and self.message == other.message
                and self.timezone == other.timezone
                and self.committer == other.committer
                and self.properties == other.properties)

    def __ne__(self, other):
        return not self.__eq__(other)

    def _check_properties(self):
        """Verify that all revision properties are OK.

        :raises ValueError: if a name is not a string or contains
            whitespace, or if a value is not a string.
        """
        for name, value in self.properties.items():
            if not isinstance(name, basestring) or contains_whitespace(name):
                # Wrap in a tuple so that a tuple-valued name cannot be
                # mistaken for the list of format arguments.
                raise ValueError("invalid property name %r" % (name,))
            if not isinstance(value, basestring):
                # The message reads "value ... for name", so the value has
                # to be the first format argument.
                raise ValueError("invalid property value %r for %r" %
                                 (value, name))

    def get_history(self, repository):
        """Return the canonical line-of-history for this revision.

        The first parent of each revision is followed until a revision
        without parents is reached.  The result is ordered oldest first and
        starts with None, which stands for the parent of the oldest
        revision.

        If ghosts are present this may differ in result from a ghost-free
        repository.

        :param repository: object whose get_revision(revision_id) returns
            the revision object for a parent id.
        """
        history = []
        revision = self
        while revision is not None:
            history.append(revision.revision_id)
            if revision.parent_ids:
                revision = repository.get_revision(revision.parent_ids[0])
            else:
                # Reached the start of the line of history.
                history.append(None)
                revision = None
        history.reverse()
        return history
102
1268 by Martin Pool
- is_ancestor now works by looking at the Branch's stored ancestry
103
104
def is_ancestor(revision_id, candidate_id, branch):
    """Return true if candidate_id is an ancestor of revision_id.

    The answer is looked up in the ancestry that branch.repository
    reports for revision_id, so a candidate that is missing from that
    stored ancestry is reported as not being an ancestor.

    :param revision_id: the revision whose ancestry is consulted.
    :param candidate_id: the revision id searched for in that ancestry.
    :param branch: object whose repository attribute provides
        get_ancestry(revision_id).
    """
    ancestry = branch.repository.get_ancestry(revision_id)
    return candidate_id in ancestry
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
114
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
115
116
def iter_ancestors(revision_id, revision_source, only_present=False):
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
117
    ancestors = (revision_id,)
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
118
    distance = 0
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
119
    while len(ancestors) > 0:
120
        new_ancestors = []
121
        for ancestor in ancestors:
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
122
            if not only_present:
123
                yield ancestor, distance
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
124
            try:
125
                revision = revision_source.get_revision(ancestor)
126
            except bzrlib.errors.NoSuchRevision, e:
127
                if e.revision == revision_id:
128
                    raise 
129
                else:
130
                    continue
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
131
            if only_present:
132
                yield ancestor, distance
1313 by Martin Pool
- rename to Revision.parent_ids to avoid confusion with old usage
133
            new_ancestors.extend(revision.parent_ids)
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
134
        ancestors = new_ancestors
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
135
        distance += 1
136
137
138
def find_present_ancestors(revision_id, revision_source):
    """Return the ancestors of a revision present in a branch.

    It's possible that a branch won't have the complete ancestry of
    one of its revisions.

    :param revision_id: the revision whose ancestry is walked.
    :param revision_source: object passed on to iter_ancestors, which
        calls its get_revision method.
    :return: dictionary mapping each present ancestor id (revision_id
        included) to a tuple (order, distance) describing the first time
        iter_ancestors yielded it: its position in the iteration and its
        distance from revision_id.
    """
    found_ancestors = {}
    anc_iter = enumerate(iter_ancestors(revision_id, revision_source,
                         only_present=True))
    for anc_order, (anc_id, anc_distance) in anc_iter:
        # Only the first sighting counts: later sightings of the same
        # revision arrive via other paths.
        if anc_id not in found_ancestors:
            found_ancestors[anc_id] = (anc_order, anc_distance)
    return found_ancestors
152
    
1153 by Martin Pool
- clean up some code in revision.py
153
154
def __get_closest(intersection):
    """Return the third field of every entry tied for the smallest key.

    intersection is sorted in place; each entry is a sequence whose first
    item is the sort key and whose third item is the value to report.
    """
    intersection.sort()
    if not intersection:
        return []
    smallest = intersection[0][0]
    return [entry[2] for entry in intersection if entry[0] == smallest]
161
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
162
974.1.60 by aaron.bentley at utoronto
Initial import of common-ancestor detection
163
def revision_graph(revision, revision_source):
    """Produce a graph of the ancestry of the specified revision.

    revision_source is read-locked while the graph is built and unlocked
    again afterwards, even if building the graph fails.

    :return: root, ancestors map, descendants map
    """
    revision_source.lock_read()
    try:
        graph_parts = _revision_graph(revision, revision_source)
    finally:
        revision_source.unlock()
    return graph_parts
173
1590.1.1 by Robert Collins
Improve common_ancestor performance.
174
1587.1.4 by Robert Collins
Quick, urgent fix for common_ancestor performance.
175
def _revision_graph(revision, revision_source):
    """See revision_graph."""
    from bzrlib.tsort import topo_sort
    parent_map = revision_source.get_revision_graph(revision)

    # Every revision without parents becomes a child of NULL_REVISION,
    # and NULL_REVISION itself joins the graph as a parentless node.
    for rev_id, rev_parents in parent_map.items():
        if len(rev_parents) == 0:
            parent_map[rev_id] = [NULL_REVISION]
    parent_map[NULL_REVISION] = []

    # The root is whatever the topological sort puts first; with several
    # roots this could be any one of them.
    root = topo_sort(parent_map.items())[0]

    # Build the returned maps: ancestors holds a set of parents per node,
    # descendants a dictionary keyed by child per node.
    descendants = dict((rev_id, {}) for rev_id in parent_map.keys())
    ancestors = {}
    for rev_id, rev_parents in parent_map.items():
        for parent_id in rev_parents:
            descendants[parent_id][rev_id] = 1
        ancestors[rev_id] = set(rev_parents)

    assert root not in descendants[root]
    assert root not in ancestors[root]
    return root, ancestors, descendants
206
1092.3.4 by Robert Collins
update symlink branch to integration
207
974.1.60 by aaron.bentley at utoronto
Initial import of common-ancestor detection
208
def combined_graph(revision_a, revision_b, revision_source):
    """Produce a combined ancestry graph.

    The graph of revision_b is merged into the graph of revision_a.

    :return: graph root, ancestors map, descendants map, set of common
        nodes (the nodes that occur in both graphs)
    :raises NoCommonRoot: if the two graphs have different roots.
    """
    root, ancestors, descendants = revision_graph(
        revision_a, revision_source)
    other_root, other_ancestors, other_descendants = revision_graph(
        revision_b, revision_source)
    if root != other_root:
        raise bzrlib.errors.NoCommonRoot(revision_a, revision_b)

    common = set()
    for node, node_parents in other_ancestors.items():
        if node not in ancestors:
            # Only known to revision_b's graph: take over its parents.
            ancestors[node] = set(node_parents)
            continue
        common.add(node)
        ancestors[node].update(node_parents)

    for node, node_children in other_descendants.items():
        descendants.setdefault(node, {}).update(node_children)
    return root, ancestors, descendants, common
229
1092.3.4 by Robert Collins
update symlink branch to integration
230
1534.9.1 by Aaron Bentley
Added progress bars to merge
231
def common_ancestor(revision_a, revision_b, revision_source,
                    pb=None):
    """Pick a common ancestor of revision_a and revision_b.

    The graph of both revisions (ghosts included) is fetched from
    revision_source and rooted at NULL_REVISION.  The result is whatever
    select_farthest picks among the common nodes, given the distances
    computed by node_distances from that root.

    :param revision_a: first revision id, or None.
    :param revision_b: second revision id, or None.
    :param revision_source: object providing
        get_revision_graph_with_ghosts(revision_ids).
    :param pb: progress bar to report to; a DummyProgress is created when
        none is given.  It is cleared before this function returns or
        raises.
    :return: None if either revision is None, the revision itself if both
        are equal, otherwise the id of the selected common ancestor.
    :raises NoCommonAncestor: if no common node other than NULL_REVISION
        is selected.
    """
    if None in (revision_a, revision_b):
        return None
    # trivial optimisation
    if revision_a == revision_b:
        return revision_a
    if pb is None:
        # Created per call rather than once as a shared default argument.
        pb = DummyProgress()
    try:
        try:
            pb.update('Picking ancestor', 1, 3)
            graph = revision_source.get_revision_graph_with_ghosts(
                [revision_a, revision_b])
            # convert to a NULL_REVISION based graph.
            ancestors = graph.get_ancestors()
            descendants = graph.get_descendants()
            common = set(graph.get_ancestry(revision_a)).intersection(
                     set(graph.get_ancestry(revision_b)))
            descendants[NULL_REVISION] = {}
            ancestors[NULL_REVISION] = []
            for root in graph.roots:
                descendants[NULL_REVISION][root] = 1
                ancestors[root].append(NULL_REVISION)
            for ghost in graph.ghosts:
                # ghosts act as roots for the purpose of finding
                # the longest paths from the root: any ghost *might*
                # be directly attached to the root, so we treat them
                # as being such.
                # ghost now descends from NULL
                descendants[NULL_REVISION][ghost] = 1
                # that is it has an ancestor of NULL
                ancestors[ghost] = [NULL_REVISION]
                # ghost is common if any of ghosts descendants are common:
                for ghost_descendant in descendants[ghost]:
                    if ghost_descendant in common:
                        common.add(ghost)

            root = NULL_REVISION
            common.add(NULL_REVISION)
        except bzrlib.errors.NoCommonRoot:
            raise bzrlib.errors.NoCommonAncestor(revision_a, revision_b)

        pb.update('Picking ancestor', 2, 3)
        distances = node_distances (descendants, ancestors, root)
        # Third and last step of three.
        pb.update('Picking ancestor', 3, 3)
        farthest = select_farthest(distances, common)
        if farthest is None or farthest == NULL_REVISION:
            raise bzrlib.errors.NoCommonAncestor(revision_a, revision_b)
    finally:
        pb.clear()
    return farthest
974.1.60 by aaron.bentley at utoronto
Initial import of common-ancestor detection
281
282
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
283
class MultipleRevisionSources(object):
    """Proxy that looks in multiple branches for revisions.

    The sources are consulted in the order in which they were passed to
    the constructor.
    """

    def __init__(self, *args):
        """Remember the revision sources; at least one must be given."""
        object.__init__(self)
        assert len(args) != 0
        self._revision_sources = args

    def revision_parents(self, revision_id):
        """Return the answer of the first source that knows revision_id.

        If every source fails, the error of the last source propagates.
        """
        sources = self._revision_sources
        for source in sources[:-1]:
            try:
                return source.revision_parents(revision_id)
            except (errors.WeaveRevisionNotPresent, errors.NoSuchRevision):
                pass
        # Nothing is left to fall back on: let the last source's answer
        # or error through unchanged.
        return sources[-1].revision_parents(revision_id)

    def get_revision(self, revision_id):
        """Return revision_id from the first source that has it.

        If every source fails, the error of the last source propagates.
        """
        sources = self._revision_sources
        for source in sources[:-1]:
            try:
                return source.get_revision(revision_id)
            except bzrlib.errors.NoSuchRevision:
                pass
        # Nothing is left to fall back on: let the last source's answer
        # or error through unchanged.
        return sources[-1].get_revision(revision_id)

    def _ancestor_maps(self):
        """Return the ancestors mapping of every source's complete graph."""
        # we could probe incrementally until the pending
        # ghosts list stop growing, but its cheaper for now
        # to just ask for the complete graph for each repository.
        return [source.get_revision_graph_with_ghosts().get_ancestors()
                for source in self._revision_sources]

    def _require_present(self, ancestor_maps, revision_id):
        """Raise NoSuchRevision unless some map contains revision_id."""
        for ancestor_map in ancestor_maps:
            if revision_id in ancestor_map:
                return
        raise errors.NoSuchRevision(self._revision_sources[0], revision_id)

    def _find_parents(self, ancestor_maps, node_id):
        """Return the parents of node_id from the first map that has it.

        :raises NoSuchRevision: if no map contains node_id.
        """
        for ancestor_map in ancestor_maps:
            try:
                return ancestor_map[node_id]
            except KeyError:
                pass
        raise errors.NoSuchRevision(self._revision_sources[0], node_id)

    def get_revision_graph(self, revision_id):
        """Return a dictionary mapping revision ids to their parents.

        The dictionary covers revision_id and all of its ancestors that
        at least one source knows; revisions unknown to every source
        (ghosts) get no entry of their own.

        :raises NoSuchRevision: if no source knows revision_id.
        """
        ancestor_maps = self._ancestor_maps()
        self._require_present(ancestor_maps, revision_id)

        # combine the graphs
        result = {}
        pending = set([revision_id])
        while pending:
            # all the graphs should have identical parent lists
            node_id = pending.pop()
            try:
                parents = self._find_parents(ancestor_maps, node_id)
            except errors.NoSuchRevision:
                # ghost, ignore it.
                continue
            result[node_id] = parents
            for parent_node in parents:
                if parent_node not in result:
                    pending.add(parent_node)
        return result

    def get_revision_graph_with_ghosts(self, revision_ids):
        """Return a Graph of the combined ancestry of revision_ids.

        All sources are queried for their entire graphs and a combined
        graph for just revision_ids is built from them.  Revisions that
        no source knows are added to the result as ghosts.

        :raises NoSuchRevision: if no source knows one of revision_ids.
        """
        ancestor_maps = self._ancestor_maps()
        for revision_id in revision_ids:
            self._require_present(ancestor_maps, revision_id)

        # combine the graphs
        result = Graph()
        pending = set(revision_ids)
        done = set()
        while pending:
            # all the graphs should have identical parent lists
            node_id = pending.pop()
            try:
                parents = self._find_parents(ancestor_maps, node_id)
            except errors.NoSuchRevision:
                # ghost
                result.add_ghost(node_id)
                continue
            for parent_node in parents:
                # queue the parent unless it is queued or done already
                if parent_node not in pending and parent_node not in done:
                    pending.add(parent_node)
            result.add_node(node_id, parents)
            done.add(node_id)
        return result

    def lock_read(self):
        """Read-lock every source.

        If one source cannot be locked, the sources locked so far are
        unlocked again (most recent first) before the error propagates.
        """
        locked = []
        try:
            for source in self._revision_sources:
                source.lock_read()
                locked.append(source)
        except:
            # Do not leave a partial set of locks behind.
            locked.reverse()
            for source in locked:
                source.unlock()
            raise

    def unlock(self):
        """Unlock every source, in the order in which they were given."""
        for source in self._revision_sources:
            source.unlock()
401
1590.1.1 by Robert Collins
Improve common_ancestor performance.
402
974.2.7 by aaron.bentley at utoronto
Merged from bzr.24
403
def get_intervening_revisions(ancestor_id, rev_id, rev_source,
                              revision_history=None):
    """Find the longest line of descent from ancestor_id to rev_id.
    Revision history is followed where possible.

    If ancestor_id == rev_id, list will be empty.
    Otherwise, rev_id will be the last entry.  ancestor_id will never appear.
    If ancestor_id is not an ancestor, NotAncestor will be thrown

    :param ancestor_id: revision id at which the line of descent starts.
    :param rev_id: revision id at which the line of descent ends.
    :param rev_source: object handed to revision_graph; its get_revision
        method is also used to check that ancestor_id exists at all.
    :param revision_history: optional collection of revision ids; while
        walking back from rev_id, a parent found in it is preferred over
        the parent farthest from ancestor_id.
    :return: list of revision ids ordered from just after ancestor_id up
        to and including rev_id.
    """
    root, ancestors, descendants = revision_graph(rev_id, rev_source)
    if len(descendants) == 0:
        raise bzrlib.errors.NoSuchRevision(rev_source, rev_id)
    if ancestor_id not in descendants:
        # Let rev_source complain if it does not know ancestor_id at all;
        # if it does, the revision exists but is unrelated to rev_id.
        rev_source.get_revision(ancestor_id)
        raise bzrlib.errors.NotAncestor(rev_id, ancestor_id)
    root_descendants = all_descendants(descendants, ancestor_id)
    root_descendants.add(ancestor_id)
    if rev_id not in root_descendants:
        raise bzrlib.errors.NotAncestor(rev_id, ancestor_id)
    distances = node_distances(descendants, ancestors, ancestor_id,
                               root_descendants=root_descendants)

    def best_ancestor(child_id):
        """Pick the parent of child_id through which to walk back."""
        best = None
        for anc_id in ancestors[child_id]:
            try:
                distance = distances[anc_id]
            except KeyError:
                # No distance is known for this parent, so it is not a
                # candidate.
                continue
            if revision_history is not None and anc_id in revision_history:
                return anc_id
            elif best is None or distance > best[1]:
                best = (anc_id, distance)
        if best is None:
            # No parent has a known distance, so there is nothing to walk
            # back through: report it rather than fail on best[0].
            raise bzrlib.errors.NotAncestor(rev_id, ancestor_id)
        return best[0]

    current = rev_id
    path = []
    while current != ancestor_id:
        path.append(current)
        current = best_ancestor(current)
    path.reverse()
    return path