~bzr-pqm/bzr/bzr.dev

184 by mbp at sourcefrog
pychecker fixups
1
# (C) 2005 Canonical
1 by mbp at sourcefrog
import from baz patch-364
2
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
1185.16.40 by Martin Pool
todo
17
# TODO: Some kind of command-line display of revision properties: 
18
# perhaps show them in log -v and allow them as options to the commit command.
1 by mbp at sourcefrog
import from baz patch-364
19
1590.1.1 by Robert Collins
Improve common_ancestor performance.
20
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
21
import bzrlib.errors
1590.1.1 by Robert Collins
Improve common_ancestor performance.
22
import bzrlib.errors as errors
1594.2.15 by Robert Collins
Unfuck performance.
23
from bzrlib.graph import node_distances, select_farthest, all_descendants, Graph
1185.16.39 by Martin Pool
- constraints on revprops
24
from bzrlib.osutils import contains_whitespace
1534.9.1 by Aaron Bentley
Added progress bars to merge
25
from bzrlib.progress import DummyProgress
8 by mbp at sourcefrog
store committer's timezone in revision and show
26
974.1.90 by Aaron Bentley
Switched NULL revision ID to 'null:' per robertc's suggestion
27
NULL_REVISION="null:"
974.1.89 by Aaron Bentley
Fixed merging with multiple roots, by using null as graph root.
28
802 by Martin Pool
- Remove XMLMixin class in favour of simple pack_xml, unpack_xml functions
29
class Revision(object):
    """Single revision on a branch.

    Revisions may know their revision_hash, but only once they've been
    written out.  This is not stored because you cannot write the hash
    into the file it describes.

    After bzr 0.0.5 revisions are allowed to have multiple parents.

    parent_ids
        List of parent revision_ids

    properties
        Dictionary of revision properties.  These are attached to the
        revision as extra metadata.  The name must be a single
        word; the value can be an arbitrary string.
    """

    def __init__(self, revision_id, properties=None, **args):
        """Create a revision.

        :param revision_id: stored as self.revision_id.
        :param properties: optional dictionary of revision properties; it
            is validated by _check_properties.  A false value (None, {})
            is replaced by a fresh empty dictionary.
        :param args: every further keyword argument is set directly as an
            attribute of the new object (e.g. parent_ids, message).
        :raises ValueError: if a property name or value is invalid.
        """
        self.revision_id = revision_id
        self.properties = properties or {}
        self._check_properties()
        # Install the defaults first so that values passed in args
        # (applied last) are not clobbered.
        self.parent_ids = []
        self.parent_sha1s = []
        self.__dict__.update(args)

    def __repr__(self):
        return "<Revision id %s>" % self.revision_id

    def __eq__(self, other):
        """Compare two revisions field by field.

        Anything that is not a Revision compares unequal.  The attributes
        read here other than revision_id and properties are not set by
        __init__ itself; they must have been supplied by the caller.
        """
        if not isinstance(other, Revision):
            return False
        # FIXME: rbc 20050930 parent_ids are not being compared
        return (
                self.inventory_sha1 == other.inventory_sha1
                and self.revision_id == other.revision_id
                and self.timestamp == other.timestamp
                and self.message == other.message
                and self.timezone == other.timezone
                and self.committer == other.committer
                and self.properties == other.properties)

    def __ne__(self, other):
        return not self.__eq__(other)

    def _check_properties(self):
        """Verify that all revision properties are OK.

        :raises ValueError: if a name is not a string or contains
            whitespace, or if a value is not a string.
        """
        for name in self.properties:
            value = self.properties[name]
            if not isinstance(name, basestring) or contains_whitespace(name):
                raise ValueError("invalid property name %r" % name)
            if not isinstance(value, basestring):
                # The message reads "value ... for name", so the value
                # has to be the first format argument.
                raise ValueError("invalid property value %r for %r" %
                                 (value, name))

    def get_history(self, repository):
        """Return the canonical line-of-history for this revision.

        The history is built by repeatedly following the first parent,
        fetching each parent with repository.get_revision, until a
        revision without parents is reached.

        If ghosts are present this may differ in result from a ghost-free
        repository.

        :return: a list of revision ids, oldest first, ending with this
            revision's id.  The first element is always None.
        """
        current_revision = self
        reversed_result = []
        while current_revision is not None:
            reversed_result.append(current_revision.revision_id)
            if not current_revision.parent_ids:
                # Reached the start of history: terminate with None.
                reversed_result.append(None)
                current_revision = None
            else:
                next_revision_id = current_revision.parent_ids[0]
                current_revision = repository.get_revision(next_revision_id)
        reversed_result.reverse()
        return reversed_result
102
1268 by Martin Pool
- is_ancestor now works by looking at the Branch's stored ancestry
103
104
def is_ancestor(revision_id, candidate_id, branch):
    """Return true if candidate_id is an ancestor of revision_id.

    The answer is taken from the ancestry that
    branch.repository.get_ancestry(revision_id) reports: the result is
    true exactly when candidate_id is contained in it.

    :param revision_id: the revision whose ancestry is examined.
    :param candidate_id: the revision id looked for in that ancestry.
    :param branch: object whose .repository supports get_ancestry.
    """
    ancestry = branch.repository.get_ancestry(revision_id)
    return candidate_id in ancestry
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
114
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
115
116
def iter_ancestors(revision_id, revision_source, only_present=False):
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
117
    ancestors = (revision_id,)
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
118
    distance = 0
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
119
    while len(ancestors) > 0:
120
        new_ancestors = []
121
        for ancestor in ancestors:
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
122
            if not only_present:
123
                yield ancestor, distance
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
124
            try:
125
                revision = revision_source.get_revision(ancestor)
126
            except bzrlib.errors.NoSuchRevision, e:
127
                if e.revision == revision_id:
128
                    raise 
129
                else:
130
                    continue
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
131
            if only_present:
132
                yield ancestor, distance
1313 by Martin Pool
- rename to Revision.parent_ids to avoid confusion with old usage
133
            new_ancestors.extend(revision.parent_ids)
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
134
        ancestors = new_ancestors
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
135
        distance += 1
136
137
138
def find_present_ancestors(revision_id, revision_source):
    """Return the ancestors of a revision present in a branch.

    It's possible that a branch won't have the complete ancestry of
    one of its revisions.

    :param revision_id: the revision whose ancestry is collected.
    :param revision_source: passed through to iter_ancestors, which is
        called with only_present=True.
    :return: a dictionary mapping each ancestor id to a tuple
        (order, distance) where order is the position at which
        iter_ancestors first produced the id and distance is the
        distance reported with it.
    """
    found_ancestors = {}
    anc_iter = enumerate(iter_ancestors(revision_id, revision_source,
                         only_present=True))
    for anc_order, (anc_id, anc_distance) in anc_iter:
        # Only the first sighting of an id is recorded.
        if anc_id not in found_ancestors:
            found_ancestors[anc_id] = (anc_order, anc_distance)
    return found_ancestors
152
    
1153 by Martin Pool
- clean up some code in revision.py
153
154
def __get_closest(intersection):
    """Return the third field of every entry sharing the smallest first field.

    intersection is a list of indexable entries; it is sorted in place
    as a side effect.  An empty list gives an empty result.
    """
    intersection.sort()
    if not intersection:
        return []
    smallest = intersection[0][0]
    return [entry[2] for entry in intersection if entry[0] == smallest]
161
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
162
974.1.60 by aaron.bentley at utoronto
Initial import of common-ancestor detection
163
def revision_graph(revision, revision_source):
    """Produce a graph of the ancestry of the specified revision.

    revision_source is read-locked while the graph is built and is
    unlocked again afterwards, whether or not building succeeded.

    :return: root, ancestors map, descendants map
    """
    revision_source.lock_read()
    try:
        graph_parts = _revision_graph(revision, revision_source)
    finally:
        revision_source.unlock()
    return graph_parts
173
1590.1.1 by Robert Collins
Improve common_ancestor performance.
174
1587.1.4 by Robert Collins
Quick, urgent fix for common_ancestor performance.
175
def _revision_graph(revision, revision_source):
    """See revision_graph.

    The mapping returned by revision_source.get_revision_graph is
    modified in place: nodes without parents are given NULL_REVISION as
    their only parent and NULL_REVISION itself is added as a node.
    """
    from bzrlib.tsort import topo_sort
    parent_map = revision_source.get_revision_graph(revision)
    # Hang every parentless revision off NULL_REVISION ...
    for node, parents in parent_map.items():
        if len(parents) == 0:
            parent_map[node] = [NULL_REVISION]
    # ... and make NULL_REVISION a node of the graph as well.
    parent_map[NULL_REVISION] = []

    # pick a root. If there are multiple roots
    # this could pick a random one.
    root = topo_sort(parent_map.items())[0]

    # Build the set based ancestors map and the descendants map
    # (node -> {child: 1}) that are handed back to the caller.
    descendants = dict((node, {}) for node in parent_map.keys())
    ancestors = {}
    for node, parents in parent_map.items():
        ancestors[node] = set(parents)
        for parent in parents:
            descendants[parent][node] = 1

    assert root not in descendants[root]
    assert root not in ancestors[root]
    return root, ancestors, descendants
206
1092.3.4 by Robert Collins
update symlink branch to integration
207
974.1.60 by aaron.bentley at utoronto
Initial import of common-ancestor detection
208
def combined_graph(revision_a, revision_b, revision_source):
    """Produce a combined ancestry graph.

    The graphs of revision_a and revision_b are built with
    revision_graph and the second is merged into the first.

    :return: graph root, ancestors map, descendants map, and the set of
        nodes that occur in both ancestors maps.
    :raises NoCommonRoot: if the two graphs have different roots.
    """
    root, ancestors, descendants = revision_graph(
        revision_a, revision_source)
    root_b, ancestors_b, descendants_b = revision_graph(
        revision_b, revision_source)
    if root != root_b:
        raise bzrlib.errors.NoCommonRoot(revision_a, revision_b)
    common = set()
    for node in ancestors_b:
        # Membership must be checked before the node is merged in.
        if node in ancestors:
            common.add(node)
        ancestors.setdefault(node, set()).update(ancestors_b[node])
    for node in descendants_b:
        descendants.setdefault(node, {}).update(descendants_b[node])
    return root, ancestors, descendants, common
229
1092.3.4 by Robert Collins
update symlink branch to integration
230
1534.9.1 by Aaron Bentley
Added progress bars to merge
231
def common_ancestor(revision_a, revision_b, revision_source,
                    pb=DummyProgress()):
    """Pick a common ancestor of two revisions.

    The candidates are the revisions found in the ancestry of both
    revision_a and revision_b.  Distances are computed with
    node_distances from a NULL_REVISION root placed beneath all graph
    roots, and select_farthest chooses the result among the candidates.

    :param revision_a: a revision id, or None.
    :param revision_b: a revision id, or None.
    :param revision_source: object supporting
        get_revision_graph_with_ghosts([revision_ids]).
    :param pb: progress bar; it is updated while working and cleared
        before returning, except on the two early returns below.
    :return: None if either revision is None; the revision itself if
        both are equal; otherwise the selected common ancestor.
    :raises NoCommonAncestor: if the graph has no roots or no ancestor
        other than NULL_REVISION is selected.
    """
    if None in (revision_a, revision_b):
        return None
    # trivial optimisation
    if revision_a == revision_b:
        return revision_a
    try:
        try:
            pb.update('Picking ancestor', 1, 3)
            graph = revision_source.get_revision_graph_with_ghosts(
                [revision_a, revision_b])
            # convert to a NULL_REVISION based graph.
            ancestors = graph.get_ancestors()
            descendants = graph.get_descendants()
            common = set(graph.get_ancestry(revision_a)).intersection(
                     set(graph.get_ancestry(revision_b)))
            descendants[NULL_REVISION] = {}
            ancestors[NULL_REVISION] = []
            for root in graph.roots:
                descendants[NULL_REVISION][root] = 1
                ancestors[root].append(NULL_REVISION)
            if len(graph.roots) == 0:
                # no reachable roots - not handled yet.
                raise bzrlib.errors.NoCommonAncestor(revision_a, revision_b)
            root = NULL_REVISION
            common.add(NULL_REVISION)
        except bzrlib.errors.NoCommonRoot:
            raise bzrlib.errors.NoCommonAncestor(revision_a, revision_b)

        pb.update('Picking ancestor', 2, 3)
        distances = node_distances (descendants, ancestors, root)
        # Final step: 3 of 3, consistent with the two updates above.
        pb.update('Picking ancestor', 3, 3)
        farthest = select_farthest(distances, common)
        if farthest is None or farthest == NULL_REVISION:
            raise bzrlib.errors.NoCommonAncestor(revision_a, revision_b)
    finally:
        pb.clear()
    return farthest
974.1.60 by aaron.bentley at utoronto
Initial import of common-ancestor detection
270
271
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
272
class MultipleRevisionSources(object):
1153 by Martin Pool
- clean up some code in revision.py
273
    """Proxy that looks in multiple branches for revisions."""
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
274
    def __init__(self, *args):
275
        object.__init__(self)
276
        assert len(args) != 0
277
        self._revision_sources = args
278
1590.1.1 by Robert Collins
Improve common_ancestor performance.
279
    def revision_parents(self, revision_id):
280
        for source in self._revision_sources:
281
            try:
282
                return source.revision_parents(revision_id)
283
            except (errors.WeaveRevisionNotPresent, errors.NoSuchRevision), e:
284
                pass
285
        raise e
286
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
287
    def get_revision(self, revision_id):
288
        for source in self._revision_sources:
289
            try:
290
                return source.get_revision(revision_id)
291
            except bzrlib.errors.NoSuchRevision, e:
292
                pass
293
        raise e
974.2.7 by aaron.bentley at utoronto
Merged from bzr.24
294
1590.1.1 by Robert Collins
Improve common_ancestor performance.
295
    def get_revision_graph(self, revision_id):
1594.2.3 by Robert Collins
bugfix revision.MultipleRevisionSources.get_revision_graph to integrate ghosts between sources. [slow on weaves, fast on knits.
296
        # we could probe incrementally until the pending
297
        # ghosts list stop growing, but its cheaper for now
298
        # to just ask for the complete graph for each repository.
299
        graphs = []
300
        for source in self._revision_sources:
301
            ghost_graph = source.get_revision_graph_with_ghosts()
302
            graphs.append(ghost_graph)
303
        absent = 0
304
        for graph in graphs:
305
            if not revision_id in graph.get_ancestors():
306
                absent += 1
307
        if absent == len(graphs):
308
            raise errors.NoSuchRevision(self._revision_sources[0], revision_id)
309
310
        # combine the graphs
1590.1.1 by Robert Collins
Improve common_ancestor performance.
311
        result = {}
1594.2.3 by Robert Collins
bugfix revision.MultipleRevisionSources.get_revision_graph to integrate ghosts between sources. [slow on weaves, fast on knits.
312
        pending = set([revision_id])
313
        def find_parents(node_id):
314
            """find the parents for node_id."""
315
            for graph in graphs:
316
                ancestors = graph.get_ancestors()
317
                try:
318
                    return ancestors[node_id]
319
                except KeyError:
320
                    pass
321
            raise errors.NoSuchRevision(self._revision_sources[0], node_id)
322
        while len(pending):
323
            # all the graphs should have identical parent lists
324
            node_id = pending.pop()
1590.1.1 by Robert Collins
Improve common_ancestor performance.
325
            try:
1594.2.3 by Robert Collins
bugfix revision.MultipleRevisionSources.get_revision_graph to integrate ghosts between sources. [slow on weaves, fast on knits.
326
                result[node_id] = find_parents(node_id)
327
                for parent_node in result[node_id]:
328
                    if not parent_node in result:
329
                        pending.add(parent_node)
330
            except errors.NoSuchRevision:
331
                # ghost, ignore it.
1590.1.1 by Robert Collins
Improve common_ancestor performance.
332
                pass
1594.2.3 by Robert Collins
bugfix revision.MultipleRevisionSources.get_revision_graph to integrate ghosts between sources. [slow on weaves, fast on knits.
333
        return result
1590.1.1 by Robert Collins
Improve common_ancestor performance.
334
1594.2.15 by Robert Collins
Unfuck performance.
335
    def get_revision_graph_with_ghosts(self, revision_ids):
336
        # query all the sources for their entire graphs 
337
        # and then build a combined graph for just
338
        # revision_ids.
339
        graphs = []
340
        for source in self._revision_sources:
341
            ghost_graph = source.get_revision_graph_with_ghosts()
342
            graphs.append(ghost_graph.get_ancestors())
343
        for revision_id in revision_ids:
344
            absent = 0
345
            for graph in graphs:
346
                    if not revision_id in graph:
347
                        absent += 1
348
            if absent == len(graphs):
349
                raise errors.NoSuchRevision(self._revision_sources[0],
350
                                            revision_id)
351
352
        # combine the graphs
353
        result = Graph()
354
        pending = set(revision_ids)
355
        done = set()
356
        def find_parents(node_id):
357
            """find the parents for node_id."""
358
            for graph in graphs:
359
                try:
360
                    return graph[node_id]
361
                except KeyError:
362
                    pass
363
            raise errors.NoSuchRevision(self._revision_sources[0], node_id)
364
        while len(pending):
365
            # all the graphs should have identical parent lists
366
            node_id = pending.pop()
367
            try:
368
                parents = find_parents(node_id)
369
                for parent_node in parents:
370
                    # queued or done? 
371
                    if (parent_node not in pending and
372
                        parent_node not in done):
373
                        # no, queue
374
                        pending.add(parent_node)
375
                result.add_node(node_id, parents)
376
                done.add(node_id)
377
            except errors.NoSuchRevision:
378
                # ghost
379
                result.add_ghost(node_id)
380
                continue
381
        return result
382
1587.1.4 by Robert Collins
Quick, urgent fix for common_ancestor performance.
383
    def lock_read(self):
384
        for source in self._revision_sources:
385
            source.lock_read()
386
387
    def unlock(self):
388
        for source in self._revision_sources:
389
            source.unlock()
390
1590.1.1 by Robert Collins
Improve common_ancestor performance.
391
974.2.7 by aaron.bentley at utoronto
Merged from bzr.24
392
def get_intervening_revisions(ancestor_id, rev_id, rev_source,
                              revision_history=None):
    """Find the longest line of descent from ancestor_id to rev_id.

    Revision history is followed where possible: when choosing which
    parent to step to, a parent contained in revision_history is taken
    in preference to the most distant one.

    If ancestor_id == rev_id, list will be empty.
    Otherwise, rev_id will be the last entry.  ancestor_id will never appear.
    If ancestor_id is not an ancestor, NotAncestor will be thrown

    :param ancestor_id: revision id the path starts after.
    :param rev_id: revision id the path ends with.
    :param rev_source: revision source handed to revision_graph.
    :param revision_history: optional collection of revision ids.
    :raises NoSuchRevision: if the graph of rev_id is empty.
    :raises NotAncestor: if ancestor_id is not an ancestor of rev_id.
    """
    root, ancestors, descendants = revision_graph(rev_id, rev_source)
    if len(descendants) == 0:
        # Only the bzrlib.errors module is imported by this file, so
        # the exception must be referenced through it.
        raise bzrlib.errors.NoSuchRevision(rev_source, rev_id)
    if ancestor_id not in descendants:
        # Looked up only for its side effect; presumably this raises
        # if ancestor_id does not exist at all -- otherwise it exists
        # but is unrelated to rev_id.
        rev_source.get_revision(ancestor_id)
        raise bzrlib.errors.NotAncestor(rev_id, ancestor_id)
    root_descendants = all_descendants(descendants, ancestor_id)
    root_descendants.add(ancestor_id)
    if rev_id not in root_descendants:
        raise bzrlib.errors.NotAncestor(rev_id, ancestor_id)
    distances = node_distances(descendants, ancestors, ancestor_id,
                               root_descendants=root_descendants)

    def best_ancestor(rev_id):
        """Choose the parent of rev_id to step to next."""
        best = None
        for anc_id in ancestors[rev_id]:
            try:
                distance = distances[anc_id]
            except KeyError:
                # This parent has no recorded distance; skip it.
                continue
            if revision_history is not None and anc_id in revision_history:
                return anc_id
            elif best is None or distance > best[1]:
                best = (anc_id, distance)
        return best[0]

    next = rev_id
    path = []
    while next != ancestor_id:
        path.append(next)
        next = best_ancestor(next)
    path.reverse()
    return path