~bzr-pqm/bzr/bzr.dev

184 by mbp at sourcefrog
pychecker fixups
1
# (C) 2005 Canonical
1 by mbp at sourcefrog
import from baz patch-364
2
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
1185.16.40 by Martin Pool
todo
17
# TODO: Some kind of command-line display of revision properties: 
18
# perhaps show them in log -v and allow them as options to the commit command.
1 by mbp at sourcefrog
import from baz patch-364
19
1590.1.1 by Robert Collins
Improve common_ancestor performance.
20
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
21
import bzrlib.errors
1590.1.1 by Robert Collins
Improve common_ancestor performance.
22
import bzrlib.errors as errors
974.1.87 by Aaron Bentley
Refactored and documented graph stuff
23
from bzrlib.graph import node_distances, select_farthest, all_descendants
1185.16.39 by Martin Pool
- constraints on revprops
24
from bzrlib.osutils import contains_whitespace
1534.9.1 by Aaron Bentley
Added progress bars to merge
25
from bzrlib.progress import DummyProgress
8 by mbp at sourcefrog
store committer's timezone in revision and show
26
974.1.90 by Aaron Bentley
Switched NULL revision ID to 'null:' per robertc's suggestion
27
# Sentinel revision id.  _revision_graph() below makes it the parent of every
# revision that has no parents, and common_ancestor() treats it as "no real
# common ancestor".
NULL_REVISION="null:"
974.1.89 by Aaron Bentley
Fixed merging with multiple roots, by using null as graph root.
28
802 by Martin Pool
- Remove XMLMixin class in favour of simple pack_xml, unpack_xml functions
29
class Revision(object):
    """Single revision on a branch.

    Revisions may know their revision_hash, but only once they've been
    written out.  This is not stored because you cannot write the hash
    into the file it describes.

    After bzr 0.0.5 revisions are allowed to have multiple parents.

    parent_ids
        List of parent revision_ids

    properties
        Dictionary of revision properties.  These are attached to the
        revision as extra metadata.  The name must be a single
        word; the value can be an arbitrary string.
    """

    def __init__(self, revision_id, properties=None, **args):
        """Create a revision.

        :param revision_id: identifier stored as ``self.revision_id``.
        :param properties: optional dict of revision properties; a false
            value (None, empty dict) is replaced by a new empty dict.
        :param args: any further keyword arguments are stored verbatim as
            instance attributes (this is how parent_ids, message, etc. are
            normally supplied).
        :raises ValueError: if the properties fail _check_properties().
        """
        self.revision_id = revision_id
        self.properties = properties or {}
        self._check_properties()
        # Defaults first; the keyword arguments applied last may override
        # them (e.g. a caller-supplied parent_ids).
        self.parent_ids = []
        self.parent_sha1s = []
        self.__dict__.update(args)

    def __repr__(self):
        return "<Revision id %s>" % self.revision_id

    def __eq__(self, other):
        """Compare two revisions field by field.

        Anything that is not a Revision compares unequal.  The compared
        attributes must already be set on both objects, otherwise the
        attribute access raises AttributeError.
        """
        if not isinstance(other, Revision):
            return False
        return (
                self.inventory_sha1 == other.inventory_sha1
                and self.revision_id == other.revision_id
                and self.timestamp == other.timestamp
                and self.message == other.message
                and self.timezone == other.timezone
                and self.committer == other.committer
                and self.properties == other.properties
                # parent_ids are part of a revision's identity as well
                and self.parent_ids == other.parent_ids)

    def __ne__(self, other):
        return not self.__eq__(other)

    def _check_properties(self):
        """Verify that all revision properties are OK.

        :raises ValueError: if a property name is not a string or contains
            whitespace, or if a property value is not a string.
        """
        for name, value in self.properties.items():
            if not isinstance(name, basestring) or contains_whitespace(name):
                raise ValueError("invalid property name %r" % name)
            if not isinstance(value, basestring):
                # The message reads "value ... for name": value goes first.
                raise ValueError("invalid property value %r for %r" %
                                 (value, name))

    def get_history(self, repository):
        """Return the canonical line-of-history for this revision.

        The line is built by following the first parent of each revision,
        loading every parent with ``repository.get_revision``.  The result
        is ordered oldest first: it starts with None (placed before the
        revision that has no parents) and ends with this revision's id.

        If ghosts are present this may differ in result from a ghost-free
        repository.
        """
        history = []
        revision = self
        while revision is not None:
            history.append(revision.revision_id)
            if revision.parent_ids:
                revision = repository.get_revision(revision.parent_ids[0])
            else:
                # Reached the start of history: terminate it with None.
                history.append(None)
                revision = None
        history.reverse()
        return history
102
1268 by Martin Pool
- is_ancestor now works by looking at the Branch's stored ancestry
103
104
def is_ancestor(revision_id, candidate_id, branch):
    """Return true if candidate_id is an ancestor of revision_id.

    The answer is read from the ancestry that ``branch.repository`` reports
    for revision_id (``get_ancestry``): candidate_id is an ancestor exactly
    when it appears in that ancestry.
    """
    ancestry = branch.repository.get_ancestry(revision_id)
    return candidate_id in ancestry
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
114
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
115
116
def iter_ancestors(revision_id, revision_source, only_present=False):
    """Iterate over the ancestry of revision_id, one generation at a time.

    Yields ``(ancestor_id, distance)`` pairs, where distance is the number
    of parent links followed from revision_id (revision_id itself is
    yielded first with distance 0).  A revision reachable along several
    paths is yielded once per path.

    :param revision_source: object providing ``get_revision(revision_id)``.
    :param only_present: if true, only yield revisions that
        revision_source could actually load; otherwise ids are yielded
        before the load is attempted, so missing revisions appear too.
    :raises NoSuchRevision: if revision_id itself cannot be loaded.
        Missing ancestors are skipped silently.
    """
    generation = (revision_id,)
    distance = 0
    while len(generation) > 0:
        next_generation = []
        for ancestor in generation:
            if not only_present:
                yield ancestor, distance
            try:
                revision = revision_source.get_revision(ancestor)
            except bzrlib.errors.NoSuchRevision as e:
                # A missing starting revision is an error; a missing
                # ancestor just ends that line of the walk.
                if e.revision == revision_id:
                    raise
                else:
                    continue
            if only_present:
                yield ancestor, distance
            next_generation.extend(revision.parent_ids)
        generation = next_generation
        distance += 1
136
137
138
def find_present_ancestors(revision_id, revision_source):
    """Return the ancestors of a revision present in a branch.

    It's possible that a branch won't have the complete ancestry of
    one of its revisions.

    :return: dict mapping each ancestor id that revision_source could load
        to an ``(order, distance)`` tuple: ``order`` is the position at
        which iter_ancestors() first produced the id and ``distance`` the
        distance reported with it.  Later repeats of an id are ignored.
    """
    found_ancestors = {}
    anc_iter = enumerate(iter_ancestors(revision_id, revision_source,
                         only_present=True))
    for anc_order, (anc_id, anc_distance) in anc_iter:
        # setdefault keeps the first (order, distance) seen for each id
        found_ancestors.setdefault(anc_id, (anc_order, anc_distance))
    return found_ancestors
152
    
1153 by Martin Pool
- clean up some code in revision.py
153
154
def __get_closest(intersection):
    """Return the third field of every entry sharing the smallest first field.

    ``intersection`` is a list of indexable entries; it is sorted in place
    as a side effect.  An empty list yields an empty result.
    """
    intersection.sort()
    if not intersection:
        return []
    smallest = intersection[0][0]
    return [entry[2] for entry in intersection if entry[0] == smallest]
161
974.1.35 by aaron.bentley at utoronto
Added revision-based common-ancestor checking
162
974.1.60 by aaron.bentley at utoronto
Initial import of common-ancestor detection
163
def revision_graph(revision, revision_source):
    """Produce a graph of the ancestry of the specified revision.

    revision_source is read-locked while the graph is built and unlocked
    again afterwards, whether or not building the graph succeeds.

    :return: root, ancestors map, descendants map
    """
    revision_source.lock_read()
    try:
        graph_parts = _revision_graph(revision, revision_source)
    finally:
        revision_source.unlock()
    return graph_parts
173
1590.1.1 by Robert Collins
Improve common_ancestor performance.
174
1587.1.4 by Robert Collins
Quick, urgent fix for common_ancestor performance.
175
def _revision_graph(revision, revision_source):
    """Build the ancestry graph for revision_graph(); see that function.

    The graph comes from ``revision_source.get_revision_graph(revision)``
    and is modified in place: every node without parents is re-parented
    onto NULL_REVISION, and NULL_REVISION is added as a parentless node.

    :return: (root, ancestors, descendants) where ``root`` is the first
        node of a topological sort of the graph, ``ancestors`` maps each
        node to the set of its parents and ``descendants`` maps each node
        to a dict whose keys are its children.
    """
    from bzrlib.tsort import topo_sort
    graph = revision_source.get_revision_graph(revision)

    # Hang every parentless revision off NULL_REVISION, then add
    # NULL_REVISION itself as a node with no parents.
    parentless = [node for node, parents in graph.items()
                  if len(parents) == 0]
    for node in parentless:
        graph[node] = [NULL_REVISION]
    graph[NULL_REVISION] = []

    # pick a root. If there are multiple roots
    # this could pick a random one.
    root = topo_sort(graph.items())[0]

    # Build the set-based parent map and the child map that are returned.
    descendants = dict((node, {}) for node in graph.keys())
    ancestors = {}
    for node, parents in graph.items():
        ancestors[node] = set(parents)
        for parent in parents:
            descendants[parent][node] = 1

    assert root not in descendants[root]
    assert root not in ancestors[root]
    return root, ancestors, descendants
206
1092.3.4 by Robert Collins
update symlink branch to integration
207
974.1.60 by aaron.bentley at utoronto
Initial import of common-ancestor detection
208
def combined_graph(revision_a, revision_b, revision_source):
    """Produce a combined ancestry graph.

    The graphs of revision_a and revision_b are built separately with
    revision_graph() and the second is merged into the first.

    :return: graph root, ancestors map, descendants map, set of common
        nodes (the nodes that appear in both revisions' graphs)
    :raises NoCommonRoot: if the two graphs have different roots.
    """
    root, ancestors, descendants = revision_graph(
        revision_a, revision_source)
    root_b, ancestors_b, descendants_b = revision_graph(
        revision_b, revision_source)
    if root != root_b:
        raise bzrlib.errors.NoCommonRoot(revision_a, revision_b)

    common = set()
    for node, parents_b in ancestors_b.items():
        if node in ancestors:
            common.add(node)
        ancestors.setdefault(node, set()).update(parents_b)
    for node, children_b in descendants_b.items():
        descendants.setdefault(node, {}).update(children_b)
    return root, ancestors, descendants, common
229
1092.3.4 by Robert Collins
update symlink branch to integration
230
1534.9.1 by Aaron Bentley
Added progress bars to merge
231
def common_ancestor(revision_a, revision_b, revision_source,
                    pb=DummyProgress()):
    """Pick a common ancestor of revision_a and revision_b.

    The combined ancestry graph of both revisions is built, the distance of
    every node from the graph root is computed with node_distances(), and
    select_farthest() chooses among the nodes common to both ancestries.

    :param revision_source: source used to build the ancestry graphs.
    :param pb: progress bar; it is updated during the three steps and
        always cleared before returning or raising.
    :return: the chosen revision id, or None if either revision is None.
    :raises NoCommonAncestor: if the revisions share no root, or the only
        candidate is None or NULL_REVISION.
    """
    if None in (revision_a, revision_b):
        return None
    try:
        try:
            pb.update('Picking ancestor', 1, 3)
            root, ancestors, descendants, common = \
                combined_graph(revision_a,
                               revision_b,
                               revision_source)
        except bzrlib.errors.NoCommonRoot:
            raise bzrlib.errors.NoCommonAncestor(revision_a, revision_b)

        pb.update('Picking ancestor', 2, 3)
        distances = node_distances(descendants, ancestors, root)
        # Final step: 3 of 3 (was mistakenly reported as 3 of 2).
        pb.update('Picking ancestor', 3, 3)
        farthest = select_farthest(distances, common)
        if farthest is None or farthest == NULL_REVISION:
            raise bzrlib.errors.NoCommonAncestor(revision_a, revision_b)
    finally:
        pb.clear()
    return farthest
974.1.60 by aaron.bentley at utoronto
Initial import of common-ancestor detection
254
255
974.1.26 by aaron.bentley at utoronto
merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472
256
class MultipleRevisionSources(object):
    """Proxy that looks in multiple branches for revisions.

    Lookups are tried against each source in the order given to the
    constructor; the first source that can answer wins.
    """

    def __init__(self, *args):
        """Wrap the given revision sources; at least one is required."""
        object.__init__(self)
        assert len(args) != 0
        self._revision_sources = args

    def revision_parents(self, revision_id):
        """Return revision_parents(revision_id) from the first source that has it.

        If every source fails with WeaveRevisionNotPresent or
        NoSuchRevision, the error from the last source is raised.
        """
        last_error = None
        for source in self._revision_sources:
            try:
                return source.revision_parents(revision_id)
            except (errors.WeaveRevisionNotPresent,
                    errors.NoSuchRevision) as e:
                # Remember the failure explicitly rather than relying on
                # the handler variable staying bound after the handler.
                last_error = e
        raise last_error

    def get_revision(self, revision_id):
        """Return get_revision(revision_id) from the first source that has it.

        If every source raises NoSuchRevision, the error from the last
        source is raised.
        """
        last_error = None
        for source in self._revision_sources:
            try:
                return source.get_revision(revision_id)
            except errors.NoSuchRevision as e:
                last_error = e
        raise last_error

    def get_revision_graph(self, revision_id):
        """Return the combined ancestry graph of revision_id.

        :return: dict mapping each reachable revision id that is present
            in some source to its parent list, taken from the first source
            that knows the revision.  Ids known to no source (ghosts) may
            appear in parent lists but get no entry of their own.
        :raises NoSuchRevision: if no source knows revision_id.
        """
        # we could probe incrementally until the pending
        # ghosts list stop growing, but its cheaper for now
        # to just ask for the complete graph for each repository.
        graphs = [source.get_revision_graph_with_ghosts()
                  for source in self._revision_sources]
        # Fetch each graph's ancestor map once instead of once per node.
        ancestor_maps = [graph.get_ancestors() for graph in graphs]

        for ancestor_map in ancestor_maps:
            if revision_id in ancestor_map:
                break
        else:
            raise errors.NoSuchRevision(self._revision_sources[0], revision_id)

        # combine the graphs
        result = {}
        pending = set([revision_id])
        while pending:
            # all the graphs should have identical parent lists
            node_id = pending.pop()
            for ancestor_map in ancestor_maps:
                if node_id in ancestor_map:
                    parents = ancestor_map[node_id]
                    break
            else:
                # ghost, ignore it.
                continue
            result[node_id] = parents
            for parent_id in parents:
                if parent_id not in result:
                    pending.add(parent_id)
        return result

    def lock_read(self):
        """Read-lock every source.

        If locking one source fails, the sources already locked by this
        call are unlocked again before the error propagates, so a failed
        call does not leave stray locks behind.
        """
        locked = []
        try:
            for source in self._revision_sources:
                source.lock_read()
                locked.append(source)
        except:
            for source in reversed(locked):
                source.unlock()
            raise

    def unlock(self):
        """Unlock every source."""
        for source in self._revision_sources:
            source.unlock()
326
1590.1.1 by Robert Collins
Improve common_ancestor performance.
327
974.2.7 by aaron.bentley at utoronto
Merged from bzr.24
328
def get_intervening_revisions(ancestor_id, rev_id, rev_source,
                              revision_history=None):
    """Find the longest line of descent from ancestor_id to rev_id.

    Revision history is followed where possible: when stepping back from a
    revision, a parent that appears in revision_history is preferred;
    otherwise the parent with the greatest distance from ancestor_id is
    taken.

    If ancestor_id == rev_id, list will be empty.
    Otherwise, rev_id will be the last entry.  ancestor_id will never appear.
    If ancestor_id is not an ancestor, NotAncestor will be thrown

    :param rev_source: source used to build the ancestry graph of rev_id.
    :param revision_history: optional collection of revision ids to prefer.
    :return: list of revision ids, ordered from just after ancestor_id up
        to rev_id.
    """
    root, ancestors, descendants = revision_graph(rev_id, rev_source)
    if len(descendants) == 0:
        # NoSuchRevision is only reachable through the bzrlib.errors module;
        # the bare name was never imported.
        raise bzrlib.errors.NoSuchRevision(rev_source, rev_id)
    if ancestor_id not in descendants:
        # Result unused; presumably called so that an ancestor_id unknown to
        # rev_source raises its own error instead -- TODO confirm.
        rev_source.get_revision(ancestor_id)
        raise bzrlib.errors.NotAncestor(rev_id, ancestor_id)
    root_descendants = all_descendants(descendants, ancestor_id)
    root_descendants.add(ancestor_id)
    if rev_id not in root_descendants:
        raise bzrlib.errors.NotAncestor(rev_id, ancestor_id)
    distances = node_distances(descendants, ancestors, ancestor_id,
                               root_descendants=root_descendants)

    # Build the membership set once rather than scanning the history for
    # every candidate parent.
    if revision_history is not None:
        preferred = set(revision_history)
    else:
        preferred = None

    def best_ancestor(rev_id):
        """Choose which parent of rev_id to step back to."""
        best = None
        for anc_id in ancestors[rev_id]:
            try:
                distance = distances[anc_id]
            except KeyError:
                # no recorded distance from ancestor_id: not a candidate
                continue
            if preferred is not None and anc_id in preferred:
                return anc_id
            elif best is None or distance > best[1]:
                best = (anc_id, distance)
        return best[0]

    current = rev_id
    path = []
    while current != ancestor_id:
        path.append(current)
        current = best_ancestor(current)
    path.reverse()
    return path