~bzr-pqm/bzr/bzr.dev

3350.6.10 by Martin Pool
VersionedFiles review cleanups
1
# Copyright (C) 2005, 2006, 2008 Canonical Ltd
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
2
#
1110 by Martin Pool
- merge aaron's merge improvements:
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
7
#
1110 by Martin Pool
- merge aaron's merge improvements:
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
12
#
1110 by Martin Pool
- merge aaron's merge improvements:
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
1545.2.3 by Aaron Bentley
Updated following j-a-meinel's comments
17
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
18
import errno
19
from itertools import chain
1185.1.2 by Martin Pool
- merge various windows and other fixes from Ollie Rutherfurd
20
import os
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
21
import warnings
1113 by Martin Pool
- fix is_ancestor import problem in merge
22
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
23
from bzrlib import (
1551.19.17 by Aaron Bentley
Add debugging flag for merges
24
    debug,
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
25
    errors,
3514.2.14 by John Arbash Meinel
Bring in the code to collapse linear portions of the graph.
26
    graph as _mod_graph,
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
27
    osutils,
1551.15.46 by Aaron Bentley
Move plan merge to tree
28
    patiencediff,
2221.4.15 by Aaron Bentley
Use RegistryOption for merge type
29
    registry,
2598.5.1 by Aaron Bentley
Start eliminating the use of None to indicate null revision
30
    revision as _mod_revision,
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
31
    tsort,
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
32
    )
1185.11.5 by John Arbash Meinel
Merged up-to-date against mainline, still broken.
33
from bzrlib.branch import Branch
1666.1.4 by Robert Collins
* 'Metadir' is now the default disk format. This improves behaviour in
34
from bzrlib.conflicts import ConflictList, Conflict
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
35
from bzrlib.errors import (BzrCommandError,
1534.4.28 by Robert Collins
first cut at merge from integration.
36
                           BzrError,
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
37
                           NoCommonAncestor,
38
                           NoCommits,
1534.4.28 by Robert Collins
first cut at merge from integration.
39
                           NoSuchRevision,
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
40
                           NoSuchFile,
1545.2.6 by Aaron Bentley
Removed _merge, renamed MergeConflictHandler to _MergeConflictHandler
41
                           NotBranchError,
1185.33.27 by Martin Pool
[merge] much integrated work from robert and john
42
                           NotVersionedError,
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
43
                           UnrelatedBranches,
1534.10.12 by Aaron Bentley
Merge produces new conflicts
44
                           UnsupportedOperation,
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
45
                           WorkingTreeNotRevision,
1558.15.3 by Aaron Bentley
Handle binary files for diff3 merges
46
                           BinaryFile,
1534.4.28 by Robert Collins
first cut at merge from integration.
47
                           )
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
48
from bzrlib.graph import Graph
1534.7.167 by Aaron Bentley
PEP8 and comment cleanups
49
from bzrlib.merge3 import Merge3
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
50
from bzrlib.osutils import rename, pathjoin
1551.2.32 by Aaron Bentley
Handle progress phases more nicely in merge
51
from progress import DummyProgress, ProgressPhase
3052.1.3 by John Arbash Meinel
deprecate revision.is_ancestor, update the callers and the tests.
52
from bzrlib.revision import (NULL_REVISION, ensure_null)
1558.15.5 by Aaron Bentley
Fixed binary handling in weave merge
53
from bzrlib.textfile import check_text_lines
3200.1.1 by James Westby
Make pull --quiet more quiet. Fixes #185907.
54
from bzrlib.trace import mutter, warning, note, is_quiet
3008.1.9 by Michael Hudson
wanton hacking that lets me write an efficient version of get_diff_as_merged
55
from bzrlib.transform import (TransformPreview, TreeTransform,
56
                              resolve_conflicts, cook_conflicts,
2590.2.8 by Aaron Bentley
Restore conflict handling changes
57
                              conflict_pass, FinalPaths, create_by_entry,
58
                              unique_add, ROOT_PARENT)
1551.15.46 by Aaron Bentley
Move plan merge to tree
59
from bzrlib.versionedfile import PlanWeaveMerge
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
60
from bzrlib import ui
1545.2.6 by Aaron Bentley
Removed _merge, renamed MergeConflictHandler to _MergeConflictHandler
61
62
# TODO: Report back as changes are merged in
63
2325.3.1 by John Arbash Meinel
New helper function for merge, which allows us to re-use the existing workingtree, rather than opening it again.
64
1185.35.4 by Aaron Bentley
Implemented remerge
65
def transform_tree(from_tree, to_tree, interesting_ids=None):
66
    merge_inner(from_tree.branch, to_tree, from_tree, ignore_zero=True,
1558.1.3 by Aaron Bentley
Fixed deprecated op use in test suite
67
                interesting_ids=interesting_ids, this_tree=from_tree)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
68
1457.1.12 by Robert Collins
Update comment to reflect author.
69
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
70
class Merger(object):
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
71
    def __init__(self, this_branch, other_tree=None, base_tree=None,
2100.3.31 by Aaron Bentley
Merged bzr.dev (17 tests failing)
72
                 this_tree=None, pb=DummyProgress(), change_reporter=None,
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
73
                 recurse='down', revision_graph=None):
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
74
        object.__init__(self)
75
        self.this_branch = this_branch
2598.5.4 by Aaron Bentley
Restore original Branch.last_revision behavior, fix bits that care
76
        self.this_basis = _mod_revision.ensure_null(
77
            this_branch.last_revision())
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
78
        self.this_rev_id = None
1534.4.26 by Robert Collins
Move working tree initialisation out from Branch.initialize, deprecated Branch.initialize to Branch.create.
79
        self.this_tree = this_tree
1185.12.83 by Aaron Bentley
Preliminary weave merge support
80
        self.this_revision_tree = None
1185.35.5 by Aaron Bentley
Made weave merge succeed if interesting files match history
81
        self.this_basis_tree = None
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
82
        self.other_tree = other_tree
2100.3.29 by Aaron Bentley
Get merge working initially
83
        self.other_branch = None
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
84
        self.base_tree = base_tree
85
        self.ignore_zero = False
86
        self.backup_files = False
87
        self.interesting_ids = None
2590.2.5 by Aaron Bentley
Allow selected files to be specified instead of selected ids
88
        self.interesting_files = None
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
89
        self.show_base = False
1185.24.3 by Aaron Bentley
Integrated reprocessing into the rest of the merge stuff
90
        self.reprocess = False
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
91
        self._pb = pb
1551.2.32 by Aaron Bentley
Handle progress phases more nicely in merge
92
        self.pp = None
2100.3.29 by Aaron Bentley
Get merge working initially
93
        self.recurse = recurse
1551.11.9 by Aaron Bentley
Apply change reporting to merge
94
        self.change_reporter = change_reporter
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
95
        self._cached_trees = {}
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
96
        self._revision_graph = revision_graph
3146.5.1 by Aaron Bentley
Make merge --uncommitted work with merge-type weave
97
        self._base_is_ancestor = None
98
        self._base_is_other_ancestor = None
99
100
    @property
101
    def revision_graph(self):
102
        if self._revision_graph is None:
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
103
            self._revision_graph = self.this_branch.repository.get_graph()
3146.5.1 by Aaron Bentley
Make merge --uncommitted work with merge-type weave
104
        return self._revision_graph
105
106
    def _set_base_is_ancestor(self, value):
107
        self._base_is_ancestor = value
108
109
    def _get_base_is_ancestor(self):
110
        if self._base_is_ancestor is None:
111
            self._base_is_ancestor = self.revision_graph.is_ancestor(
112
                self.base_rev_id, self.this_basis)
113
        return self._base_is_ancestor
114
115
    base_is_ancestor = property(_get_base_is_ancestor, _set_base_is_ancestor)
116
117
    def _set_base_is_other_ancestor(self, value):
118
        self._base_is_other_ancestor = value
119
120
    def _get_base_is_other_ancestor(self):
121
        if self._base_is_other_ancestor is None:
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
122
            if self.other_basis is None:
123
                return True
124
            self._base_is_other_ancestor = self.revision_graph.is_ancestor(
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
125
                self.base_rev_id, self.other_basis)
3146.5.1 by Aaron Bentley
Make merge --uncommitted work with merge-type weave
126
        return self._base_is_other_ancestor
127
128
    base_is_other_ancestor = property(_get_base_is_other_ancestor,
129
                                      _set_base_is_other_ancestor)
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
130
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
131
    @staticmethod
132
    def from_uncommitted(tree, other_tree, pb):
1551.15.74 by Aaron Bentley
Textual updates from review
133
        """Return a Merger for uncommitted changes in other_tree.
134
135
        :param tree: The tree to merge into
136
        :param other_tree: The tree to get uncommitted changes from
137
        :param pb: A progress indicator
138
        """
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
139
        merger = Merger(tree.branch, other_tree, other_tree.basis_tree(), tree,
140
                        pb)
141
        merger.base_rev_id = merger.base_tree.get_revision_id()
142
        merger.other_rev_id = None
3146.5.1 by Aaron Bentley
Make merge --uncommitted work with merge-type weave
143
        merger.other_basis = merger.base_rev_id
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
144
        return merger
145
146
    @classmethod
147
    def from_mergeable(klass, tree, mergeable, pb):
1551.15.74 by Aaron Bentley
Textual updates from review
148
        """Return a Merger for a bundle or merge directive.
149
150
        :param tree: The tree to merge changes into
151
        :param mergeable: A merge directive or bundle
152
        :param pb: A progress indicator
153
        """
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
154
        mergeable.install_revisions(tree.branch.repository)
155
        base_revision_id, other_revision_id, verified =\
156
            mergeable.get_merge_request(tree.branch.repository)
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
157
        revision_graph = tree.branch.repository.get_graph()
1551.19.44 by Aaron Bentley
Fix handling of old merge directives with stricter get_parent_map
158
        if base_revision_id is not None:
159
            if (base_revision_id != _mod_revision.NULL_REVISION and
160
                revision_graph.is_ancestor(
161
                base_revision_id, tree.branch.last_revision())):
162
                base_revision_id = None
163
            else:
164
                warning('Performing cherrypick')
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
165
        merger = klass.from_revision_ids(pb, tree, other_revision_id,
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
166
                                         base_revision_id, revision_graph=
167
                                         revision_graph)
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
168
        return merger, verified
169
170
    @staticmethod
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
171
    def from_revision_ids(pb, tree, other, base=None, other_branch=None,
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
172
                          base_branch=None, revision_graph=None):
1551.15.74 by Aaron Bentley
Textual updates from review
173
        """Return a Merger for revision-ids.
174
175
        :param tree: The tree to merge changes into
176
        :param other: The revision-id to use as OTHER
177
        :param base: The revision-id to use as BASE.  If not specified, will
178
            be auto-selected.
179
        :param other_branch: A branch containing the other revision-id.  If
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
180
            not supplied, tree.branch is used.
1551.15.74 by Aaron Bentley
Textual updates from review
181
        :param base_branch: A branch containing the base revision-id.  If
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
182
            not supplied, other_branch or tree.branch will be used.
183
        :param revision_graph: If you have a revision_graph precomputed, pass
184
            it in, otherwise it will be created for you.
1551.15.74 by Aaron Bentley
Textual updates from review
185
        :param pb: A progress indicator
186
        """
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
187
        merger = Merger(tree.branch, this_tree=tree, pb=pb,
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
188
                        revision_graph=revision_graph)
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
189
        if other_branch is None:
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
190
            other_branch = tree.branch
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
191
        merger.set_other_revision(other, other_branch)
192
        if base is None:
193
            merger.find_base()
194
        else:
195
            if base_branch is None:
196
                base_branch = other_branch
197
            merger.set_base_revision(base, base_branch)
198
        return merger
199
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
200
    def revision_tree(self, revision_id, branch=None):
201
        if revision_id not in self._cached_trees:
202
            if branch is None:
203
                branch = self.this_branch
204
            try:
205
                tree = self.this_tree.revision_tree(revision_id)
206
            except errors.NoSuchRevisionInTree:
207
                tree = branch.repository.revision_tree(revision_id)
208
            self._cached_trees[revision_id] = tree
209
        return self._cached_trees[revision_id]
210
2485.8.58 by Vincent Ladeuil
merge bzr.dev@1617
211
    def _get_tree(self, treespec, possible_transports=None):
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
212
        from bzrlib import workingtree
213
        location, revno = treespec
214
        if revno is None:
215
            tree = workingtree.WorkingTree.open_containing(location)[0]
216
            return tree.branch, tree
2485.8.58 by Vincent Ladeuil
merge bzr.dev@1617
217
        branch = Branch.open_containing(location, possible_transports)[0]
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
218
        if revno == -1:
219
            revision_id = branch.last_revision()
220
        else:
221
            revision_id = branch.get_rev_id(revno)
222
        revision_id = ensure_null(revision_id)
223
        return branch, self.revision_tree(revision_id, branch)
1185.12.83 by Aaron Bentley
Preliminary weave merge support
224
225
    def ensure_revision_trees(self):
226
        if self.this_revision_tree is None:
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
227
            self.this_basis_tree = self.revision_tree(self.this_basis)
1185.35.5 by Aaron Bentley
Made weave merge succeed if interesting files match history
228
            if self.this_basis == self.this_rev_id:
229
                self.this_revision_tree = self.this_basis_tree
230
1185.12.83 by Aaron Bentley
Preliminary weave merge support
231
        if self.other_rev_id is None:
232
            other_basis_tree = self.revision_tree(self.other_basis)
1852.10.3 by Robert Collins
Remove all uses of compare_trees and replace with Tree.changes_from throughout bzrlib.
233
            changes = other_basis_tree.changes_from(self.other_tree)
1185.12.83 by Aaron Bentley
Preliminary weave merge support
234
            if changes.has_changed():
235
                raise WorkingTreeNotRevision(self.this_tree)
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
236
            other_rev_id = self.other_basis
1185.12.83 by Aaron Bentley
Preliminary weave merge support
237
            self.other_tree = other_basis_tree
238
239
    def file_revisions(self, file_id):
240
        self.ensure_revision_trees()
241
        def get_id(tree, file_id):
242
            revision_id = tree.inventory[file_id].revision
243
            return revision_id
1185.35.5 by Aaron Bentley
Made weave merge succeed if interesting files match history
244
        if self.this_rev_id is None:
245
            if self.this_basis_tree.get_file_sha1(file_id) != \
246
                self.this_tree.get_file_sha1(file_id):
247
                raise WorkingTreeNotRevision(self.this_tree)
248
249
        trees = (self.this_basis_tree, self.other_tree)
1185.12.83 by Aaron Bentley
Preliminary weave merge support
250
        return [get_id(tree, file_id) for tree in trees]
251
1185.82.44 by Aaron Bentley
Switch to merge_changeset in test suite
252
    def check_basis(self, check_clean, require_commits=True):
253
        if self.this_basis is None and require_commits is True:
2249.3.1 by John Arbash Meinel
Mention using 'bzr pull' if there are no commits in current branch
254
            raise BzrCommandError("This branch has no commits."
255
                                  " (perhaps you would prefer 'bzr pull')")
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
256
        if check_clean:
257
            self.compare_basis()
258
            if self.this_basis != self.this_rev_id:
2796.2.1 by Aaron Bentley
Begin work on reconfigure command
259
                raise errors.UncommittedChanges(self.this_tree)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
260
261
    def compare_basis(self):
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
262
        try:
263
            basis_tree = self.revision_tree(self.this_tree.last_revision())
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
264
        except errors.NoSuchRevision:
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
265
            basis_tree = self.this_tree.basis_tree()
266
        changes = self.this_tree.changes_from(basis_tree)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
267
        if not changes.has_changed():
268
            self.this_rev_id = self.this_basis
269
270
    def set_interesting_files(self, file_list):
2590.2.7 by Aaron Bentley
Misc cleanup
271
        self.interesting_files = file_list
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
272
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
273
    def set_pending(self):
2644.1.1 by Wouter van Heyst
Fix bug #127115 by checking for self.other_rev_id being None in Merger.set_pending()
274
        if not self.base_is_ancestor or not self.base_is_other_ancestor or self.other_rev_id is None:
1185.12.77 by Aaron Bentley
Prevented all ancestors from being marked as pending merges
275
            return
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
276
        self._add_parent()
277
278
    def _add_parent(self):
279
        new_parents = self.this_tree.get_parent_ids() + [self.other_rev_id]
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
280
        new_parent_trees = []
281
        for revision_id in new_parents:
282
            try:
283
                tree = self.revision_tree(revision_id)
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
284
            except errors.NoSuchRevision:
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
285
                tree = None
286
            else:
287
                tree.lock_read()
288
            new_parent_trees.append((revision_id, tree))
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
289
        try:
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
290
            self.this_tree.set_parent_trees(new_parent_trees,
291
                                            allow_leftmost_as_ghost=True)
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
292
        finally:
293
            for _revision_id, tree in new_parent_trees:
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
294
                if tree is not None:
295
                    tree.unlock()
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
296
2485.8.37 by Vincent Ladeuil
Fix merge multiple connections. Test suite *not* passing (sftp
297
    def set_other(self, other_revision, possible_transports=None):
1979.2.1 by Robert Collins
(robertc) adds a convenience method "merge_from_branch" to WorkingTree.
298
        """Set the revision and tree to merge from.
299
300
        This sets the other_tree, other_rev_id, other_basis attributes.
301
302
        :param other_revision: The [path, revision] list to merge from.
303
        """
2485.8.58 by Vincent Ladeuil
merge bzr.dev@1617
304
        self.other_branch, self.other_tree = self._get_tree(other_revision,
305
                                                            possible_transports)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
306
        if other_revision[1] == -1:
2598.5.4 by Aaron Bentley
Restore original Branch.last_revision behavior, fix bits that care
307
            self.other_rev_id = _mod_revision.ensure_null(
308
                self.other_branch.last_revision())
2598.5.1 by Aaron Bentley
Start eliminating the use of None to indicate null revision
309
            if _mod_revision.is_null(self.other_rev_id):
2100.3.31 by Aaron Bentley
Merged bzr.dev (17 tests failing)
310
                raise NoCommits(self.other_branch)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
311
            self.other_basis = self.other_rev_id
312
        elif other_revision[1] is not None:
2100.3.31 by Aaron Bentley
Merged bzr.dev (17 tests failing)
313
            self.other_rev_id = self.other_branch.get_rev_id(other_revision[1])
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
314
            self.other_basis = self.other_rev_id
315
        else:
316
            self.other_rev_id = None
2100.3.31 by Aaron Bentley
Merged bzr.dev (17 tests failing)
317
            self.other_basis = self.other_branch.last_revision()
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
318
            if self.other_basis is None:
2100.3.31 by Aaron Bentley
Merged bzr.dev (17 tests failing)
319
                raise NoCommits(self.other_branch)
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
320
        if self.other_rev_id is not None:
321
            self._cached_trees[self.other_rev_id] = self.other_tree
2590.2.19 by Aaron Bentley
Avoid fetch within a repository
322
        self._maybe_fetch(self.other_branch,self.this_branch, self.other_basis)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
323
2100.3.29 by Aaron Bentley
Get merge working initially
324
    def set_other_revision(self, revision_id, other_branch):
325
        """Set 'other' based on a branch and revision id
326
327
        :param revision_id: The revision to use for a tree
328
        :param other_branch: The branch containing this tree
329
        """
330
        self.other_rev_id = revision_id
331
        self.other_branch = other_branch
2590.2.19 by Aaron Bentley
Avoid fetch within a repository
332
        self._maybe_fetch(other_branch, self.this_branch, self.other_rev_id)
2100.3.29 by Aaron Bentley
Get merge working initially
333
        self.other_tree = self.revision_tree(revision_id)
334
        self.other_basis = revision_id
335
2520.4.110 by Aaron Bentley
Implement cherrypick support for merge directives
336
    def set_base_revision(self, revision_id, branch):
337
        """Set 'base' based on a branch and revision id
338
339
        :param revision_id: The revision to use for a tree
340
        :param branch: The branch containing this tree
341
        """
342
        self.base_rev_id = revision_id
343
        self.base_branch = branch
2520.4.132 by Aaron Bentley
Merge from bzr.dev
344
        self._maybe_fetch(branch, self.this_branch, revision_id)
2520.4.110 by Aaron Bentley
Implement cherrypick support for merge directives
345
        self.base_tree = self.revision_tree(revision_id)
2520.4.132 by Aaron Bentley
Merge from bzr.dev
346
2590.2.19 by Aaron Bentley
Avoid fetch within a repository
347
    def _maybe_fetch(self, source, target, revision_id):
2665.5.2 by Aaron Bentley
Switch commit and merge to Repository.has_same_location
348
        if not source.repository.has_same_location(target.repository):
2590.2.19 by Aaron Bentley
Avoid fetch within a repository
349
            target.fetch(source, revision_id)
2520.4.110 by Aaron Bentley
Implement cherrypick support for merge directives
350
1185.82.25 by Aaron Bentley
Added changeset-merging functionality
351
    def find_base(self):
2590.2.22 by Aaron Bentley
Remove cruft
352
        revisions = [ensure_null(self.this_basis),
353
                     ensure_null(self.other_basis)]
354
        if NULL_REVISION in revisions:
355
            self.base_rev_id = NULL_REVISION
356
        else:
3146.5.1 by Aaron Bentley
Make merge --uncommitted work with merge-type weave
357
            self.base_rev_id, steps = self.revision_graph.find_unique_lca(
358
                revisions[0], revisions[1], count_steps=True)
2590.2.22 by Aaron Bentley
Remove cruft
359
            if self.base_rev_id == NULL_REVISION:
360
                raise UnrelatedBranches()
1551.19.10 by Aaron Bentley
Merge now warns when it encounters a criss-cross
361
            if steps > 1:
1551.19.11 by Aaron Bentley
Add criss-cross help topic
362
                warning('Warning: criss-cross merge encountered.  See bzr'
363
                        ' help criss-cross.')
2590.2.13 by Aaron Bentley
Make find_base implement the base_finding code
364
        self.base_tree = self.revision_tree(self.base_rev_id)
365
        self.base_is_ancestor = True
2590.2.18 by Aaron Bentley
Merge is_ancestor fix
366
        self.base_is_other_ancestor = True
1185.82.25 by Aaron Bentley
Added changeset-merging functionality
367
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
368
    def set_base(self, base_revision):
1979.2.1 by Robert Collins
(robertc) adds a convenience method "merge_from_branch" to WorkingTree.
369
        """Set the base revision to use for the merge.
370
371
        :param base_revision: A 2-list containing a path and revision number.
372
        """
1185.12.96 by Aaron Bentley
Merge from mpool
373
        mutter("doing merge() with no base_revision specified")
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
374
        if base_revision == [None, None]:
2590.2.13 by Aaron Bentley
Make find_base implement the base_finding code
375
            self.find_base()
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
376
        else:
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
377
            base_branch, self.base_tree = self._get_tree(base_revision)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
378
            if base_revision[1] == -1:
379
                self.base_rev_id = base_branch.last_revision()
380
            elif base_revision[1] is None:
2598.5.3 by Aaron Bentley
Push NULL_REVISION deeper
381
                self.base_rev_id = _mod_revision.NULL_REVISION
493 by Martin Pool
- Merge aaron's merge command
382
            else:
2598.5.3 by Aaron Bentley
Push NULL_REVISION deeper
383
                self.base_rev_id = _mod_revision.ensure_null(
384
                    base_branch.get_rev_id(base_revision[1]))
2590.2.19 by Aaron Bentley
Avoid fetch within a repository
385
            self._maybe_fetch(base_branch, self.this_branch, self.base_rev_id)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
386
3008.1.8 by Michael Hudson
extract merger creation into a method
387
    def make_merger(self):
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
388
        kwargs = {'working_tree':self.this_tree, 'this_tree': self.this_tree,
389
                  'other_tree': self.other_tree,
1551.2.32 by Aaron Bentley
Handle progress phases more nicely in merge
390
                  'interesting_ids': self.interesting_ids,
2590.2.5 by Aaron Bentley
Allow selected files to be specified instead of selected ids
391
                  'interesting_files': self.interesting_files,
3008.1.11 by Michael Hudson
restore the default behaviour of Merge3Merger.__init__().
392
                  'pp': self.pp,
393
                  'do_merge': False}
1534.7.84 by Aaron Bentley
Added reprocess support, support for varying merge types
394
        if self.merge_type.requires_base:
395
            kwargs['base_tree'] = self.base_tree
1534.7.137 by Aaron Bentley
Avoided generating a new tree for every weave merge
396
        if self.merge_type.supports_reprocess:
397
            kwargs['reprocess'] = self.reprocess
398
        elif self.reprocess:
1551.6.14 by Aaron Bentley
Tweaks from merge review
399
            raise BzrError("Conflict reduction is not supported for merge"
400
                                  " type %s." % self.merge_type)
1534.7.137 by Aaron Bentley
Avoided generating a new tree for every weave merge
401
        if self.merge_type.supports_show_base:
402
            kwargs['show_base'] = self.show_base
403
        elif self.show_base:
1534.8.2 by Aaron Bentley
Implemented weave merge
404
            raise BzrError("Showing base is not supported for this"
3008.1.14 by Michael Hudson
trivial commit for testing
405
                           " merge type. %s" % self.merge_type)
3062.2.7 by Aaron Bentley
Prevent reverse cherry-picking with weave
406
        if (not getattr(self.merge_type, 'supports_reverse_cherrypick', True)
407
            and not self.base_is_other_ancestor):
408
            raise errors.CannotReverseCherrypick()
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
409
        if self.merge_type.supports_cherrypick:
3062.2.9 by Aaron Bentley
Don't use the base if not cherrypicking
410
            kwargs['cherrypick'] = (not self.base_is_ancestor or
411
                                    not self.base_is_other_ancestor)
3008.1.8 by Michael Hudson
extract merger creation into a method
412
        return self.merge_type(pb=self._pb,
413
                               change_reporter=self.change_reporter,
414
                               **kwargs)
415
416
    def do_merge(self):
2255.2.50 by John Arbash Meinel
merge only needs a lock_tree_write() on the working tree, not a full lock_write()
417
        self.this_tree.lock_tree_write()
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
418
        if self.base_tree is not None:
419
            self.base_tree.lock_read()
420
        if self.other_tree is not None:
421
            self.other_tree.lock_read()
422
        try:
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
423
            merge = self.make_merger()
3008.1.6 by Michael Hudson
chop up Merge3Merger.__init__ into pieces
424
            merge.do_merge()
2255.2.226 by Robert Collins
Get merge_nested finally working: change nested tree iterators to take file_ids, and ensure the right branch is connected to in the merge logic. May not be suitable for shared repositories yet.
425
            if self.recurse == 'down':
3504.2.2 by John Arbash Meinel
Find some code that thought we were dealing in absolute paths
426
                for relpath, file_id in self.this_tree.iter_references():
427
                    sub_tree = self.this_tree.get_nested_tree(file_id, relpath)
2255.2.226 by Robert Collins
Get merge_nested finally working: change nested tree iterators to take file_ids, and ensure the right branch is connected to in the merge logic. May not be suitable for shared repositories yet.
428
                    other_revision = self.other_tree.get_reference_revision(
3504.2.2 by John Arbash Meinel
Find some code that thought we were dealing in absolute paths
429
                        file_id, relpath)
2255.2.226 by Robert Collins
Get merge_nested finally working: change nested tree iterators to take file_ids, and ensure the right branch is connected to in the merge logic. May not be suitable for shared repositories yet.
430
                    if  other_revision == sub_tree.last_revision():
431
                        continue
432
                    sub_merge = Merger(sub_tree.branch, this_tree=sub_tree)
433
                    sub_merge.merge_type = self.merge_type
434
                    other_branch = self.other_branch.reference_parent(file_id, relpath)
435
                    sub_merge.set_other_revision(other_revision, other_branch)
436
                    base_revision = self.base_tree.get_reference_revision(file_id)
437
                    sub_merge.base_tree = \
438
                        sub_tree.branch.repository.revision_tree(base_revision)
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
439
                    sub_merge.base_rev_id = base_revision
2255.2.226 by Robert Collins
Get merge_nested finally working: change nested tree iterators to take file_ids, and ensure the right branch is connected to in the merge logic. May not be suitable for shared repositories yet.
440
                    sub_merge.do_merge()
441
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
442
        finally:
443
            if self.other_tree is not None:
444
                self.other_tree.unlock()
445
            if self.base_tree is not None:
446
                self.base_tree.unlock()
447
            self.this_tree.unlock()
1534.7.151 by Aaron Bentley
Fixed all changes applied successfully
448
        if len(merge.cooked_conflicts) == 0:
3200.1.1 by James Westby
Make pull --quiet more quiet. Fixes #185907.
449
            if not self.ignore_zero and not is_quiet():
1534.7.141 by Aaron Bentley
Added conflict reporting
450
                note("All changes applied successfully.")
451
        else:
452
            note("%d conflicts encountered." % len(merge.cooked_conflicts))
453
1534.7.134 by Aaron Bentley
Hid raw conflicts
454
        return len(merge.cooked_conflicts)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
455
1545.2.4 by Aaron Bentley
PEP8 fixes
456
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
457
class Merge3Merger(object):
1534.7.167 by Aaron Bentley
PEP8 and comment cleanups
458
    """Three-way merger that uses the merge3 text merger"""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
459
    requires_base = True
460
    supports_reprocess = True
461
    supports_show_base = True
462
    history_based = False
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
463
    supports_cherrypick = True
3062.2.7 by Aaron Bentley
Prevent reverse cherry-picking with weave
464
    supports_reverse_cherrypick = True
2590.2.7 by Aaron Bentley
Misc cleanup
465
    winner_idx = {"this": 2, "other": 1, "conflict": 1}
1534.7.167 by Aaron Bentley
PEP8 and comment cleanups
466
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
467
    def __init__(self, working_tree, this_tree, base_tree, other_tree, 
1558.2.2 by Aaron Bentley
Make remerge honour interesting-ids
468
                 interesting_ids=None, reprocess=False, show_base=False,
2590.2.5 by Aaron Bentley
Allow selected files to be specified instead of selected ids
469
                 pb=DummyProgress(), pp=None, change_reporter=None,
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
470
                 interesting_files=None, do_merge=True,
471
                 cherrypick=False):
2590.2.10 by Aaron Bentley
Updates from review
472
        """Initialize the merger object and perform the merge.
473
474
        :param working_tree: The working tree to apply the merge to
475
        :param this_tree: The local tree in the merge operation
476
        :param base_tree: The common tree in the merge operation
477
        :param other_tree: The other other tree to merge changes from
478
        :param interesting_ids: The file_ids of files that should be
479
            participate in the merge.  May not be combined with
480
            interesting_files.
481
        :param: reprocess If True, perform conflict-reduction processing.
482
        :param show_base: If True, show the base revision in text conflicts.
483
            (incompatible with reprocess)
484
        :param pb: A Progress bar
485
        :param pp: A ProgressPhase object
486
        :param change_reporter: An object that should report changes made
487
        :param interesting_files: The tree-relative paths of files that should
488
            participate in the merge.  If these paths refer to directories,
489
            the contents of those directories will also be included.  May not
490
            be combined with interesting_ids.  If neither interesting_files nor
491
            interesting_ids is specified, all files may participate in the
492
            merge.
493
        """
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
494
        object.__init__(self)
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
495
        if interesting_files is not None and interesting_ids is not None:
496
            raise ValueError(
497
                'specify either interesting_ids or interesting_files')
2590.2.4 by Aaron Bentley
Move entry generation to a helper
498
        self.interesting_ids = interesting_ids
2590.2.5 by Aaron Bentley
Allow selected files to be specified instead of selected ids
499
        self.interesting_files = interesting_files
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
500
        self.this_tree = working_tree
501
        self.base_tree = base_tree
502
        self.other_tree = other_tree
503
        self._raw_conflicts = []
504
        self.cooked_conflicts = []
505
        self.reprocess = reprocess
506
        self.show_base = show_base
1534.9.1 by Aaron Bentley
Added progress bars to merge
507
        self.pb = pb
1551.2.32 by Aaron Bentley
Handle progress phases more nicely in merge
508
        self.pp = pp
1551.11.9 by Aaron Bentley
Apply change reporting to merge
509
        self.change_reporter = change_reporter
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
510
        self.cherrypick = cherrypick
1551.2.32 by Aaron Bentley
Handle progress phases more nicely in merge
511
        if self.pp is None:
512
            self.pp = ProgressPhase("Merge phase", 3, self.pb)
3008.1.11 by Michael Hudson
restore the default behaviour of Merge3Merger.__init__().
513
        if do_merge:
514
            self.do_merge()
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
515
3008.1.6 by Michael Hudson
chop up Merge3Merger.__init__ into pieces
516
    def do_merge(self):
517
        self.this_tree.lock_tree_write()
518
        self.base_tree.lock_read()
519
        self.other_tree.lock_read()
520
        self.tt = TreeTransform(self.this_tree, self.pb)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
521
        try:
1551.2.32 by Aaron Bentley
Handle progress phases more nicely in merge
522
            self.pp.next_phase()
3008.1.21 by Aaron Bentley
Make compute_transform private, test make_preview_transform
523
            self._compute_transform()
1551.2.32 by Aaron Bentley
Handle progress phases more nicely in merge
524
            self.pp.next_phase()
2590.2.17 by Aaron Bentley
Avoid redundant conflict check
525
            results = self.tt.apply(no_conflicts=True)
1558.4.3 by Aaron Bentley
Merge_modified performance/concurrency fix
526
            self.write_modified(results)
1534.10.12 by Aaron Bentley
Merge produces new conflicts
527
            try:
3008.1.6 by Michael Hudson
chop up Merge3Merger.__init__ into pieces
528
                self.this_tree.add_conflicts(self.cooked_conflicts)
1534.10.12 by Aaron Bentley
Merge produces new conflicts
529
            except UnsupportedOperation:
530
                pass
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
531
        finally:
1711.7.7 by John Arbash Meinel
Don't squelch errors in tt.finalize()
532
            self.tt.finalize()
2255.7.52 by Robert Collins
Lock trees in Merge3Merger correctly.
533
            self.other_tree.unlock()
534
            self.base_tree.unlock()
535
            self.this_tree.unlock()
1551.2.31 by Aaron Bentley
Got merge and revert using nested pbs
536
            self.pb.clear()
1534.7.192 by Aaron Bentley
Record hashes produced by merges
537
3008.1.9 by Michael Hudson
wanton hacking that lets me write an efficient version of get_diff_as_merged
538
    def make_preview_transform(self):
539
        self.base_tree.lock_read()
540
        self.other_tree.lock_read()
541
        self.tt = TransformPreview(self.this_tree)
542
        try:
543
            self.pp.next_phase()
3008.1.21 by Aaron Bentley
Make compute_transform private, test make_preview_transform
544
            self._compute_transform()
3008.1.9 by Michael Hudson
wanton hacking that lets me write an efficient version of get_diff_as_merged
545
            self.pp.next_phase()
546
        finally:
547
            self.other_tree.unlock()
548
            self.base_tree.unlock()
549
            self.pb.clear()
550
        return self.tt
551
3008.1.21 by Aaron Bentley
Make compute_transform private, test make_preview_transform
552
    def _compute_transform(self):
3008.1.6 by Michael Hudson
chop up Merge3Merger.__init__ into pieces
553
        entries = self._entries3()
554
        child_pb = ui.ui_factory.nested_progress_bar()
555
        try:
556
            for num, (file_id, changed, parents3, names3,
557
                      executable3) in enumerate(entries):
558
                child_pb.update('Preparing file merge', num, len(entries))
559
                self._merge_names(file_id, parents3, names3)
560
                if changed:
561
                    file_status = self.merge_contents(file_id)
562
                else:
563
                    file_status = 'unmodified'
564
                self._merge_executable(file_id,
565
                    executable3, file_status)
566
        finally:
567
            child_pb.finished()
568
        self.fix_root()
569
        self.pp.next_phase()
570
        child_pb = ui.ui_factory.nested_progress_bar()
571
        try:
572
            fs_conflicts = resolve_conflicts(self.tt, child_pb,
573
                lambda t, c: conflict_pass(t, c, self.other_tree))
574
        finally:
575
            child_pb.finished()
576
        if self.change_reporter is not None:
577
            from bzrlib import delta
578
            delta.report_changes(
3254.1.1 by Aaron Bentley
Make Tree.iter_changes a public method
579
                self.tt.iter_changes(), self.change_reporter)
3008.1.6 by Michael Hudson
chop up Merge3Merger.__init__ into pieces
580
        self.cook_conflicts(fs_conflicts)
581
        for conflict in self.cooked_conflicts:
582
            warning(conflict)
583
2590.2.4 by Aaron Bentley
Move entry generation to a helper
584
    def _entries3(self):
2590.2.7 by Aaron Bentley
Misc cleanup
585
        """Gather data about files modified between three trees.
586
587
        Return a list of tuples of file_id, changed, parents3, names3,
588
        executable3.  changed is a boolean indicating whether the file contents
589
        or kind were changed.  parents3 is a tuple of parent ids for base,
590
        other and this.  names3 is a tuple of names for base, other and this.
591
        executable3 is a tuple of execute-bit values for base, other and this.
592
        """
2590.2.4 by Aaron Bentley
Move entry generation to a helper
593
        result = []
3254.1.1 by Aaron Bentley
Make Tree.iter_changes a public method
594
        iterator = self.other_tree.iter_changes(self.base_tree,
3514.2.16 by John Arbash Meinel
Review feedback from Ian.
595
                include_unchanged=True, specific_files=self.interesting_files,
2590.2.5 by Aaron Bentley
Allow selected files to be specified instead of selected ids
596
                extra_trees=[self.this_tree])
2590.2.4 by Aaron Bentley
Move entry generation to a helper
597
        for (file_id, paths, changed, versioned, parents, names, kind,
2590.2.5 by Aaron Bentley
Allow selected files to be specified instead of selected ids
598
             executable) in iterator:
2590.2.4 by Aaron Bentley
Move entry generation to a helper
599
            if (self.interesting_ids is not None and
600
                file_id not in self.interesting_ids):
601
                continue
602
            if file_id in self.this_tree.inventory:
603
                entry = self.this_tree.inventory[file_id]
604
                this_name = entry.name
605
                this_parent = entry.parent_id
606
                this_executable = entry.executable
607
            else:
608
                this_name = None
609
                this_parent = None
610
                this_executable = None
611
            parents3 = parents + (this_parent,)
612
            names3 = names + (this_name,)
613
            executable3 = executable + (this_executable,)
614
            result.append((file_id, changed, parents3, names3, executable3))
615
        return result
616
1731.1.33 by Aaron Bentley
Revert no-special-root changes
617
    def fix_root(self):
618
        try:
619
            self.tt.final_kind(self.tt.root)
620
        except NoSuchFile:
621
            self.tt.cancel_deletion(self.tt.root)
622
        if self.tt.final_file_id(self.tt.root) is None:
623
            self.tt.version_file(self.tt.tree_file_id(self.tt.root), 
624
                                 self.tt.root)
625
        if self.other_tree.inventory.root is None:
626
            return
2946.3.3 by John Arbash Meinel
Prefer tree.get_root_id() as more explicit than tree.path2id('')
627
        other_root_file_id = self.other_tree.get_root_id()
1731.1.33 by Aaron Bentley
Revert no-special-root changes
628
        other_root = self.tt.trans_id_file_id(other_root_file_id)
629
        if other_root == self.tt.root:
630
            return
631
        try:
632
            self.tt.final_kind(other_root)
633
        except NoSuchFile:
634
            return
635
        self.reparent_children(self.other_tree.inventory.root, self.tt.root)
636
        self.tt.cancel_creation(other_root)
637
        self.tt.cancel_versioning(other_root)
638
639
    def reparent_children(self, ie, target):
640
        for thing, child in ie.children.iteritems():
641
            trans_id = self.tt.trans_id_file_id(child.file_id)
642
            self.tt.adjust_path(self.tt.final_name(trans_id), target, trans_id)
643
1534.7.192 by Aaron Bentley
Record hashes produced by merges
644
    def write_modified(self, results):
645
        modified_hashes = {}
646
        for path in results.modified_paths:
647
            file_id = self.this_tree.path2id(self.this_tree.relpath(path))
648
            if file_id is None:
649
                continue
650
            hash = self.this_tree.get_file_sha1(file_id)
651
            if hash is None:
652
                continue
653
            modified_hashes[file_id] = hash
654
        self.this_tree.set_merge_modified(modified_hashes)
655
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
656
    @staticmethod
657
    def parent(entry, file_id):
1534.7.157 by Aaron Bentley
Added more docs
658
        """Determine the parent for a file_id (used as a key method)"""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
659
        if entry is None:
660
            return None
661
        return entry.parent_id
662
663
    @staticmethod
664
    def name(entry, file_id):
1534.7.157 by Aaron Bentley
Added more docs
665
        """Determine the name for a file_id (used as a key method)"""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
666
        if entry is None:
667
            return None
668
        return entry.name
669
    
670
    @staticmethod
671
    def contents_sha1(tree, file_id):
1534.7.157 by Aaron Bentley
Added more docs
672
        """Determine the sha1 of the file contents (used as a key method)."""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
673
        if file_id not in tree:
674
            return None
675
        return tree.get_file_sha1(file_id)
676
677
    @staticmethod
678
    def executable(tree, file_id):
1534.7.157 by Aaron Bentley
Added more docs
679
        """Determine the executability of a file-id (used as a key method)."""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
680
        if file_id not in tree:
681
            return None
682
        if tree.kind(file_id) != "file":
683
            return False
684
        return tree.is_executable(file_id)
685
686
    @staticmethod
687
    def kind(tree, file_id):
1534.7.157 by Aaron Bentley
Added more docs
688
        """Determine the kind of a file-id (used as a key method)."""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
689
        if file_id not in tree:
690
            return None
691
        return tree.kind(file_id)
692
693
    @staticmethod
2590.2.8 by Aaron Bentley
Restore conflict handling changes
694
    def _three_way(base, other, this):
695
        #if base == other, either they all agree, or only THIS has changed.
696
        if base == other:
697
            return 'this'
2590.2.10 by Aaron Bentley
Updates from review
698
        elif this not in (base, other):
2590.2.8 by Aaron Bentley
Restore conflict handling changes
699
            return 'conflict'
2590.2.10 by Aaron Bentley
Updates from review
700
        # "Ambiguous clean merge" -- both sides have made the same change.
2590.2.8 by Aaron Bentley
Restore conflict handling changes
701
        elif this == other:
702
            return "this"
2590.2.10 by Aaron Bentley
Updates from review
703
        # this == base: only other has changed.
2590.2.8 by Aaron Bentley
Restore conflict handling changes
704
        else:
705
            return "other"
706
707
    @staticmethod
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
708
    def scalar_three_way(this_tree, base_tree, other_tree, file_id, key):
709
        """Do a three-way test on a scalar.
710
        Return "this", "other" or "conflict", depending whether a value wins.
711
        """
712
        key_base = key(base_tree, file_id)
713
        key_other = key(other_tree, file_id)
714
        #if base == other, either they all agree, or only THIS has changed.
715
        if key_base == key_other:
716
            return "this"
717
        key_this = key(this_tree, file_id)
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
718
        # "Ambiguous clean merge"
719
        if key_this == key_other:
720
            return "this"
721
        elif key_this == key_base:
722
            return "other"
723
        else:
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
724
            return "conflict"
725
726
    def merge_names(self, file_id):
727
        def get_entry(tree):
728
            if file_id in tree.inventory:
729
                return tree.inventory[file_id]
730
            else:
731
                return None
732
        this_entry = get_entry(self.this_tree)
733
        other_entry = get_entry(self.other_tree)
734
        base_entry = get_entry(self.base_tree)
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
735
        entries = (base_entry, other_entry, this_entry)
736
        names = []
737
        parents = []
738
        for entry in entries:
739
            if entry is None:
740
                names.append(None)
741
                parents.append(None)
742
            else:
743
                names.append(entry.name)
744
                parents.append(entry.parent_id)
2590.2.2 by Aaron Bentley
Do most name merging from iter_changes output
745
        return self._merge_names(file_id, parents, names)
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
746
2590.2.2 by Aaron Bentley
Do most name merging from iter_changes output
747
    def _merge_names(self, file_id, parents, names):
2590.2.7 by Aaron Bentley
Misc cleanup
748
        """Perform a merge on file_id names and parents"""
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
749
        base_name, other_name, this_name = names
750
        base_parent, other_parent, this_parent = parents
2590.2.2 by Aaron Bentley
Do most name merging from iter_changes output
751
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
752
        name_winner = self._three_way(*names)
753
754
        parent_id_winner = self._three_way(*parents)
2590.2.2 by Aaron Bentley
Do most name merging from iter_changes output
755
        if this_name is None:
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
756
            if name_winner == "this":
757
                name_winner = "other"
758
            if parent_id_winner == "this":
759
                parent_id_winner = "other"
760
        if name_winner == "this" and parent_id_winner == "this":
761
            return
762
        if name_winner == "conflict":
1534.7.181 by Aaron Bentley
Renamed a bunch of functions
763
            trans_id = self.tt.trans_id_file_id(file_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
764
            self._raw_conflicts.append(('name conflict', trans_id, 
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
765
                                        this_name, other_name))
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
766
        if parent_id_winner == "conflict":
1534.7.181 by Aaron Bentley
Renamed a bunch of functions
767
            trans_id = self.tt.trans_id_file_id(file_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
768
            self._raw_conflicts.append(('parent conflict', trans_id, 
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
769
                                        this_parent, other_parent))
2590.2.2 by Aaron Bentley
Do most name merging from iter_changes output
770
        if other_name is None:
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
771
            # it doesn't matter whether the result was 'other' or 
772
            # 'conflict'-- if there's no 'other', we leave it alone.
773
            return
774
        # if we get here, name_winner and parent_winner are set to safe values.
1534.7.181 by Aaron Bentley
Renamed a bunch of functions
775
        trans_id = self.tt.trans_id_file_id(file_id)
2590.2.7 by Aaron Bentley
Misc cleanup
776
        parent_id = parents[self.winner_idx[parent_id_winner]]
1731.1.33 by Aaron Bentley
Revert no-special-root changes
777
        if parent_id is not None:
778
            parent_trans_id = self.tt.trans_id_file_id(parent_id)
2590.2.7 by Aaron Bentley
Misc cleanup
779
            self.tt.adjust_path(names[self.winner_idx[name_winner]],
1731.1.33 by Aaron Bentley
Revert no-special-root changes
780
                                parent_trans_id, trans_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
781
782
    def merge_contents(self, file_id):
1534.7.157 by Aaron Bentley
Added more docs
783
        """Performa a merge on file_id contents."""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
784
        def contents_pair(tree):
785
            if file_id not in tree:
786
                return (None, None)
787
            kind = tree.kind(file_id)
788
            if kind == "file":
789
                contents = tree.get_file_sha1(file_id)
790
            elif kind == "symlink":
791
                contents = tree.get_symlink_target(file_id)
792
            else:
793
                contents = None
794
            return kind, contents
1558.15.3 by Aaron Bentley
Handle binary files for diff3 merges
795
796
        def contents_conflict():
797
            trans_id = self.tt.trans_id_file_id(file_id)
798
            name = self.tt.final_name(trans_id)
799
            parent_id = self.tt.final_parent(trans_id)
800
            if file_id in self.this_tree.inventory:
801
                self.tt.unversion_file(trans_id)
1551.10.2 by Aaron Bentley
Handle merge with dangling inventory entries
802
                if file_id in self.this_tree:
803
                    self.tt.delete_contents(trans_id)
1558.15.3 by Aaron Bentley
Handle binary files for diff3 merges
804
            file_group = self._dump_conflicts(name, parent_id, file_id, 
805
                                              set_version=True)
806
            self._raw_conflicts.append(('contents conflict', file_group))
807
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
808
        # See SPOT run.  run, SPOT, run.
809
        # So we're not QUITE repeating ourselves; we do tricky things with
810
        # file kind...
811
        base_pair = contents_pair(self.base_tree)
812
        other_pair = contents_pair(self.other_tree)
813
        if base_pair == other_pair:
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
814
            # OTHER introduced no changes
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
815
            return "unmodified"
816
        this_pair = contents_pair(self.this_tree)
817
        if this_pair == other_pair:
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
818
            # THIS and OTHER introduced the same changes
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
819
            return "unmodified"
820
        else:
1534.7.181 by Aaron Bentley
Renamed a bunch of functions
821
            trans_id = self.tt.trans_id_file_id(file_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
822
            if this_pair == base_pair:
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
823
                # only OTHER introduced changes
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
824
                if file_id in self.this_tree:
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
825
                    # Remove any existing contents
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
826
                    self.tt.delete_contents(trans_id)
1534.7.147 by Aaron Bentley
Tweak to check inventory, not tree for file ids
827
                if file_id in self.other_tree:
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
828
                    # OTHER changed the file
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
829
                    create_by_entry(self.tt, 
830
                                    self.other_tree.inventory[file_id], 
831
                                    self.other_tree, trans_id)
1534.7.147 by Aaron Bentley
Tweak to check inventory, not tree for file ids
832
                    if file_id not in self.this_tree.inventory:
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
833
                        self.tt.version_file(file_id, trans_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
834
                    return "modified"
1534.7.147 by Aaron Bentley
Tweak to check inventory, not tree for file ids
835
                elif file_id in self.this_tree.inventory:
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
836
                    # OTHER deleted the file
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
837
                    self.tt.unversion_file(trans_id)
838
                    return "deleted"
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
839
            #BOTH THIS and OTHER introduced changes; scalar conflict
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
840
            elif this_pair[0] == "file" and other_pair[0] == "file":
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
841
                # THIS and OTHER are both files, so text merge.  Either
842
                # BASE is a file, or both converted to files, so at least we
843
                # have agreement that output should be a file.
1558.15.3 by Aaron Bentley
Handle binary files for diff3 merges
844
                try:
845
                    self.text_merge(file_id, trans_id)
846
                except BinaryFile:
847
                    return contents_conflict()
1534.7.147 by Aaron Bentley
Tweak to check inventory, not tree for file ids
848
                if file_id not in self.this_tree.inventory:
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
849
                    self.tt.version_file(file_id, trans_id)
1534.7.152 by Aaron Bentley
Fixed overwrites
850
                try:
851
                    self.tt.tree_kind(trans_id)
852
                    self.tt.delete_contents(trans_id)
853
                except NoSuchFile:
854
                    pass
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
855
                return "modified"
856
            else:
1534.7.145 by Aaron Bentley
More fixups after get_trans_id
857
                # Scalar conflict, can't text merge.  Dump conflicts
1558.15.3 by Aaron Bentley
Handle binary files for diff3 merges
858
                return contents_conflict()
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
859
860
    def get_lines(self, tree, file_id):
1534.7.157 by Aaron Bentley
Added more docs
861
        """Return the lines in a file, or an empty list."""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
862
        if file_id in tree:
863
            return tree.get_file(file_id).readlines()
864
        else:
865
            return []
866
867
    def text_merge(self, file_id, trans_id):
868
        """Perform a three-way text merge on a file_id"""
869
        # it's possible that we got here with base as a different type.
870
        # if so, we just want two-way text conflicts.
871
        if file_id in self.base_tree and \
872
            self.base_tree.kind(file_id) == "file":
873
            base_lines = self.get_lines(self.base_tree, file_id)
874
        else:
875
            base_lines = []
876
        other_lines = self.get_lines(self.other_tree, file_id)
877
        this_lines = self.get_lines(self.this_tree, file_id)
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
878
        m3 = Merge3(base_lines, this_lines, other_lines,
879
                    is_cherrypick=self.cherrypick)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
880
        start_marker = "!START OF MERGE CONFLICT!" + "I HOPE THIS IS UNIQUE"
881
        if self.show_base is True:
882
            base_marker = '|' * 7
883
        else:
884
            base_marker = None
885
886
        def iter_merge3(retval):
887
            retval["text_conflicts"] = False
888
            for line in m3.merge_lines(name_a = "TREE", 
889
                                       name_b = "MERGE-SOURCE", 
890
                                       name_base = "BASE-REVISION",
891
                                       start_marker=start_marker, 
892
                                       base_marker=base_marker,
893
                                       reprocess=self.reprocess):
894
                if line.startswith(start_marker):
895
                    retval["text_conflicts"] = True
896
                    yield line.replace(start_marker, '<' * 7)
897
                else:
898
                    yield line
899
        retval = {}
900
        merge3_iterator = iter_merge3(retval)
901
        self.tt.create_file(merge3_iterator, trans_id)
902
        if retval["text_conflicts"] is True:
903
            self._raw_conflicts.append(('text conflict', trans_id))
904
            name = self.tt.final_name(trans_id)
905
            parent_id = self.tt.final_parent(trans_id)
906
            file_group = self._dump_conflicts(name, parent_id, file_id, 
907
                                              this_lines, base_lines,
908
                                              other_lines)
909
            file_group.append(trans_id)
910
911
    def _dump_conflicts(self, name, parent_id, file_id, this_lines=None, 
912
                        base_lines=None, other_lines=None, set_version=False,
913
                        no_base=False):
1534.7.157 by Aaron Bentley
Added more docs
914
        """Emit conflict files.
915
        If this_lines, base_lines, or other_lines are omitted, they will be
916
        determined automatically.  If set_version is true, the .OTHER, .THIS
917
        or .BASE (in that order) will be created as versioned files.
918
        """
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
919
        data = [('OTHER', self.other_tree, other_lines), 
920
                ('THIS', self.this_tree, this_lines)]
921
        if not no_base:
922
            data.append(('BASE', self.base_tree, base_lines))
923
        versioned = False
924
        file_group = []
925
        for suffix, tree, lines in data:
926
            if file_id in tree:
927
                trans_id = self._conflict_file(name, parent_id, tree, file_id,
928
                                               suffix, lines)
929
                file_group.append(trans_id)
930
                if set_version and not versioned:
931
                    self.tt.version_file(file_id, trans_id)
932
                    versioned = True
933
        return file_group
934
           
935
    def _conflict_file(self, name, parent_id, tree, file_id, suffix, 
936
                       lines=None):
1534.7.157 by Aaron Bentley
Added more docs
937
        """Emit a single conflict file."""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
938
        name = name + '.' + suffix
939
        trans_id = self.tt.create_path(name, parent_id)
940
        entry = tree.inventory[file_id]
941
        create_by_entry(self.tt, entry, tree, trans_id, lines)
942
        return trans_id
943
944
    def merge_executable(self, file_id, file_status):
1534.7.157 by Aaron Bentley
Added more docs
945
        """Perform a merge on the execute bit."""
2590.2.3 by Aaron Bentley
Merge the execute bit based on iter_changes
946
        executable = [self.executable(t, file_id) for t in (self.base_tree,
947
                      self.other_tree, self.this_tree)]
948
        self._merge_executable(file_id, executable, file_status)
949
950
    def _merge_executable(self, file_id, executable, file_status):
951
        """Perform a merge on the execute bit."""
952
        base_executable, other_executable, this_executable = executable
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
953
        if file_status == "deleted":
954
            return
2590.2.3 by Aaron Bentley
Merge the execute bit based on iter_changes
955
        winner = self._three_way(*executable)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
956
        if winner == "conflict":
957
        # There must be a None in here, if we have a conflict, but we
958
        # need executability since file status was not deleted.
1534.10.35 by Aaron Bentley
Merge handles contents + executable + deletion conflict
959
            if self.executable(self.other_tree, file_id) is None:
1534.7.142 by Aaron Bentley
Fixed executability conflicts
960
                winner = "this"
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
961
            else:
1534.7.142 by Aaron Bentley
Fixed executability conflicts
962
                winner = "other"
1551.19.30 by Aaron Bentley
Accelerate merge by skipping file existence check when merging execute bit
963
        if winner == 'this' and file_status != "modified":
964
            return
965
        trans_id = self.tt.trans_id_file_id(file_id)
966
        try:
967
            if self.tt.final_kind(trans_id) != "file":
968
                return
969
        except NoSuchFile:
970
            return
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
971
        if winner == "this":
1551.19.30 by Aaron Bentley
Accelerate merge by skipping file existence check when merging execute bit
972
            executability = this_executable
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
973
        else:
974
            if file_id in self.other_tree:
2590.2.3 by Aaron Bentley
Merge the execute bit based on iter_changes
975
                executability = other_executable
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
976
            elif file_id in self.this_tree:
2590.2.3 by Aaron Bentley
Merge the execute bit based on iter_changes
977
                executability = this_executable
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
978
            elif file_id in self.base_tree:
2590.2.3 by Aaron Bentley
Merge the execute bit based on iter_changes
979
                executability = base_executable
1551.19.30 by Aaron Bentley
Accelerate merge by skipping file existence check when merging execute bit
980
        if executability is not None:
981
            trans_id = self.tt.trans_id_file_id(file_id)
982
            self.tt.set_executability(executability, trans_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
983
1534.7.172 by Aaron Bentley
Integrated fs conflicts with merge conflicts.
984
    def cook_conflicts(self, fs_conflicts):
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
985
        """Convert all conflicts into a form that doesn't depend on trans_id"""
1534.10.19 by Aaron Bentley
Stanza conversion, cooking
986
        from conflicts import Conflict
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
987
        name_conflicts = {}
1534.7.172 by Aaron Bentley
Integrated fs conflicts with merge conflicts.
988
        self.cooked_conflicts.extend(cook_conflicts(fs_conflicts, self.tt))
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
989
        fp = FinalPaths(self.tt)
990
        for conflict in self._raw_conflicts:
991
            conflict_type = conflict[0]
992
            if conflict_type in ('name conflict', 'parent conflict'):
993
                trans_id = conflict[1]
994
                conflict_args = conflict[2:]
995
                if trans_id not in name_conflicts:
996
                    name_conflicts[trans_id] = {}
997
                unique_add(name_conflicts[trans_id], conflict_type, 
998
                           conflict_args)
999
            if conflict_type == 'contents conflict':
1000
                for trans_id in conflict[1]:
1001
                    file_id = self.tt.final_file_id(trans_id)
1002
                    if file_id is not None:
1003
                        break
1004
                path = fp.get_path(trans_id)
1005
                for suffix in ('.BASE', '.THIS', '.OTHER'):
1006
                    if path.endswith(suffix):
1007
                        path = path[:-len(suffix)]
1008
                        break
1534.10.19 by Aaron Bentley
Stanza conversion, cooking
1009
                c = Conflict.factory(conflict_type, path=path, file_id=file_id)
1010
                self.cooked_conflicts.append(c)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1011
            if conflict_type == 'text conflict':
1012
                trans_id = conflict[1]
1013
                path = fp.get_path(trans_id)
1014
                file_id = self.tt.final_file_id(trans_id)
1534.10.19 by Aaron Bentley
Stanza conversion, cooking
1015
                c = Conflict.factory(conflict_type, path=path, file_id=file_id)
1016
                self.cooked_conflicts.append(c)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1017
1018
        for trans_id, conflicts in name_conflicts.iteritems():
1019
            try:
1020
                this_parent, other_parent = conflicts['parent conflict']
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
1021
                if this_parent == other_parent:
1022
                    raise AssertionError()
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1023
            except KeyError:
1024
                this_parent = other_parent = \
1025
                    self.tt.final_file_id(self.tt.final_parent(trans_id))
1026
            try:
1027
                this_name, other_name = conflicts['name conflict']
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
1028
                if this_name == other_name:
1029
                    raise AssertionError()
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1030
            except KeyError:
1031
                this_name = other_name = self.tt.final_name(trans_id)
1032
            other_path = fp.get_path(trans_id)
1551.16.2 by Aaron Bentley
Don't crash on merging renamed deleted files (#110279)
1033
            if this_parent is not None and this_name is not None:
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1034
                this_parent_path = \
1534.7.181 by Aaron Bentley
Renamed a bunch of functions
1035
                    fp.get_path(self.tt.trans_id_file_id(this_parent))
1534.7.166 by Aaron Bentley
Swapped os.path.join for pathjoin everywhere
1036
                this_path = pathjoin(this_parent_path, this_name)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1037
            else:
1038
                this_path = "<deleted>"
1039
            file_id = self.tt.final_file_id(trans_id)
1534.10.20 by Aaron Bentley
Got all tests passing
1040
            c = Conflict.factory('path conflict', path=this_path,
1534.10.19 by Aaron Bentley
Stanza conversion, cooking
1041
                                 conflict_path=other_path, file_id=file_id)
1042
            self.cooked_conflicts.append(c)
1666.1.4 by Robert Collins
* 'Metadir' is now the default disk format. This improves behaviour in
1043
        self.cooked_conflicts.sort(key=Conflict.sort_key)
1534.7.141 by Aaron Bentley
Added conflict reporting
1044
1045
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1046
class WeaveMerger(Merge3Merger):
1534.7.167 by Aaron Bentley
PEP8 and comment cleanups
1047
    """Three-way tree merger, text weave merger."""
1551.6.8 by Aaron Bentley
Implemented reprocess for weave
1048
    supports_reprocess = True
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1049
    supports_show_base = False
3062.2.7 by Aaron Bentley
Prevent reverse cherry-picking with weave
1050
    supports_reverse_cherrypick = False
3062.2.9 by Aaron Bentley
Don't use the base if not cherrypicking
1051
    history_based = True
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1052
1053
    def _merged_lines(self, file_id):
1054
        """Generate the merged lines.
1055
        There is no distinction between lines that are meant to contain <<<<<<<
1056
        and conflicts.
1057
        """
3062.2.9 by Aaron Bentley
Don't use the base if not cherrypicking
1058
        if self.cherrypick:
1059
            base = self.base_tree
1060
        else:
1061
            base = None
3062.2.4 by Aaron Bentley
Start supporting merge-with-base
1062
        plan = self.this_tree.plan_file_merge(file_id, self.other_tree,
3062.2.9 by Aaron Bentley
Don't use the base if not cherrypicking
1063
                                              base=base)
1551.19.17 by Aaron Bentley
Add debugging flag for merges
1064
        if 'merge' in debug.debug_flags:
1065
            plan = list(plan)
1066
            trans_id = self.tt.trans_id_file_id(file_id)
1067
            name = self.tt.final_name(trans_id) + '.plan'
1068
            contents = ('%10s|%s' % l for l in plan)
1069
            self.tt.new_file(name, self.tt.final_parent(trans_id), contents)
1551.15.52 by Aaron Bentley
Tweak from review comments
1070
        textmerge = PlanWeaveMerge(plan, '<<<<<<< TREE\n',
1071
            '>>>>>>> MERGE-SOURCE\n')
1072
        return textmerge.merge_lines(self.reprocess)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1073
1074
    def text_merge(self, file_id, trans_id):
1534.7.157 by Aaron Bentley
Added more docs
1075
        """Perform a (weave) text merge for a given file and file-id.
1076
        If conflicts are encountered, .THIS and .OTHER files will be emitted,
1077
        and a conflict will be noted.
1078
        """
1551.6.12 by Aaron Bentley
Indicate conflicts from merge_lines, insead of guessing
1079
        lines, conflicts = self._merged_lines(file_id)
1558.15.10 by Aaron Bentley
Merge bzr.dev
1080
        lines = list(lines)
1558.15.5 by Aaron Bentley
Fixed binary handling in weave merge
1081
        # Note we're checking whether the OUTPUT is binary in this case, 
1082
        # because we don't want to get into weave merge guts.
1083
        check_text_lines(lines)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1084
        self.tt.create_file(lines, trans_id)
1085
        if conflicts:
1086
            self._raw_conflicts.append(('text conflict', trans_id))
1087
            name = self.tt.final_name(trans_id)
1088
            parent_id = self.tt.final_parent(trans_id)
1089
            file_group = self._dump_conflicts(name, parent_id, file_id, 
1090
                                              no_base=True)
1091
            file_group.append(trans_id)
1092
1093
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1094
class LCAMerger(WeaveMerger):
1095
1096
    def _merged_lines(self, file_id):
1097
        """Generate the merged lines.
1098
        There is no distinction between lines that are meant to contain <<<<<<<
1099
        and conflicts.
1100
        """
1101
        if self.cherrypick:
1102
            base = self.base_tree
1103
        else:
1104
            base = None
1105
        plan = self.this_tree.plan_file_lca_merge(file_id, self.other_tree,
1106
                                                  base=base)
1107
        if 'merge' in debug.debug_flags:
1108
            plan = list(plan)
1109
            trans_id = self.tt.trans_id_file_id(file_id)
1110
            name = self.tt.final_name(trans_id) + '.plan'
1111
            contents = ('%10s|%s' % l for l in plan)
1112
            self.tt.new_file(name, self.tt.final_parent(trans_id), contents)
1113
        textmerge = PlanWeaveMerge(plan, '<<<<<<< TREE\n',
1114
            '>>>>>>> MERGE-SOURCE\n')
1115
        return textmerge.merge_lines(self.reprocess)
1116
1117
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1118
class Diff3Merger(Merge3Merger):
1534.7.167 by Aaron Bentley
PEP8 and comment cleanups
1119
    """Three-way merger using external diff3 for text merging"""
1711.7.20 by John Arbash Meinel
always close files, minor PEP8 cleanup
1120
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1121
    def dump_file(self, temp_dir, name, tree, file_id):
1122
        out_path = pathjoin(temp_dir, name)
1711.7.20 by John Arbash Meinel
always close files, minor PEP8 cleanup
1123
        out_file = open(out_path, "wb")
1124
        try:
1125
            in_file = tree.get_file(file_id)
1126
            for line in in_file:
1127
                out_file.write(line)
1128
        finally:
1129
            out_file.close()
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1130
        return out_path
1131
1132
    def text_merge(self, file_id, trans_id):
1534.7.157 by Aaron Bentley
Added more docs
1133
        """Perform a diff3 merge using a specified file-id and trans-id.
1134
        If conflicts are encountered, .BASE, .THIS. and .OTHER conflict files
1135
        will be dumped, and a will be conflict noted.
1136
        """
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1137
        import bzrlib.patch
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
1138
        temp_dir = osutils.mkdtemp(prefix="bzr-")
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1139
        try:
1534.7.166 by Aaron Bentley
Swapped os.path.join for pathjoin everywhere
1140
            new_file = pathjoin(temp_dir, "new")
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1141
            this = self.dump_file(temp_dir, "this", self.this_tree, file_id)
1142
            base = self.dump_file(temp_dir, "base", self.base_tree, file_id)
1143
            other = self.dump_file(temp_dir, "other", self.other_tree, file_id)
1144
            status = bzrlib.patch.diff3(new_file, this, base, other)
1145
            if status not in (0, 1):
1146
                raise BzrError("Unhandled diff3 exit code")
1711.7.20 by John Arbash Meinel
always close files, minor PEP8 cleanup
1147
            f = open(new_file, 'rb')
1148
            try:
1149
                self.tt.create_file(f, trans_id)
1150
            finally:
1151
                f.close()
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1152
            if status == 1:
1153
                name = self.tt.final_name(trans_id)
1154
                parent_id = self.tt.final_parent(trans_id)
1155
                self._dump_conflicts(name, parent_id, file_id)
1551.8.39 by Aaron Bentley
Fix diff3 conflict-reporting bug
1156
                self._raw_conflicts.append(('text conflict', trans_id))
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1157
        finally:
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
1158
            osutils.rmtree(temp_dir)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1159
1160
1161
def merge_inner(this_branch, other_tree, base_tree, ignore_zero=False,
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
1162
                backup_files=False,
1163
                merge_type=Merge3Merger,
1164
                interesting_ids=None,
1165
                show_base=False,
1166
                reprocess=False,
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1167
                other_rev_id=None,
1168
                interesting_files=None,
1534.9.9 by Aaron Bentley
Added progress bar to pull
1169
                this_tree=None,
1551.11.10 by Aaron Bentley
Add change reporting to pull
1170
                pb=DummyProgress(),
1171
                change_reporter=None):
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1172
    """Primary interface for merging. 
1173
1174
        typical use is probably 
1175
        'merge_inner(branch, branch.get_revision_tree(other_revision),
1176
                     branch.get_revision_tree(base_revision))'
1177
        """
1178
    if this_tree is None:
2367.2.1 by Robert Collins
Remove bzrlib 0.8 compatability where it was making the code unclear or messy. (Robert Collins)
1179
        raise BzrError("bzrlib.merge.merge_inner requires a this_tree "
1180
            "parameter as of bzrlib version 0.8.")
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
1181
    merger = Merger(this_branch, other_tree, base_tree, this_tree=this_tree,
1551.11.10 by Aaron Bentley
Add change reporting to pull
1182
                    pb=pb, change_reporter=change_reporter)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1183
    merger.backup_files = backup_files
1184
    merger.merge_type = merge_type
1185
    merger.interesting_ids = interesting_ids
1551.2.23 by Aaron Bentley
Got merge_inner's ignore_zero parameter working
1186
    merger.ignore_zero = ignore_zero
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1187
    if interesting_files:
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
1188
        if interesting_ids:
1189
            raise ValueError('Only supply interesting_ids'
1190
                             ' or interesting_files')
2590.2.5 by Aaron Bentley
Allow selected files to be specified instead of selected ids
1191
        merger.interesting_files = interesting_files
1979.2.1 by Robert Collins
(robertc) adds a convenience method "merge_from_branch" to WorkingTree.
1192
    merger.show_base = show_base
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1193
    merger.reprocess = reprocess
1194
    merger.other_rev_id = other_rev_id
1195
    merger.other_basis = other_rev_id
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
1196
    get_revision_id = getattr(base_tree, 'get_revision_id', None)
1197
    if get_revision_id is None:
1198
        get_revision_id = base_tree.last_revision
1199
    merger.set_base_revision(get_revision_id(), this_branch)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1200
    return merger.do_merge()
1201
2221.4.15 by Aaron Bentley
Use RegistryOption for merge type
1202
def get_merge_type_registry():
2221.4.17 by Aaron Bentley
PEP8-ness
1203
    """Merge type registry is in bzrlib.option to avoid circular imports.
2221.4.15 by Aaron Bentley
Use RegistryOption for merge type
1204
1205
    This method provides a sanctioned way to retrieve it.
1206
    """
1207
    from bzrlib import option
2221.4.16 by Aaron Bentley
Add tests for get_merge_type_registry
1208
    return option._merge_type_registry
1551.15.46 by Aaron Bentley
Move plan merge to tree
1209
1210
1211
def _plan_annotate_merge(annotated_a, annotated_b, ancestors_a, ancestors_b):
1212
    def status_a(revision, text):
1213
        if revision in ancestors_b:
1214
            return 'killed-b', text
1215
        else:
1216
            return 'new-a', text
1217
1218
    def status_b(revision, text):
1219
        if revision in ancestors_a:
1220
            return 'killed-a', text
1221
        else:
1222
            return 'new-b', text
1223
1224
    plain_a = [t for (a, t) in annotated_a]
1225
    plain_b = [t for (a, t) in annotated_b]
1226
    matcher = patiencediff.PatienceSequenceMatcher(None, plain_a, plain_b)
1227
    blocks = matcher.get_matching_blocks()
1228
    a_cur = 0
1229
    b_cur = 0
1230
    for ai, bi, l in blocks:
1231
        # process all mismatched sections
1232
        # (last mismatched section is handled because blocks always
1233
        # includes a 0-length last block)
1234
        for revision, text in annotated_a[a_cur:ai]:
1235
            yield status_a(revision, text)
1236
        for revision, text in annotated_b[b_cur:bi]:
1237
            yield status_b(revision, text)
1238
        # and now the matched section
1239
        a_cur = ai + l
1240
        b_cur = bi + l
3376.2.8 by Martin Pool
Some review cleanups for assertion removal
1241
        for text_a in plain_a[ai:a_cur]:
1551.15.46 by Aaron Bentley
Move plan merge to tree
1242
            yield "unchanged", text_a
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1243
1244
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1245
class _PlanMergeBase(object):
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1246
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1247
    def __init__(self, a_rev, b_rev, vf, key_prefix):
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1248
        """Contructor.
1249
1250
        :param a_rev: Revision-id of one revision to merge
1251
        :param b_rev: Revision-id of the other revision to merge
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1252
        :param vf: A VersionedFiles containing both revisions
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1253
        :param key_prefix: A prefix for accessing keys in vf, typically
1254
            (file_id,).
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1255
        """
1256
        self.a_rev = a_rev
1257
        self.b_rev = b_rev
1258
        self.vf = vf
3062.1.12 by Aaron Bentley
Implement simple text cache
1259
        self._last_lines = None
1260
        self._last_lines_revision_id = None
3144.3.7 by Aaron Bentley
Update from review
1261
        self._cached_matching_blocks = {}
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1262
        self._key_prefix = key_prefix
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1263
        self._precache_tip_lines()
1264
1265
    def _precache_tip_lines(self):
1266
        lines = self.get_lines([self.a_rev, self.b_rev])
1267
        self.lines_a = lines[self.a_rev]
1268
        self.lines_b = lines[self.b_rev]
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1269
1270
    def get_lines(self, revisions):
1271
        """Get lines for revisions from the backing VersionedFiles.
1272
        
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1273
        :raises RevisionNotPresent: on absent texts.
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1274
        """
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1275
        keys = [(self._key_prefix + (rev,)) for rev in revisions]
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1276
        result = {}
1277
        for record in self.vf.get_record_stream(keys, 'unordered', True):
1278
            if record.storage_kind == 'absent':
1279
                raise errors.RevisionNotPresent(record.key, self.vf)
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1280
            result[record.key[-1]] = osutils.split_lines(
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1281
                record.get_bytes_as('fulltext'))
1282
        return result
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1283
1284
    def plan_merge(self):
1285
        """Generate a 'plan' for merging the two revisions.
1286
1287
        This involves comparing their texts and determining the cause of
1288
        differences.  If text A has a line and text B does not, then either the
1289
        line was added to text A, or it was deleted from B.  Once the causes
1290
        are combined, they are written out in the format described in
1291
        VersionedFile.plan_merge
1292
        """
1293
        blocks = self._get_matching_blocks(self.a_rev, self.b_rev)
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1294
        unique_a, unique_b = self._unique_lines(blocks)
1295
        new_a, killed_b = self._determine_status(self.a_rev, unique_a)
1296
        new_b, killed_a = self._determine_status(self.b_rev, unique_b)
1297
        return self._iter_plan(blocks, new_a, killed_b, new_b, killed_a)
1298
1299
    def _iter_plan(self, blocks, new_a, killed_b, new_b, killed_a):
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1300
        last_i = 0
1301
        last_j = 0
1302
        for i, j, n in blocks:
1303
            for a_index in range(last_i, i):
1304
                if a_index in new_a:
3144.3.2 by Aaron Bentley
Get conflict handling working
1305
                    if a_index in killed_b:
1306
                        yield 'conflicted-a', self.lines_a[a_index]
1307
                    else:
1308
                        yield 'new-a', self.lines_a[a_index]
1309
                else:
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1310
                    yield 'killed-b', self.lines_a[a_index]
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1311
            for b_index in range(last_j, j):
1312
                if b_index in new_b:
3144.3.2 by Aaron Bentley
Get conflict handling working
1313
                    if b_index in killed_a:
3144.3.10 by Aaron Bentley
Use correct index when emitting conflicted-b
1314
                        yield 'conflicted-b', self.lines_b[b_index]
3144.3.2 by Aaron Bentley
Get conflict handling working
1315
                    else:
1316
                        yield 'new-b', self.lines_b[b_index]
1317
                else:
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1318
                    yield 'killed-a', self.lines_b[b_index]
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1319
            # handle common lines
1320
            for a_index in range(i, i+n):
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1321
                yield 'unchanged', self.lines_a[a_index]
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1322
            last_i = i+n
1323
            last_j = j+n
1324
1325
    def _get_matching_blocks(self, left_revision, right_revision):
1326
        """Return a description of which sections of two revisions match.
1327
1328
        See SequenceMatcher.get_matching_blocks
1329
        """
3144.3.7 by Aaron Bentley
Update from review
1330
        cached = self._cached_matching_blocks.get((left_revision,
1331
                                                   right_revision))
1332
        if cached is not None:
1333
            return cached
3062.1.12 by Aaron Bentley
Implement simple text cache
1334
        if self._last_lines_revision_id == left_revision:
1335
            left_lines = self._last_lines
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1336
            right_lines = self.get_lines([right_revision])[right_revision]
3062.1.12 by Aaron Bentley
Implement simple text cache
1337
        else:
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1338
            lines = self.get_lines([left_revision, right_revision])
1339
            left_lines = lines[left_revision]
1340
            right_lines = lines[right_revision]
3062.1.12 by Aaron Bentley
Implement simple text cache
1341
        self._last_lines = right_lines
1342
        self._last_lines_revision_id = right_revision
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1343
        matcher = patiencediff.PatienceSequenceMatcher(None, left_lines,
1344
                                                       right_lines)
1345
        return matcher.get_matching_blocks()
1346
1347
    def _unique_lines(self, matching_blocks):
1348
        """Analyse matching_blocks to determine which lines are unique
1349
1350
        :return: a tuple of (unique_left, unique_right), where the values are
1351
            sets of line numbers of unique lines.
1352
        """
1353
        last_i = 0
1354
        last_j = 0
1355
        unique_left = []
1356
        unique_right = []
1357
        for i, j, n in matching_blocks:
1358
            unique_left.extend(range(last_i, i))
1359
            unique_right.extend(range(last_j, j))
1360
            last_i = i + n
1361
            last_j = j + n
1362
        return unique_left, unique_right
1363
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1364
    @staticmethod
1365
    def _subtract_plans(old_plan, new_plan):
3144.3.7 by Aaron Bentley
Update from review
1366
        """Remove changes from new_plan that came from old_plan.
1367
1368
        It is assumed that the difference between the old_plan and new_plan
1369
        is their choice of 'b' text.
1370
1371
        All lines from new_plan that differ from old_plan are emitted
1372
        verbatim.  All lines from new_plan that match old_plan but are
1373
        not about the 'b' revision are emitted verbatim.
1374
1375
        Lines that match and are about the 'b' revision are the lines we
1376
        don't want, so we convert 'killed-b' -> 'unchanged', and 'new-b'
1377
        is skipped entirely.
1378
        """
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1379
        matcher = patiencediff.PatienceSequenceMatcher(None, old_plan,
1380
                                                       new_plan)
1381
        last_j = 0
1382
        for i, j, n in matcher.get_matching_blocks():
1383
            for jj in range(last_j, j):
1384
                yield new_plan[jj]
1385
            for jj in range(j, j+n):
1386
                plan_line = new_plan[jj]
1387
                if plan_line[0] == 'new-b':
1388
                    pass
1389
                elif plan_line[0] == 'killed-b':
1390
                    yield 'unchanged', plan_line[1]
1391
                else:
1392
                    yield plan_line
1393
            last_j = j + n
1394
1395
1396
class _PlanMerge(_PlanMergeBase):
1397
    """Plan an annotate merge using on-the-fly annotation"""
1398
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1399
    def __init__(self, a_rev, b_rev, vf, key_prefix):
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1400
        super(_PlanMerge, self).__init__(a_rev, b_rev, vf, key_prefix)
1401
        self.a_key = self._key_prefix + (self.a_rev,)
1402
        self.b_key = self._key_prefix + (self.b_rev,)
1403
        self.graph = Graph(self.vf)
3514.2.11 by John Arbash Meinel
Shortcut the case when one revision is in the ancestry of the other.
1404
        heads = self.graph.heads((self.a_key, self.b_key))
1405
        if len(heads) == 1:
1406
            # one side dominates, so we can just return its values, yay for
1407
            # per-file graphs
1408
            # Ideally we would know that before we get this far
1409
            self._head_key = heads.pop()
1410
            if self._head_key == self.a_key:
1411
                other = b_rev
1412
            else:
1413
                other = a_rev
1414
            mutter('found dominating revision for %s\n%s > %s', self.vf,
1415
                   self._head_key[-1], other)
1416
            self._weave = None
1417
        else:
1418
            self._head_key = None
1419
            self._build_weave()
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1420
1421
    def _precache_tip_lines(self):
1422
        # Turn this into a no-op, because we will do this later
1423
        pass
1424
1425
    def _find_recursive_lcas(self):
1426
        """Find all the ancestors back to a unique lca"""
1427
        cur_ancestors = (self.a_key, self.b_key)
1428
        # graph.find_lca(uncommon, keys) now returns plain NULL_REVISION,
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1429
        # rather than a key tuple. We will just map that directly to no common
1430
        # ancestors.
1431
        parent_map = {}
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1432
        while True:
1433
            next_lcas = self.graph.find_lca(*cur_ancestors)
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1434
            # Map a plain NULL_REVISION to a simple no-ancestors
1435
            if next_lcas == set([NULL_REVISION]):
1436
                next_lcas = ()
3514.2.9 by John Arbash Meinel
Add some debugging, and work on getting the graph right so we get the weave insertion order correct.
1437
            # Order the lca's based on when they were merged into the tip
1438
            # While the actual merge portion of weave merge uses a set() of
1439
            # active revisions, the order of insertion *does* effect the
1440
            # implicit ordering of the texts.
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1441
            for rev_key in cur_ancestors:
3514.2.9 by John Arbash Meinel
Add some debugging, and work on getting the graph right so we get the weave insertion order correct.
1442
                ordered_parents = tuple(self.graph.find_merge_order(rev_key,
1443
                                                                    next_lcas))
1444
                parent_map[rev_key] = ordered_parents
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1445
            if len(next_lcas) == 0:
1446
                break
1447
            elif len(next_lcas) == 1:
3514.2.9 by John Arbash Meinel
Add some debugging, and work on getting the graph right so we get the weave insertion order correct.
1448
                parent_map[list(next_lcas)[0]] = ()
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1449
                break
3514.2.10 by John Arbash Meinel
Handle more edge cases.
1450
            elif len(next_lcas) > 2:
3514.2.7 by John Arbash Meinel
Fix the failing test by implementing the fallback logic.
1451
                # More than 2 lca's, fall back to grabbing all nodes between
1452
                # this and the unique lca.
3514.2.16 by John Arbash Meinel
Review feedback from Ian.
1453
                mutter('More than 2 LCAs, falling back to all nodes for:'
1454
                       ' %s, %s\n=> %s', self.a_key, self.b_key, cur_ancestors)
3514.2.7 by John Arbash Meinel
Fix the failing test by implementing the fallback logic.
1455
                cur_lcas = next_lcas
1456
                while len(cur_lcas) > 1:
1457
                    cur_lcas = self.graph.find_lca(*cur_lcas)
1458
                if len(cur_lcas) == 0:
1459
                    # No common base to find, use the full ancestry
1460
                    unique_lca = None
1461
                else:
3514.2.8 by John Arbash Meinel
The insertion ordering into the weave has an impact on conflicts.
1462
                    unique_lca = list(cur_lcas)[0]
3514.2.14 by John Arbash Meinel
Bring in the code to collapse linear portions of the graph.
1463
                    if unique_lca == NULL_REVISION:
1464
                        # find_lca will return a plain 'NULL_REVISION' rather
1465
                        # than a key tuple when there is no common ancestor, we
1466
                        # prefer to just use None, because it doesn't confuse
1467
                        # _get_interesting_texts()
1468
                        unique_lca = None
3514.2.7 by John Arbash Meinel
Fix the failing test by implementing the fallback logic.
1469
                parent_map.update(self._find_unique_parents(next_lcas,
1470
                                                            unique_lca))
1471
                break
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1472
            cur_ancestors = next_lcas
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1473
        return parent_map
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1474
3514.2.7 by John Arbash Meinel
Fix the failing test by implementing the fallback logic.
1475
    def _find_unique_parents(self, tip_keys, base_key):
1476
        """Find ancestors of tip that aren't ancestors of base.
1477
        
1478
        :param tip_keys: Nodes that are interesting
1479
        :param base_key: Cull all ancestors of this node
1480
        :return: The parent map for all revisions between tip_keys and
1481
            base_key. base_key will be included. References to nodes outside of
1482
            the ancestor set will also be removed.
1483
        """
1484
        # TODO: this would be simpler if find_unique_ancestors took a list
1485
        #       instead of a single tip, internally it supports it, but it
1486
        #       isn't a "backwards compatible" api change.
1487
        if base_key is None:
1488
            parent_map = dict(self.graph.iter_ancestry(tip_keys))
3514.2.14 by John Arbash Meinel
Bring in the code to collapse linear portions of the graph.
1489
            # We remove NULL_REVISION because it isn't a proper tuple key, and
1490
            # thus confuses things like _get_interesting_texts, and our logic
1491
            # to add the texts into the memory weave.
1492
            if NULL_REVISION in parent_map:
1493
                parent_map.pop(NULL_REVISION)
3514.2.7 by John Arbash Meinel
Fix the failing test by implementing the fallback logic.
1494
        else:
1495
            interesting = set()
1496
            for tip in tip_keys:
1497
                interesting.update(
1498
                    self.graph.find_unique_ancestors(tip, [base_key]))
1499
            parent_map = self.graph.get_parent_map(interesting)
1500
            parent_map[base_key] = ()
3514.2.12 by John Arbash Meinel
Start refactoring into helper functions
1501
        culled_parent_map, child_map, tails = self._remove_external_references(
1502
            parent_map)
3514.2.13 by John Arbash Meinel
Add the ability to prune extra tails from the parent_map.
1503
        # Remove all the tails but base_key
3514.2.14 by John Arbash Meinel
Bring in the code to collapse linear portions of the graph.
1504
        if base_key is not None:
1505
            tails.remove(base_key)
1506
            self._prune_tails(culled_parent_map, child_map, tails)
1507
        # Now remove all the uninteresting 'linear' regions
3514.2.15 by John Arbash Meinel
Enable collapsing linear regions.
1508
        simple_map = _mod_graph.collapse_linear_regions(culled_parent_map)
1509
        return simple_map
3514.2.12 by John Arbash Meinel
Start refactoring into helper functions
1510
1511
    @staticmethod
1512
    def _remove_external_references(parent_map):
1513
        """Remove references that go outside of the parent map.
1514
1515
        :param parent_map: Something returned from Graph.get_parent_map(keys)
1516
        :return: (filtered_parent_map, child_map, tails)
1517
            filtered_parent_map is parent_map without external references
1518
            child_map is the {parent_key: [child_keys]} mapping
1519
            tails is a list of nodes that do not have any parents in the map
1520
        """
1521
        # TODO: The basic effect of this function seems more generic than
1522
        #       _PlanMerge. But the specific details of building a child_map,
1523
        #       and computing tails seems very specific to _PlanMerge.
1524
        #       Still, should this be in Graph land?
1525
        filtered_parent_map = {}
1526
        child_map = {}
1527
        tails = []
3514.2.7 by John Arbash Meinel
Fix the failing test by implementing the fallback logic.
1528
        for key, parent_keys in parent_map.iteritems():
3514.2.12 by John Arbash Meinel
Start refactoring into helper functions
1529
            culled_parent_keys = [p for p in parent_keys if p in parent_map]
1530
            if not culled_parent_keys:
1531
                tails.append(key)
1532
            for parent_key in culled_parent_keys:
1533
                child_map.setdefault(parent_key, []).append(key)
1534
            # TODO: Do we want to do this, it adds overhead for every node,
1535
            #       just to say that the node has no children
1536
            child_map.setdefault(key, [])
1537
            filtered_parent_map[key] = culled_parent_keys
1538
        return filtered_parent_map, child_map, tails
1539
3514.2.13 by John Arbash Meinel
Add the ability to prune extra tails from the parent_map.
1540
    @staticmethod
1541
    def _prune_tails(parent_map, child_map, tails_to_remove):
1542
        """Remove tails from the parent map.
1543
        
1544
        This will remove the supplied revisions until no more children have 0
1545
        parents.
1546
1547
        :param parent_map: A dict of {child: [parents]}, this dictionary will
1548
            be modified in place.
1549
        :param tails_to_remove: A list of tips that should be removed,
1550
            this list will be consumed
1551
        :param child_map: The reverse dict of parent_map ({parent: [children]})
1552
            this dict will be modified
1553
        :return: None, parent_map will be modified in place.
1554
        """
1555
        while tails_to_remove:
1556
            next = tails_to_remove.pop()
1557
            parent_map.pop(next)
1558
            children = child_map.pop(next)
1559
            for child in children:
1560
                child_parents = parent_map[child]
1561
                child_parents.remove(next)
1562
                if len(child_parents) == 0:
1563
                    tails_to_remove.append(child)
3514.2.7 by John Arbash Meinel
Fix the failing test by implementing the fallback logic.
1564
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1565
    def _get_interesting_texts(self, parent_map):
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1566
        """Return a dict of texts we are interested in.
1567
1568
        Note that the input is in key tuples, but the output is in plain
1569
        revision ids.
1570
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1571
        :param parent_map: The output from _find_recursive_lcas
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1572
        :return: A dict of {'revision_id':lines} as returned by
1573
            _PlanMergeBase.get_lines()
1574
        """
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1575
        all_revision_keys = set(parent_map)
1576
        all_revision_keys.add(self.a_key)
1577
        all_revision_keys.add(self.b_key)
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1578
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1579
        # Everything else is in 'keys' but get_lines is in 'revision_ids'
1580
        all_texts = self.get_lines([k[-1] for k in all_revision_keys])
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1581
        return all_texts
1582
1583
    def _build_weave(self):
1584
        from bzrlib import weave
1585
        self._weave = weave.Weave(weave_name='in_memory_weave',
1586
                                  allow_reserved=True)
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1587
        parent_map = self._find_recursive_lcas()
1588
1589
        all_texts = self._get_interesting_texts(parent_map)
1590
1591
        # Note: Unfortunately, the order given by topo_sort will effect the
1592
        # ordering resolution in the output. Specifically, if you add A then B,
1593
        # then in the output text A lines will show up before B lines. And, of
1594
        # course, topo_sort doesn't guarantee any real ordering.
3514.2.8 by John Arbash Meinel
The insertion ordering into the weave has an impact on conflicts.
1595
        # So we use merge_sort, and add a fake node on the tip.
1596
        # This ensures that left-hand parents will always be inserted into the
1597
        # weave before right-hand parents.
1598
        tip_key = self._key_prefix + (_mod_revision.CURRENT_REVISION,)
1599
        parent_map[tip_key] = (self.a_key, self.b_key)
1600
1601
        for seq_num, key, depth, eom in reversed(tsort.merge_sort(parent_map,
1602
                                                                  tip_key)):
1603
            if key == tip_key:
1604
                continue
3514.2.9 by John Arbash Meinel
Add some debugging, and work on getting the graph right so we get the weave insertion order correct.
1605
        # for key in tsort.topo_sort(parent_map):
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
1606
            parent_keys = parent_map[key]
1607
            revision_id = key[-1]
1608
            parent_ids = [k[-1] for k in parent_keys]
1609
            self._weave.add_lines(revision_id, parent_ids,
1610
                                  all_texts[revision_id])
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1611
1612
    def plan_merge(self):
1613
        """Generate a 'plan' for merging the two revisions.
1614
1615
        This involves comparing their texts and determining the cause of
1616
        differences.  If text A has a line and text B does not, then either the
1617
        line was added to text A, or it was deleted from B.  Once the causes
1618
        are combined, they are written out in the format described in
1619
        VersionedFile.plan_merge
1620
        """
1621
        if self._head_key is not None: # There was a single head
1622
            if self._head_key == self.a_key:
1623
                plan = 'new-a'
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1624
            else:
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1625
                if self._head_key != self.b_key:
1626
                    raise AssertionError('There was an invalid head: %s != %s'
1627
                                         % (self.b_key, self._head_key))
1628
                plan = 'new-b'
3514.2.16 by John Arbash Meinel
Review feedback from Ian.
1629
            head_rev = self._head_key[-1]
1630
            lines = self.get_lines([head_rev])[head_rev]
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1631
            return ((plan, line) for line in lines)
1632
        return self._weave.plan_merge(self.a_rev, self.b_rev)
3062.2.1 by Aaron Bentley
Add support for plan-merge with a base
1633
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1634
1635
class _PlanLCAMerge(_PlanMergeBase):
1636
    """
3144.3.7 by Aaron Bentley
Update from review
1637
    This merge algorithm differs from _PlanMerge in that:
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1638
    1. comparisons are done against LCAs only
1639
    2. cases where a contested line is new versus one LCA but old versus
3144.3.7 by Aaron Bentley
Update from review
1640
       another are marked as conflicts, by emitting the line as conflicted-a
1641
       or conflicted-b.
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1642
1643
    This is faster, and hopefully produces more useful output.
1644
    """
1645
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1646
    def __init__(self, a_rev, b_rev, vf, key_prefix, graph):
1647
        _PlanMergeBase.__init__(self, a_rev, b_rev, vf, key_prefix)
1648
        lcas = graph.find_lca(key_prefix + (a_rev,), key_prefix + (b_rev,))
3350.6.5 by Robert Collins
Update to bzr.dev.
1649
        self.lcas = set()
1650
        for lca in lcas:
1651
            if lca == NULL_REVISION:
1652
                self.lcas.add(lca)
1653
            else:
1654
                self.lcas.add(lca[-1])
3144.3.7 by Aaron Bentley
Update from review
1655
        for lca in self.lcas:
3287.17.1 by John Arbash Meinel
Fix bug #235715 by using the empty list as the text for a base of NULL_REVISION.
1656
            if _mod_revision.is_null(lca):
1657
                lca_lines = []
1658
            else:
3350.6.5 by Robert Collins
Update to bzr.dev.
1659
                lca_lines = self.get_lines([lca])[lca]
3144.3.7 by Aaron Bentley
Update from review
1660
            matcher = patiencediff.PatienceSequenceMatcher(None, self.lines_a,
1661
                                                           lca_lines)
1662
            blocks = list(matcher.get_matching_blocks())
1663
            self._cached_matching_blocks[(a_rev, lca)] = blocks
1664
            matcher = patiencediff.PatienceSequenceMatcher(None, self.lines_b,
1665
                                                           lca_lines)
1666
            blocks = list(matcher.get_matching_blocks())
1667
            self._cached_matching_blocks[(b_rev, lca)] = blocks
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1668
3144.3.7 by Aaron Bentley
Update from review
1669
    def _determine_status(self, revision_id, unique_line_numbers):
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1670
        """Determines the status unique lines versus all lcas.
1671
1672
        Basically, determines why the line is unique to this revision.
1673
1674
        A line may be determined new, killed, or both.
1675
3144.3.7 by Aaron Bentley
Update from review
1676
        If a line is determined new, that means it was not present in at least
1677
        one LCA, and is not present in the other merge revision.
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1678
1679
        If a line is determined killed, that means the line was present in
1680
        at least one LCA.
1681
1682
        If a line is killed and new, this indicates that the two merge
1683
        revisions contain differing conflict resolutions.
3144.3.7 by Aaron Bentley
Update from review
1684
        :param revision_id: The id of the revision in which the lines are
1685
            unique
1686
        :param unique_line_numbers: The line numbers of unique lines.
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1687
        :return a tuple of (new_this, killed_other):
1688
        """
1689
        new = set()
1690
        killed = set()
3144.3.7 by Aaron Bentley
Update from review
1691
        unique_line_numbers = set(unique_line_numbers)
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1692
        for lca in self.lcas:
1693
            blocks = self._get_matching_blocks(revision_id, lca)
1694
            unique_vs_lca, _ignored = self._unique_lines(blocks)
3144.3.7 by Aaron Bentley
Update from review
1695
            new.update(unique_line_numbers.intersection(unique_vs_lca))
1696
            killed.update(unique_line_numbers.difference(unique_vs_lca))
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1697
        return new, killed