~bzr-pqm/bzr/bzr.dev

3350.6.10 by Martin Pool
VersionedFiles review cleanups
1
# Copyright (C) 2005, 2006, 2008 Canonical Ltd
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
2
#
1110 by Martin Pool
- merge aaron's merge improvements:
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
7
#
1110 by Martin Pool
- merge aaron's merge improvements:
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
12
#
1110 by Martin Pool
- merge aaron's merge improvements:
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
1545.2.3 by Aaron Bentley
Updated following j-a-meinel's comments
17
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
18
import errno
19
from itertools import chain
1185.1.2 by Martin Pool
- merge various windows and other fixes from Ollie Rutherfurd
20
import os
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
21
import warnings
1113 by Martin Pool
- fix is_ancestor import problem in merge
22
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
23
from bzrlib import (
1551.19.17 by Aaron Bentley
Add debugging flag for merges
24
    debug,
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
25
    errors,
3514.2.14 by John Arbash Meinel
Bring in the code to collapse linear portions of the graph.
26
    graph as _mod_graph,
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
27
    osutils,
1551.15.46 by Aaron Bentley
Move plan merge to tree
28
    patiencediff,
2221.4.15 by Aaron Bentley
Use RegistryOption for merge type
29
    registry,
2598.5.1 by Aaron Bentley
Start eliminating the use of None to indicate null revision
30
    revision as _mod_revision,
3514.2.5 by John Arbash Meinel
Switch to the get_parent_map design I had settled on.
31
    tsort,
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
32
    )
1185.11.5 by John Arbash Meinel
Merged up-to-date against mainline, still broken.
33
from bzrlib.branch import Branch
1666.1.4 by Robert Collins
* 'Metadir' is now the default disk format. This improves behaviour in
34
from bzrlib.conflicts import ConflictList, Conflict
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
35
from bzrlib.errors import (BzrCommandError,
1534.4.28 by Robert Collins
first cut at merge from integration.
36
                           BzrError,
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
37
                           NoCommonAncestor,
38
                           NoCommits,
1534.4.28 by Robert Collins
first cut at merge from integration.
39
                           NoSuchRevision,
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
40
                           NoSuchFile,
1545.2.6 by Aaron Bentley
Removed _merge, renamed MergeConflictHandler to _MergeConflictHandler
41
                           NotBranchError,
1185.33.27 by Martin Pool
[merge] much integrated work from robert and john
42
                           NotVersionedError,
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
43
                           UnrelatedBranches,
1534.10.12 by Aaron Bentley
Merge produces new conflicts
44
                           UnsupportedOperation,
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
45
                           WorkingTreeNotRevision,
1558.15.3 by Aaron Bentley
Handle binary files for diff3 merges
46
                           BinaryFile,
1534.4.28 by Robert Collins
first cut at merge from integration.
47
                           )
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
48
from bzrlib.graph import Graph
1534.7.167 by Aaron Bentley
PEP8 and comment cleanups
49
from bzrlib.merge3 import Merge3
1996.3.18 by John Arbash Meinel
Now that mkdtemp and rmtree are lazy, they should not be directly improted.
50
from bzrlib.osutils import rename, pathjoin
1551.2.32 by Aaron Bentley
Handle progress phases more nicely in merge
51
from progress import DummyProgress, ProgressPhase
3052.1.3 by John Arbash Meinel
deprecate revision.is_ancestor, update the callers and the tests.
52
from bzrlib.revision import (NULL_REVISION, ensure_null)
1558.15.5 by Aaron Bentley
Fixed binary handling in weave merge
53
from bzrlib.textfile import check_text_lines
3200.1.1 by James Westby
Make pull --quiet more quiet. Fixes #185907.
54
from bzrlib.trace import mutter, warning, note, is_quiet
3008.1.9 by Michael Hudson
wanton hacking that lets me write an efficient version of get_diff_as_merged
55
from bzrlib.transform import (TransformPreview, TreeTransform,
56
                              resolve_conflicts, cook_conflicts,
2590.2.8 by Aaron Bentley
Restore conflict handling changes
57
                              conflict_pass, FinalPaths, create_by_entry,
58
                              unique_add, ROOT_PARENT)
1551.15.46 by Aaron Bentley
Move plan merge to tree
59
from bzrlib.versionedfile import PlanWeaveMerge
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
60
from bzrlib import ui
1545.2.6 by Aaron Bentley
Removed _merge, renamed MergeConflictHandler to _MergeConflictHandler
61
62
# TODO: Report back as changes are merged in
63
2325.3.1 by John Arbash Meinel
New helper function for merge, which allows us to re-use the existing workingtree, rather than opening it again.
64
1185.35.4 by Aaron Bentley
Implemented remerge
65
def transform_tree(from_tree, to_tree, interesting_ids=None):
    """Drive merge_inner using from_tree as both the 'this' and third tree.

    :param from_tree: Tree whose branch is handed to merge_inner; it is also
        passed as the third positional argument and as this_tree.
    :param to_tree: Tree passed as merge_inner's second positional argument.
    :param interesting_ids: Forwarded unchanged to merge_inner.
    """
    merge_options = dict(ignore_zero=True,
                         interesting_ids=interesting_ids,
                         this_tree=from_tree)
    merge_inner(from_tree.branch, to_tree, from_tree, **merge_options)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
68
1457.1.12 by Robert Collins
Update comment to reflect author.
69
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
70
class Merger(object):
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
71
    def __init__(self, this_branch, other_tree=None, base_tree=None,
                 this_tree=None, pb=DummyProgress(), change_reporter=None,
                 recurse='down', revision_graph=None):
        """Record the inputs of a merge into this_branch.

        :param this_branch: Branch being merged into.  Its last_revision(),
            passed through ensure_null, is stored as this_basis.
        :param other_tree: Stored as other_tree.
        :param base_tree: Stored as base_tree.
        :param this_tree: Stored as this_tree.
        :param pb: A progress indicator, stored as _pb.  The default is a
            single DummyProgress instance created when the class is defined.
        :param change_reporter: Stored as change_reporter.
        :param recurse: Stored as recurse.
        :param revision_graph: A precomputed graph; when None, the
            revision_graph property asks this_branch's repository for one on
            first use.

        base_rev_id, other_rev_id and other_basis are not initialised here;
        they are assigned by the set_other*/set_base*/find_base methods and
        by the from_* factory methods.
        """
        object.__init__(self)

        # The THIS side of the merge.
        self.this_branch = this_branch
        self.this_tree = this_tree
        self.this_basis = _mod_revision.ensure_null(
            this_branch.last_revision())
        self.this_rev_id = None
        self.this_revision_tree = None
        self.this_basis_tree = None

        # The OTHER and BASE sides.
        self.other_branch = None
        self.other_tree = other_tree
        self.base_tree = base_tree

        # Options; all start switched off / unrestricted.
        self.ignore_zero = False
        self.backup_files = False
        self.show_base = False
        self.reprocess = False
        self.interesting_ids = None
        self.interesting_files = None
        self.recurse = recurse

        # Reporting.
        self._pb = pb
        self.pp = None
        self.change_reporter = change_reporter

        # Caches; the two ancestry answers are computed lazily by the
        # base_is_ancestor / base_is_other_ancestor properties.
        self._cached_trees = {}
        self._revision_graph = revision_graph
        self._base_is_ancestor = None
        self._base_is_other_ancestor = None
99
100
    @property
101
    def revision_graph(self):
102
        if self._revision_graph is None:
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
103
            self._revision_graph = self.this_branch.repository.get_graph()
3146.5.1 by Aaron Bentley
Make merge --uncommitted work with merge-type weave
104
        return self._revision_graph
105
106
    def _set_base_is_ancestor(self, value):
107
        self._base_is_ancestor = value
108
109
    def _get_base_is_ancestor(self):
110
        if self._base_is_ancestor is None:
111
            self._base_is_ancestor = self.revision_graph.is_ancestor(
112
                self.base_rev_id, self.this_basis)
113
        return self._base_is_ancestor
114
115
    base_is_ancestor = property(_get_base_is_ancestor, _set_base_is_ancestor)
116
117
    def _set_base_is_other_ancestor(self, value):
118
        self._base_is_other_ancestor = value
119
120
    def _get_base_is_other_ancestor(self):
121
        if self._base_is_other_ancestor is None:
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
122
            if self.other_basis is None:
123
                return True
124
            self._base_is_other_ancestor = self.revision_graph.is_ancestor(
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
125
                self.base_rev_id, self.other_basis)
3146.5.1 by Aaron Bentley
Make merge --uncommitted work with merge-type weave
126
        return self._base_is_other_ancestor
127
128
    base_is_other_ancestor = property(_get_base_is_other_ancestor,
129
                                      _set_base_is_other_ancestor)
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
130
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
131
    @staticmethod
    def from_uncommitted(tree, other_tree, pb):
        """Build a Merger that merges other_tree's uncommitted changes.

        The base of the merge is other_tree's basis tree, so the changes
        merged are those between that basis and other_tree itself.

        :param tree: The tree to merge into
        :param other_tree: The tree to get uncommitted changes from
        :param pb: A progress indicator
        :return: A Merger with base_rev_id and other_basis set to the basis
            tree's revision id and other_rev_id set to None.
        """
        target_branch = tree.branch
        other_basis_tree = other_tree.basis_tree()
        merger = Merger(this_branch=target_branch, other_tree=other_tree,
                        base_tree=other_basis_tree, this_tree=tree, pb=pb)
        basis_revision_id = merger.base_tree.get_revision_id()
        merger.base_rev_id = basis_revision_id
        # OTHER is a tree with uncommitted changes, so it has no revision id.
        merger.other_rev_id = None
        merger.other_basis = basis_revision_id
        return merger
145
146
    @classmethod
147
    def from_mergeable(klass, tree, mergeable, pb):
1551.15.74 by Aaron Bentley
Textual updates from review
148
        """Return a Merger for a bundle or merge directive.
149
150
        :param tree: The tree to merge changes into
151
        :param mergeable: A merge directive or bundle
152
        :param pb: A progress indicator
153
        """
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
154
        mergeable.install_revisions(tree.branch.repository)
155
        base_revision_id, other_revision_id, verified =\
156
            mergeable.get_merge_request(tree.branch.repository)
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
157
        revision_graph = tree.branch.repository.get_graph()
1551.19.44 by Aaron Bentley
Fix handling of old merge directives with stricter get_parent_map
158
        if base_revision_id is not None:
159
            if (base_revision_id != _mod_revision.NULL_REVISION and
160
                revision_graph.is_ancestor(
161
                base_revision_id, tree.branch.last_revision())):
162
                base_revision_id = None
163
            else:
164
                warning('Performing cherrypick')
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
165
        merger = klass.from_revision_ids(pb, tree, other_revision_id,
3146.5.3 by Aaron Bentley
Avoid retrieving revision graph twice
166
                                         base_revision_id, revision_graph=
167
                                         revision_graph)
1551.15.67 by Aaron Bentley
Stop using _merge_helper for merging
168
        return merger, verified
169
170
    @staticmethod
    def from_revision_ids(pb, tree, other, base=None, other_branch=None,
                          base_branch=None, revision_graph=None):
        """Build a Merger from explicit revision-ids.

        :param pb: A progress indicator
        :param tree: The tree to merge changes into
        :param other: The revision-id to use as OTHER
        :param base: The revision-id to use as BASE.  If not specified, will
            be auto-selected.
        :param other_branch: A branch containing the other revision-id.  If
            not supplied, tree.branch is used.
        :param base_branch: A branch containing the base revision-id.  If
            not supplied, other_branch or tree.branch will be used.
        :param revision_graph: If you have a revision_graph precomputed, pass
            it in, otherwise it will be created for you.
        :return: The configured Merger.
        """
        merger = Merger(tree.branch, this_tree=tree, pb=pb,
                        revision_graph=revision_graph)

        source_branch = other_branch
        if source_branch is None:
            source_branch = tree.branch
        merger.set_other_revision(other, source_branch)

        if base is None:
            # No explicit base: let the merger choose one.
            merger.find_base()
            return merger

        branch_with_base = base_branch
        if branch_with_base is None:
            branch_with_base = source_branch
        merger.set_base_revision(base, branch_with_base)
        return merger
199
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
200
    def revision_tree(self, revision_id, branch=None):
201
        if revision_id not in self._cached_trees:
202
            if branch is None:
203
                branch = self.this_branch
204
            try:
205
                tree = self.this_tree.revision_tree(revision_id)
206
            except errors.NoSuchRevisionInTree:
207
                tree = branch.repository.revision_tree(revision_id)
208
            self._cached_trees[revision_id] = tree
209
        return self._cached_trees[revision_id]
210
2485.8.58 by Vincent Ladeuil
merge bzr.dev@1617
211
    def _get_tree(self, treespec, possible_transports=None):
        """Open the branch and tree named by a (location, revno) pair.

        :param treespec: A 2-sequence of location and revno.  A revno of
            None selects the working tree at location; -1 selects the
            branch's last revision; any other value is looked up with
            branch.get_rev_id().
        :param possible_transports: Passed to Branch.open_containing; not
            used when the working tree is opened.
        :return: A (branch, tree) pair.
        """
        from bzrlib import workingtree
        location, revno = treespec
        if revno is None:
            working = workingtree.WorkingTree.open_containing(location)[0]
            return working.branch, working
        source = Branch.open_containing(location, possible_transports)[0]
        if revno == -1:
            raw_revision_id = source.last_revision()
        else:
            raw_revision_id = source.get_rev_id(revno)
        tree = self.revision_tree(ensure_null(raw_revision_id), source)
        return source, tree
1185.12.83 by Aaron Bentley
Preliminary weave merge support
224
225
    def ensure_revision_trees(self):
226
        if self.this_revision_tree is None:
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
227
            self.this_basis_tree = self.revision_tree(self.this_basis)
1185.35.5 by Aaron Bentley
Made weave merge succeed if interesting files match history
228
            if self.this_basis == self.this_rev_id:
229
                self.this_revision_tree = self.this_basis_tree
230
1185.12.83 by Aaron Bentley
Preliminary weave merge support
231
        if self.other_rev_id is None:
232
            other_basis_tree = self.revision_tree(self.other_basis)
1852.10.3 by Robert Collins
Remove all uses of compare_trees and replace with Tree.changes_from throughout bzrlib.
233
            changes = other_basis_tree.changes_from(self.other_tree)
1185.12.83 by Aaron Bentley
Preliminary weave merge support
234
            if changes.has_changed():
235
                raise WorkingTreeNotRevision(self.this_tree)
1773.4.1 by Martin Pool
Add pyflakes makefile target; fix many warnings
236
            other_rev_id = self.other_basis
1185.12.83 by Aaron Bentley
Preliminary weave merge support
237
            self.other_tree = other_basis_tree
238
239
    def file_revisions(self, file_id):
240
        self.ensure_revision_trees()
241
        def get_id(tree, file_id):
242
            revision_id = tree.inventory[file_id].revision
243
            return revision_id
1185.35.5 by Aaron Bentley
Made weave merge succeed if interesting files match history
244
        if self.this_rev_id is None:
245
            if self.this_basis_tree.get_file_sha1(file_id) != \
246
                self.this_tree.get_file_sha1(file_id):
247
                raise WorkingTreeNotRevision(self.this_tree)
248
249
        trees = (self.this_basis_tree, self.other_tree)
1185.12.83 by Aaron Bentley
Preliminary weave merge support
250
        return [get_id(tree, file_id) for tree in trees]
251
1185.82.44 by Aaron Bentley
Switch to merge_changeset in test suite
252
    def check_basis(self, check_clean, require_commits=True):
253
        if self.this_basis is None and require_commits is True:
2249.3.1 by John Arbash Meinel
Mention using 'bzr pull' if there are no commits in current branch
254
            raise BzrCommandError("This branch has no commits."
255
                                  " (perhaps you would prefer 'bzr pull')")
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
256
        if check_clean:
257
            self.compare_basis()
258
            if self.this_basis != self.this_rev_id:
2796.2.1 by Aaron Bentley
Begin work on reconfigure command
259
                raise errors.UncommittedChanges(self.this_tree)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
260
261
    def compare_basis(self):
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
262
        try:
263
            basis_tree = self.revision_tree(self.this_tree.last_revision())
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
264
        except errors.NoSuchRevision:
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
265
            basis_tree = self.this_tree.basis_tree()
266
        changes = self.this_tree.changes_from(basis_tree)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
267
        if not changes.has_changed():
268
            self.this_rev_id = self.this_basis
269
270
    def set_interesting_files(self, file_list):
2590.2.7 by Aaron Bentley
Misc cleanup
271
        self.interesting_files = file_list
1457.1.8 by Robert Collins
Replace the WorkingTree.revert method algorithm with a call to merge_inner.
272
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
273
    def set_pending(self):
2644.1.1 by Wouter van Heyst
Fix bug #127115 by checking for self.other_rev_id being None in Merger.set_pending()
274
        if not self.base_is_ancestor or not self.base_is_other_ancestor or self.other_rev_id is None:
1185.12.77 by Aaron Bentley
Prevented all ancestors from being marked as pending merges
275
            return
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
276
        self._add_parent()
277
278
    def _add_parent(self):
279
        new_parents = self.this_tree.get_parent_ids() + [self.other_rev_id]
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
280
        new_parent_trees = []
281
        for revision_id in new_parents:
282
            try:
283
                tree = self.revision_tree(revision_id)
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
284
            except errors.NoSuchRevision:
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
285
                tree = None
286
            else:
287
                tree.lock_read()
288
            new_parent_trees.append((revision_id, tree))
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
289
        try:
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
290
            self.this_tree.set_parent_trees(new_parent_trees,
291
                                            allow_leftmost_as_ghost=True)
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
292
        finally:
293
            for _revision_id, tree in new_parent_trees:
2590.2.20 by Aaron Bentley
Fix handling of ghost base trees
294
                if tree is not None:
295
                    tree.unlock()
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
296
2485.8.37 by Vincent Ladeuil
Fix merge multiple connections. Test suite *not* passing (sftp
297
    def set_other(self, other_revision, possible_transports=None):
1979.2.1 by Robert Collins
(robertc) adds a convenience method "merge_from_branch" to WorkingTree.
298
        """Set the revision and tree to merge from.
299
300
        This sets the other_tree, other_rev_id, other_basis attributes.
301
302
        :param other_revision: The [path, revision] list to merge from.
303
        """
2485.8.58 by Vincent Ladeuil
merge bzr.dev@1617
304
        self.other_branch, self.other_tree = self._get_tree(other_revision,
305
                                                            possible_transports)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
306
        if other_revision[1] == -1:
2598.5.4 by Aaron Bentley
Restore original Branch.last_revision behavior, fix bits that care
307
            self.other_rev_id = _mod_revision.ensure_null(
308
                self.other_branch.last_revision())
2598.5.1 by Aaron Bentley
Start eliminating the use of None to indicate null revision
309
            if _mod_revision.is_null(self.other_rev_id):
2100.3.31 by Aaron Bentley
Merged bzr.dev (17 tests failing)
310
                raise NoCommits(self.other_branch)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
311
            self.other_basis = self.other_rev_id
312
        elif other_revision[1] is not None:
2100.3.31 by Aaron Bentley
Merged bzr.dev (17 tests failing)
313
            self.other_rev_id = self.other_branch.get_rev_id(other_revision[1])
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
314
            self.other_basis = self.other_rev_id
315
        else:
316
            self.other_rev_id = None
2100.3.31 by Aaron Bentley
Merged bzr.dev (17 tests failing)
317
            self.other_basis = self.other_branch.last_revision()
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
318
            if self.other_basis is None:
2100.3.31 by Aaron Bentley
Merged bzr.dev (17 tests failing)
319
                raise NoCommits(self.other_branch)
2590.2.11 by Aaron Bentley
Aggressively cache trees, use dirstate. re-mplement _add_parent.
320
        if self.other_rev_id is not None:
321
            self._cached_trees[self.other_rev_id] = self.other_tree
2590.2.19 by Aaron Bentley
Avoid fetch within a repository
322
        self._maybe_fetch(self.other_branch,self.this_branch, self.other_basis)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
323
2100.3.29 by Aaron Bentley
Get merge working initially
324
    def set_other_revision(self, revision_id, other_branch):
325
        """Set 'other' based on a branch and revision id
326
327
        :param revision_id: The revision to use for a tree
328
        :param other_branch: The branch containing this tree
329
        """
330
        self.other_rev_id = revision_id
331
        self.other_branch = other_branch
2590.2.19 by Aaron Bentley
Avoid fetch within a repository
332
        self._maybe_fetch(other_branch, self.this_branch, self.other_rev_id)
2100.3.29 by Aaron Bentley
Get merge working initially
333
        self.other_tree = self.revision_tree(revision_id)
334
        self.other_basis = revision_id
335
2520.4.110 by Aaron Bentley
Implement cherrypick support for merge directives
336
    def set_base_revision(self, revision_id, branch):
337
        """Set 'base' based on a branch and revision id
338
339
        :param revision_id: The revision to use for a tree
340
        :param branch: The branch containing this tree
341
        """
342
        self.base_rev_id = revision_id
343
        self.base_branch = branch
2520.4.132 by Aaron Bentley
Merge from bzr.dev
344
        self._maybe_fetch(branch, self.this_branch, revision_id)
2520.4.110 by Aaron Bentley
Implement cherrypick support for merge directives
345
        self.base_tree = self.revision_tree(revision_id)
2520.4.132 by Aaron Bentley
Merge from bzr.dev
346
2590.2.19 by Aaron Bentley
Avoid fetch within a repository
347
    def _maybe_fetch(self, source, target, revision_id):
2665.5.2 by Aaron Bentley
Switch commit and merge to Repository.has_same_location
348
        if not source.repository.has_same_location(target.repository):
2590.2.19 by Aaron Bentley
Avoid fetch within a repository
349
            target.fetch(source, revision_id)
2520.4.110 by Aaron Bentley
Implement cherrypick support for merge directives
350
1185.82.25 by Aaron Bentley
Added changeset-merging functionality
351
    def find_base(self):
        """Pick the base revision automatically and load its tree.

        If either this_basis or other_basis is the null revision, the base
        is the null revision.  Otherwise the base is the unique LCA that
        revision_graph reports for the two; a warning is issued when that
        took more than one step.

        Sets base_rev_id and base_tree, and sets both base_is_ancestor and
        base_is_other_ancestor to True.

        :raises UnrelatedBranches: if the unique LCA is the null revision.
        """
        this_tip = ensure_null(self.this_basis)
        other_tip = ensure_null(self.other_basis)
        if NULL_REVISION in [this_tip, other_tip]:
            self.base_rev_id = NULL_REVISION
        else:
            lca, steps = self.revision_graph.find_unique_lca(
                this_tip, other_tip, count_steps=True)
            self.base_rev_id = lca
            if lca == NULL_REVISION:
                raise UnrelatedBranches()
            if steps > 1:
                warning('Warning: criss-cross merge encountered.  See bzr'
                        ' help criss-cross.')
        self.base_tree = self.revision_tree(self.base_rev_id)
        # Store both answers so the lazy ancestry properties do not query
        # the graph for this base.
        self.base_is_other_ancestor = True
        self.base_is_ancestor = True
1185.82.25 by Aaron Bentley
Added changeset-merging functionality
367
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
368
    def set_base(self, base_revision):
        """Set the base revision to use for the merge.

        With [None, None] the base is chosen by find_base().  Otherwise the
        named tree becomes base_tree, base_rev_id is derived from the
        revision number, and the base revision is fetched into this_branch
        if the base branch uses a different repository.

        :param base_revision: A 2-list containing a path and revision number.
            A revision number of -1 means the branch's last revision; None
            (with a path) sets base_rev_id to the null revision.
        """
        if base_revision == [None, None]:
            # Logged only on this path: the message is untrue when the
            # caller did supply a base.
            mutter("doing merge() with no base_revision specified")
            self.find_base()
        else:
            base_branch, self.base_tree = self._get_tree(base_revision)
            if base_revision[1] == -1:
                self.base_rev_id = base_branch.last_revision()
            elif base_revision[1] is None:
                self.base_rev_id = _mod_revision.NULL_REVISION
            else:
                self.base_rev_id = _mod_revision.ensure_null(
                    base_branch.get_rev_id(base_revision[1]))
            self._maybe_fetch(base_branch, self.this_branch, self.base_rev_id)
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
386
3008.1.8 by Michael Hudson
extract merger creation into a method
387
    def make_merger(self):
        """Instantiate self.merge_type for this merge without running it.

        The keyword arguments are chosen from the capability flags the
        merge type advertises (requires_base, supports_reprocess,
        supports_show_base, supports_cherrypick), and do_merge=False is
        always passed.

        :return: A new instance of self.merge_type.
        :raises BzrError: If reprocess or show_base is set but the merge
            type does not support it.
        :raises errors.CannotReverseCherrypick: If the merge type sets
            supports_reverse_cherrypick to a false value and
            self.base_is_other_ancestor is false.
        """
        merge_type = self.merge_type
        options = {
            'working_tree': self.this_tree,
            'this_tree': self.this_tree,
            'other_tree': self.other_tree,
            'interesting_ids': self.interesting_ids,
            'interesting_files': self.interesting_files,
            'pp': self.pp,
            'do_merge': False,
        }
        if merge_type.requires_base:
            options['base_tree'] = self.base_tree
        if merge_type.supports_reprocess:
            options['reprocess'] = self.reprocess
        elif self.reprocess:
            raise BzrError("Conflict reduction is not supported for merge"
                           " type %s." % self.merge_type)
        if merge_type.supports_show_base:
            options['show_base'] = self.show_base
        elif self.show_base:
            raise BzrError("Showing base is not supported for this"
                           " merge type. %s" % self.merge_type)
        # Merge types that do not declare the flag are assumed to support
        # reverse cherrypicks.
        if not (getattr(merge_type, 'supports_reverse_cherrypick', True)
                or self.base_is_other_ancestor):
            raise errors.CannotReverseCherrypick()
        if merge_type.supports_cherrypick:
            options['cherrypick'] = not (self.base_is_ancestor and
                                         self.base_is_other_ancestor)
        options['pb'] = self._pb
        options['change_reporter'] = self.change_reporter
        return merge_type(**options)
415
416
    def do_merge(self):
        """Run the merge and report the number of conflicts.

        Takes a tree-write lock on this_tree and read locks on base_tree
        and other_tree (when they are not None), builds the merger with
        self.make_merger() and runs it.  When self.recurse is 'down', the
        nested trees referenced by this_tree are merged as well.

        Each lock is released even if acquiring a later lock fails;
        previously a failing lock_read() left the earlier locks held.

        :return: The number of cooked conflicts of the top-level merge.
            The results of nested-tree merges are not included.
        """
        self.this_tree.lock_tree_write()
        try:
            if self.base_tree is not None:
                self.base_tree.lock_read()
            try:
                if self.other_tree is not None:
                    self.other_tree.lock_read()
                try:
                    merge = self.make_merger()
                    merge.do_merge()
                    if self.recurse == 'down':
                        self._do_merge_into_nested_trees()
                finally:
                    if self.other_tree is not None:
                        self.other_tree.unlock()
            finally:
                if self.base_tree is not None:
                    self.base_tree.unlock()
        finally:
            self.this_tree.unlock()
        conflict_count = len(merge.cooked_conflicts)
        if conflict_count == 0:
            if not self.ignore_zero and not is_quiet():
                note("All changes applied successfully.")
        else:
            note("%d conflicts encountered." % conflict_count)
        return conflict_count

    def _do_merge_into_nested_trees(self):
        """Merge every nested tree of this_tree whose reference changed."""
        for relpath, file_id in self.this_tree.iter_references():
            sub_tree = self.this_tree.get_nested_tree(file_id, relpath)
            other_revision = self.other_tree.get_reference_revision(
                file_id, relpath)
            if other_revision == sub_tree.last_revision():
                # The nested tree is already at the revision OTHER refers to.
                continue
            sub_merge = Merger(sub_tree.branch, this_tree=sub_tree)
            sub_merge.merge_type = self.merge_type
            other_branch = self.other_branch.reference_parent(file_id,
                                                              relpath)
            sub_merge.set_other_revision(other_revision, other_branch)
            base_revision = self.base_tree.get_reference_revision(file_id)
            sub_merge.base_tree = \
                sub_tree.branch.repository.revision_tree(base_revision)
            sub_merge.base_rev_id = base_revision
            sub_merge.do_merge()
1185.12.76 by Aaron Bentley
Refactored merge and merge_inner to use Merger
455
1545.2.4 by Aaron Bentley
PEP8 fixes
456
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
457
class Merge3Merger(object):
1534.7.167 by Aaron Bentley
PEP8 and comment cleanups
458
    """Three-way merger that uses the merge3 text merger"""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
459
    requires_base = True
460
    supports_reprocess = True
461
    supports_show_base = True
462
    history_based = False
3249.3.1 by John Arbash Meinel
Implement cherrypick support for Merge3
463
    supports_cherrypick = True
3062.2.7 by Aaron Bentley
Prevent reverse cherry-picking with weave
464
    supports_reverse_cherrypick = True
2590.2.7 by Aaron Bentley
Misc cleanup
465
    winner_idx = {"this": 2, "other": 1, "conflict": 1}
1534.7.167 by Aaron Bentley
PEP8 and comment cleanups
466
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
467
    def __init__(self, working_tree, this_tree, base_tree, other_tree,
                 interesting_ids=None, reprocess=False, show_base=False,
                 pb=DummyProgress(), pp=None, change_reporter=None,
                 interesting_files=None, do_merge=True,
                 cherrypick=False):
        """Initialize the merger object and, by default, perform the merge.

        :param working_tree: The working tree to apply the merge to.  It is
            stored as self.this_tree.
        :param this_tree: The local tree in the merge operation.  This
            constructor does not read it; working_tree is used instead.
        :param base_tree: The common tree in the merge operation
        :param other_tree: The other tree to merge changes from
        :param interesting_ids: The file_ids of files that should
            participate in the merge.  May not be combined with
            interesting_files.
        :param reprocess: If True, perform conflict-reduction processing.
        :param show_base: If True, show the base revision in text conflicts.
            (incompatible with reprocess)
        :param pb: A Progress bar
        :param pp: A ProgressPhase object.  If None, a three-phase
            ProgressPhase using pb is created.
        :param change_reporter: An object that should report changes made
        :param interesting_files: The tree-relative paths of files that should
            participate in the merge.  If these paths refer to directories,
            the contents of those directories will also be included.  May not
            be combined with interesting_ids.  If neither interesting_files nor
            interesting_ids is specified, all files may participate in the
            merge.
        :param do_merge: If True (the default), call self.do_merge() before
            returning.
        :param cherrypick: Stored as self.cherrypick.
        :raises ValueError: If both interesting_ids and interesting_files
            are given.
        """
        object.__init__(self)
        both_given = (interesting_ids is not None and
                      interesting_files is not None)
        if both_given:
            raise ValueError(
                'specify either interesting_ids or interesting_files')
        if pp is None:
            pp = ProgressPhase("Merge phase", 3, pb)
        # Trees taking part in the merge.
        self.this_tree = working_tree
        self.base_tree = base_tree
        self.other_tree = other_tree
        # Restriction of the merge to particular files.
        self.interesting_ids = interesting_ids
        self.interesting_files = interesting_files
        # Conflict bookkeeping and presentation options.
        self._raw_conflicts = []
        self.cooked_conflicts = []
        self.reprocess = reprocess
        self.show_base = show_base
        self.cherrypick = cherrypick
        # Progress and change reporting.
        self.pb = pb
        self.pp = pp
        self.change_reporter = change_reporter
        if do_merge:
            self.do_merge()
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
515
3008.1.6 by Michael Hudson
chop up Merge3Merger.__init__ into pieces
516
    def do_merge(self):
        """Compute the merge transform and apply it to this_tree.

        this_tree is locked for tree-write and base_tree and other_tree are
        read-locked for the duration.  After the transform has been applied,
        the modified-file hashes and the cooked conflicts are recorded on
        this_tree; trees that raise UnsupportedOperation from
        add_conflicts() are tolerated.

        Every lock that was taken is released, and the transform is
        finalized, even when a later lock, the TreeTransform constructor or
        tt.finalize() fails.
        """
        self.this_tree.lock_tree_write()
        try:
            self.base_tree.lock_read()
            try:
                self.other_tree.lock_read()
                try:
                    self.tt = TreeTransform(self.this_tree, self.pb)
                    try:
                        self.pp.next_phase()
                        self._compute_transform()
                        self.pp.next_phase()
                        results = self.tt.apply(no_conflicts=True)
                        self.write_modified(results)
                        try:
                            self.this_tree.add_conflicts(
                                self.cooked_conflicts)
                        except UnsupportedOperation:
                            pass
                    finally:
                        # Errors from finalize() are deliberately allowed
                        # to propagate; the unlocks below still run.
                        self.tt.finalize()
                finally:
                    self.other_tree.unlock()
            finally:
                self.base_tree.unlock()
        finally:
            self.this_tree.unlock()
            self.pb.clear()
1534.7.192 by Aaron Bentley
Record hashes produced by merges
537
3008.1.9 by Michael Hudson
wanton hacking that lets me write an efficient version of get_diff_as_merged
538
    def make_preview_transform(self):
        """Compute the merge as a TransformPreview without applying it.

        base_tree and other_tree are read-locked while the transform is
        computed.  The locks are released even if taking the second lock or
        constructing the TransformPreview fails.

        :return: The TransformPreview, also stored as self.tt.  It is not
            finalized here.
        """
        self.base_tree.lock_read()
        try:
            self.other_tree.lock_read()
            try:
                self.tt = TransformPreview(self.this_tree)
                self.pp.next_phase()
                self._compute_transform()
                self.pp.next_phase()
            finally:
                self.other_tree.unlock()
        finally:
            self.base_tree.unlock()
            self.pb.clear()
        return self.tt
551
3008.1.21 by Aaron Bentley
Make compute_transform private, test make_preview_transform
552
    def _compute_transform(self):
        """Fill self.tt with the changes needed to perform the merge.

        For every entry from self._entries3() the names/parents, the
        contents (only when the entry is marked as changed) and the execute
        bit are merged.  Afterwards the root is fixed up, filesystem
        conflicts are resolved, changes are reported to
        self.change_reporter (if any) and the conflicts are cooked and
        emitted as warnings.
        """
        entries = self._entries3()
        total = len(entries)
        progress = ui.ui_factory.nested_progress_bar()
        try:
            for index, entry in enumerate(entries):
                file_id, changed, parents3, names3, executable3 = entry
                progress.update('Preparing file merge', index, total)
                self._merge_names(file_id, parents3, names3)
                file_status = 'unmodified'
                if changed:
                    file_status = self.merge_contents(file_id)
                self._merge_executable(file_id, executable3, file_status)
        finally:
            progress.finished()
        self.fix_root()
        self.pp.next_phase()

        def resolution_pass(tt, conflicts):
            return conflict_pass(tt, conflicts, self.other_tree)

        progress = ui.ui_factory.nested_progress_bar()
        try:
            fs_conflicts = resolve_conflicts(self.tt, progress,
                                             resolution_pass)
        finally:
            progress.finished()
        if self.change_reporter is not None:
            from bzrlib import delta
            delta.report_changes(self.tt.iter_changes(),
                                 self.change_reporter)
        self.cook_conflicts(fs_conflicts)
        for cooked in self.cooked_conflicts:
            warning(cooked)
583
2590.2.4 by Aaron Bentley
Move entry generation to a helper
584
    def _entries3(self):
2590.2.7 by Aaron Bentley
Misc cleanup
585
        """Gather data about files modified between three trees.
586
587
        Return a list of tuples of file_id, changed, parents3, names3,
588
        executable3.  changed is a boolean indicating whether the file contents
589
        or kind were changed.  parents3 is a tuple of parent ids for base,
590
        other and this.  names3 is a tuple of names for base, other and this.
591
        executable3 is a tuple of execute-bit values for base, other and this.
592
        """
2590.2.4 by Aaron Bentley
Move entry generation to a helper
593
        result = []
3254.1.1 by Aaron Bentley
Make Tree.iter_changes a public method
594
        iterator = self.other_tree.iter_changes(self.base_tree,
3514.2.16 by John Arbash Meinel
Review feedback from Ian.
595
                include_unchanged=True, specific_files=self.interesting_files,
2590.2.5 by Aaron Bentley
Allow selected files to be specified instead of selected ids
596
                extra_trees=[self.this_tree])
2590.2.4 by Aaron Bentley
Move entry generation to a helper
597
        for (file_id, paths, changed, versioned, parents, names, kind,
2590.2.5 by Aaron Bentley
Allow selected files to be specified instead of selected ids
598
             executable) in iterator:
2590.2.4 by Aaron Bentley
Move entry generation to a helper
599
            if (self.interesting_ids is not None and
600
                file_id not in self.interesting_ids):
601
                continue
602
            if file_id in self.this_tree.inventory:
603
                entry = self.this_tree.inventory[file_id]
604
                this_name = entry.name
605
                this_parent = entry.parent_id
606
                this_executable = entry.executable
607
            else:
608
                this_name = None
609
                this_parent = None
610
                this_executable = None
611
            parents3 = parents + (this_parent,)
612
            names3 = names + (this_name,)
613
            executable3 = executable + (this_executable,)
614
            result.append((file_id, changed, parents3, names3, executable3))
615
        return result
616
1731.1.33 by Aaron Bentley
Revert no-special-root changes
617
    def fix_root(self):
        """Make sure the transform keeps a versioned root directory.

        If the transform's root has no final kind, its deletion is
        cancelled; if it has no final file id, it is versioned with the id
        it has in the tree.  Then, when other_tree has a root that maps to
        a different trans_id which would be created by the transform and
        whose file id is not in this_tree's inventory, its children are
        reparented onto the transform root and the creation and versioning
        of that other root are cancelled.
        """
        tt = self.tt
        try:
            tt.final_kind(tt.root)
        except NoSuchFile:
            tt.cancel_deletion(tt.root)
        if tt.final_file_id(tt.root) is None:
            tt.version_file(tt.tree_file_id(tt.root), tt.root)
        other_root_entry = self.other_tree.inventory.root
        if other_root_entry is None:
            return
        other_root = tt.trans_id_file_id(self.other_tree.get_root_id())
        if other_root == tt.root:
            return
        try:
            tt.final_kind(other_root)
        except NoSuchFile:
            return
        if other_root_entry.file_id in self.this_tree.inventory:
            # the other tree's root is a non-root in the current tree
            return
        self.reparent_children(other_root_entry, tt.root)
        tt.cancel_creation(other_root)
        tt.cancel_versioning(other_root)
641
642
    def reparent_children(self, ie, target):
        """Move every direct child of an inventory entry to a new parent.

        :param ie: The inventory entry whose ``children`` mapping holds the
            entries to move.
        :param target: The trans_id passed to tt.adjust_path() as the new
            parent of each child.
        """
        # Only the child entries are needed; the mapping keys were unused.
        for child in ie.children.values():
            trans_id = self.tt.trans_id_file_id(child.file_id)
            self.tt.adjust_path(self.tt.final_name(trans_id), target, trans_id)
646
1534.7.192 by Aaron Bentley
Record hashes produced by merges
647
    def write_modified(self, results):
        """Record the sha1 of each file the merge modified on this_tree.

        :param results: An object whose ``modified_paths`` attribute lists
            the paths that were modified.  Paths without a file id in
            this_tree, or for which no sha1 is available, are skipped.
        """
        tree = self.this_tree
        sha1_by_file_id = {}
        for path in results.modified_paths:
            file_id = tree.path2id(tree.relpath(path))
            if file_id is not None:
                sha1 = tree.get_file_sha1(file_id)
                if sha1 is not None:
                    sha1_by_file_id[file_id] = sha1
        tree.set_merge_modified(sha1_by_file_id)
658
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
659
    @staticmethod
660
    def parent(entry, file_id):
1534.7.157 by Aaron Bentley
Added more docs
661
        """Determine the parent for a file_id (used as a key method)"""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
662
        if entry is None:
663
            return None
664
        return entry.parent_id
665
666
    @staticmethod
667
    def name(entry, file_id):
1534.7.157 by Aaron Bentley
Added more docs
668
        """Determine the name for a file_id (used as a key method)"""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
669
        if entry is None:
670
            return None
671
        return entry.name
672
    
673
    @staticmethod
674
    def contents_sha1(tree, file_id):
1534.7.157 by Aaron Bentley
Added more docs
675
        """Determine the sha1 of the file contents (used as a key method)."""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
676
        if file_id not in tree:
677
            return None
678
        return tree.get_file_sha1(file_id)
679
680
    @staticmethod
681
    def executable(tree, file_id):
1534.7.157 by Aaron Bentley
Added more docs
682
        """Determine the executability of a file-id (used as a key method)."""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
683
        if file_id not in tree:
684
            return None
685
        if tree.kind(file_id) != "file":
686
            return False
687
        return tree.is_executable(file_id)
688
689
    @staticmethod
690
    def kind(tree, file_id):
1534.7.157 by Aaron Bentley
Added more docs
691
        """Determine the kind of a file-id (used as a key method)."""
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
692
        if file_id not in tree:
693
            return None
694
        return tree.kind(file_id)
695
696
    @staticmethod
2590.2.8 by Aaron Bentley
Restore conflict handling changes
697
    def _three_way(base, other, this):
698
        #if base == other, either they all agree, or only THIS has changed.
699
        if base == other:
700
            return 'this'
2590.2.10 by Aaron Bentley
Updates from review
701
        elif this not in (base, other):
2590.2.8 by Aaron Bentley
Restore conflict handling changes
702
            return 'conflict'
2590.2.10 by Aaron Bentley
Updates from review
703
        # "Ambiguous clean merge" -- both sides have made the same change.
2590.2.8 by Aaron Bentley
Restore conflict handling changes
704
        elif this == other:
705
            return "this"
2590.2.10 by Aaron Bentley
Updates from review
706
        # this == base: only other has changed.
2590.2.8 by Aaron Bentley
Restore conflict handling changes
707
        else:
708
            return "other"
709
710
    @staticmethod
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
711
    def scalar_three_way(this_tree, base_tree, other_tree, file_id, key):
712
        """Do a three-way test on a scalar.
713
        Return "this", "other" or "conflict", depending whether a value wins.
714
        """
715
        key_base = key(base_tree, file_id)
716
        key_other = key(other_tree, file_id)
717
        #if base == other, either they all agree, or only THIS has changed.
718
        if key_base == key_other:
719
            return "this"
720
        key_this = key(this_tree, file_id)
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
721
        # "Ambiguous clean merge"
722
        if key_this == key_other:
723
            return "this"
724
        elif key_this == key_base:
725
            return "other"
726
        else:
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
727
            return "conflict"
728
729
    def merge_names(self, file_id):
        """Merge the name and parent of file_id using the tree inventories.

        Looks file_id up in the inventories of this_tree, other_tree and
        base_tree and hands the names and parent ids, ordered
        (base, other, this) with None for a missing entry, to
        self._merge_names().

        :return: Whatever self._merge_names() returns.
        """
        def name_and_parent(tree):
            inventory = tree.inventory
            if file_id not in inventory:
                return None, None
            entry = inventory[file_id]
            return entry.name, entry.parent_id

        this_pair = name_and_parent(self.this_tree)
        other_pair = name_and_parent(self.other_tree)
        base_pair = name_and_parent(self.base_tree)
        ordered = (base_pair, other_pair, this_pair)
        names = [pair[0] for pair in ordered]
        parents = [pair[1] for pair in ordered]
        return self._merge_names(file_id, parents, names)
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
749
2590.2.2 by Aaron Bentley
Do most name merging from iter_changes output
750
    def _merge_names(self, file_id, parents, names):
2590.2.7 by Aaron Bentley
Misc cleanup
751
        """Perform a merge on file_id names and parents"""
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
752
        base_name, other_name, this_name = names
753
        base_parent, other_parent, this_parent = parents
2590.2.2 by Aaron Bentley
Do most name merging from iter_changes output
754
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
755
        name_winner = self._three_way(*names)
756
757
        parent_id_winner = self._three_way(*parents)
2590.2.2 by Aaron Bentley
Do most name merging from iter_changes output
758
        if this_name is None:
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
759
            if name_winner == "this":
760
                name_winner = "other"
761
            if parent_id_winner == "this":
762
                parent_id_winner = "other"
763
        if name_winner == "this" and parent_id_winner == "this":
764
            return
765
        if name_winner == "conflict":
1534.7.181 by Aaron Bentley
Renamed a bunch of functions
766
            trans_id = self.tt.trans_id_file_id(file_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
767
            self._raw_conflicts.append(('name conflict', trans_id, 
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
768
                                        this_name, other_name))
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
769
        if parent_id_winner == "conflict":
1534.7.181 by Aaron Bentley
Renamed a bunch of functions
770
            trans_id = self.tt.trans_id_file_id(file_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
771
            self._raw_conflicts.append(('parent conflict', trans_id, 
2590.2.1 by Aaron Bentley
Start work on merging names based on iter_changes
772
                                        this_parent, other_parent))
2590.2.2 by Aaron Bentley
Do most name merging from iter_changes output
773
        if other_name is None:
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
774
            # it doesn't matter whether the result was 'other' or 
775
            # 'conflict'-- if there's no 'other', we leave it alone.
776
            return
777
        # if we get here, name_winner and parent_winner are set to safe values.
1534.7.181 by Aaron Bentley
Renamed a bunch of functions
778
        trans_id = self.tt.trans_id_file_id(file_id)
2590.2.7 by Aaron Bentley
Misc cleanup
779
        parent_id = parents[self.winner_idx[parent_id_winner]]
1731.1.33 by Aaron Bentley
Revert no-special-root changes
780
        if parent_id is not None:
781
            parent_trans_id = self.tt.trans_id_file_id(parent_id)
2590.2.7 by Aaron Bentley
Misc cleanup
782
            self.tt.adjust_path(names[self.winner_idx[name_winner]],
1731.1.33 by Aaron Bentley
Revert no-special-root changes
783
                                parent_trans_id, trans_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
784
785
    def merge_contents(self, file_id):
        """Perform a merge on file_id contents.

        The (kind, contents) pairs of the file in BASE, OTHER and THIS are
        compared; contents is the sha1 for files, the target for symlinks
        and None otherwise.

        :return: "unmodified" if OTHER introduced no change or the same
            change as THIS; "modified" if OTHER's version was taken or a
            text merge was performed; "deleted" if OTHER's deletion was
            applied; None if a contents conflict was recorded, or if only
            OTHER changed but the file is neither in OTHER nor in THIS's
            inventory.
        """
        def contents_pair(tree):
            if file_id not in tree:
                return (None, None)
            kind = tree.kind(file_id)
            contents = None
            if kind == "file":
                contents = tree.get_file_sha1(file_id)
            elif kind == "symlink":
                contents = tree.get_symlink_target(file_id)
            return kind, contents

        def contents_conflict():
            conflict_trans_id = self.tt.trans_id_file_id(file_id)
            name = self.tt.final_name(conflict_trans_id)
            parent_id = self.tt.final_parent(conflict_trans_id)
            if file_id in self.this_tree.inventory:
                self.tt.unversion_file(conflict_trans_id)
                if file_id in self.this_tree:
                    self.tt.delete_contents(conflict_trans_id)
            file_group = self._dump_conflicts(name, parent_id, file_id,
                                              set_version=True)
            self._raw_conflicts.append(('contents conflict', file_group))

        # See SPOT run.  run, SPOT, run.
        # So we're not QUITE repeating ourselves; we do tricky things with
        # file kind...
        base_pair = contents_pair(self.base_tree)
        other_pair = contents_pair(self.other_tree)
        if base_pair == other_pair:
            # OTHER introduced no changes
            return "unmodified"
        this_pair = contents_pair(self.this_tree)
        if this_pair == other_pair:
            # THIS and OTHER introduced the same changes
            return "unmodified"

        trans_id = self.tt.trans_id_file_id(file_id)
        if this_pair == base_pair:
            # only OTHER introduced changes
            if file_id in self.this_tree:
                # Remove any existing contents
                self.tt.delete_contents(trans_id)
            if file_id in self.other_tree:
                # OTHER changed the file
                create_by_entry(self.tt,
                                self.other_tree.inventory[file_id],
                                self.other_tree, trans_id)
                if file_id not in self.this_tree.inventory:
                    self.tt.version_file(file_id, trans_id)
                return "modified"
            if file_id in self.this_tree.inventory:
                # OTHER deleted the file
                self.tt.unversion_file(trans_id)
                return "deleted"
            return None

        # BOTH THIS and OTHER introduced changes; scalar conflict
        if this_pair[0] == "file" and other_pair[0] == "file":
            # THIS and OTHER are both files, so text merge.  Either
            # BASE is a file, or both converted to files, so at least we
            # have agreement that output should be a file.
            try:
                self.text_merge(file_id, trans_id)
            except BinaryFile:
                contents_conflict()
                return None
            if file_id not in self.this_tree.inventory:
                self.tt.version_file(file_id, trans_id)
            try:
                self.tt.tree_kind(trans_id)
                self.tt.delete_contents(trans_id)
            except NoSuchFile:
                pass
            return "modified"

        # Scalar conflict, can't text merge.  Dump conflicts
        contents_conflict()
        return None
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
862
863
    def get_lines(self, tree, file_id):
        """Return the lines of file_id in tree, or [] if tree lacks it."""
        if file_id not in tree:
            return []
        return tree.get_file(file_id).readlines()
869
870
    def text_merge(self, file_id, trans_id):
        """Three-way merge the text of file_id and store it under trans_id.

        The merged lines are streamed into the tree transform as the contents
        of trans_id.  If any conflict region is produced, a 'text conflict'
        is appended to self._raw_conflicts and the conflict files are emitted
        through _dump_conflicts.
        """
        # BASE only contributes text when it holds file_id as a regular file.
        # Otherwise an empty base is used, which yields two-way text
        # conflicts between THIS and OTHER.
        base_is_file = (file_id in self.base_tree and
                        self.base_tree.kind(file_id) == "file")
        if base_is_file:
            base_lines = self.get_lines(self.base_tree, file_id)
        else:
            base_lines = []
        other_lines = self.get_lines(self.other_tree, file_id)
        this_lines = self.get_lines(self.this_tree, file_id)
        merger = Merge3(base_lines, this_lines, other_lines,
                        is_cherrypick=self.cherrypick)
        # A placeholder start marker is handed to merge_lines; spotting it in
        # the output is how conflict regions are detected, and it is swapped
        # for the usual '<<<<<<<' on the way out.
        placeholder = "!START OF MERGE CONFLICT!" + "I HOPE THIS IS UNIQUE"
        base_marker = None
        if self.show_base is True:
            base_marker = '|' * 7

        def merged_text(state):
            # The flag is only populated once the consumer starts iterating.
            state["text_conflicts"] = False
            merged = merger.merge_lines(name_a="TREE",
                                        name_b="MERGE-SOURCE",
                                        name_base="BASE-REVISION",
                                        start_marker=placeholder,
                                        base_marker=base_marker,
                                        reprocess=self.reprocess)
            for line in merged:
                if not line.startswith(placeholder):
                    yield line
                    continue
                state["text_conflicts"] = True
                yield line.replace(placeholder, '<' * 7)

        outcome = {}
        self.tt.create_file(merged_text(outcome), trans_id)
        if outcome["text_conflicts"]:
            self._raw_conflicts.append(('text conflict', trans_id))
            name = self.tt.final_name(trans_id)
            parent_id = self.tt.final_parent(trans_id)
            file_group = self._dump_conflicts(name, parent_id, file_id,
                                              this_lines, base_lines,
                                              other_lines)
            file_group.append(trans_id)
913
914
    def _dump_conflicts(self, name, parent_id, file_id, this_lines=None,
                        base_lines=None, other_lines=None, set_version=False,
                        no_base=False):
        """Emit the conflict files for file_id and return their trans_ids.

        A conflict file is written for OTHER, THIS and (unless no_base is
        true) BASE, in that order, for each of those trees that contains
        file_id.  If this_lines, base_lines, or other_lines are omitted, they
        will be determined automatically.  If set_version is true, the first
        conflict file emitted (.OTHER, .THIS or .BASE, in that order) is
        versioned as file_id.

        :return: The list of trans_ids of the conflict files created.
        """
        candidates = [('OTHER', self.other_tree, other_lines),
                      ('THIS', self.this_tree, this_lines)]
        if not no_base:
            candidates.append(('BASE', self.base_tree, base_lines))
        # Only the first emitted conflict file may take over the file_id.
        needs_version = set_version
        emitted = []
        for suffix, tree, lines in candidates:
            if file_id not in tree:
                continue
            conflict_trans_id = self._conflict_file(name, parent_id, tree,
                                                    file_id, suffix, lines)
            emitted.append(conflict_trans_id)
            if needs_version:
                self.tt.version_file(file_id, conflict_trans_id)
                needs_version = False
        return emitted
937
           
938
    def _conflict_file(self, name, parent_id, tree, file_id, suffix,
                       lines=None):
        """Emit a single conflict file called '<name>.<suffix>'.

        A new path is created under parent_id in the transform and filled
        from tree's inventory entry for file_id.

        :return: The trans_id of the newly created path.
        """
        conflict_name = '.'.join((name, suffix))
        trans_id = self.tt.create_path(conflict_name, parent_id)
        create_by_entry(self.tt, tree.inventory[file_id], tree, trans_id,
                        lines)
        return trans_id
946
947
    def merge_executable(self, file_id, file_status):
        """Perform a merge on the execute bit.

        Looks up the execute bit of file_id in BASE, OTHER and THIS (in that
        order) and hands the three values to _merge_executable.
        """
        base_bit = self.executable(self.base_tree, file_id)
        other_bit = self.executable(self.other_tree, file_id)
        this_bit = self.executable(self.this_tree, file_id)
        self._merge_executable(file_id, [base_bit, other_bit, this_bit],
                               file_status)
952
953
    def _merge_executable(self, file_id, executable, file_status):
        """Perform a merge on the execute bit.

        :param file_id: The file-id whose execute bit is being merged.
        :param executable: A sequence of three execute-bit values, in the
            order (base, other, this).
        :param file_status: A status string for the file.  "deleted" means
            there is nothing to do; "modified" forces the bit to be applied
            even when THIS wins.
        :return: None.  The chosen bit, if any, is applied to the transform
            with set_executability.
        """
        base_executable, other_executable, this_executable = executable
        if file_status == "deleted":
            return
        winner = self._three_way(*executable)
        if winner == "conflict":
            # There must be a None in here, if we have a conflict, but we
            # need executability since file status was not deleted.
            if self.executable(self.other_tree, file_id) is None:
                winner = "this"
            else:
                winner = "other"
        if winner == 'this' and file_status != "modified":
            return
        trans_id = self.tt.trans_id_file_id(file_id)
        try:
            # The execute bit is only applied to regular files.
            if self.tt.final_kind(trans_id) != "file":
                return
        except NoSuchFile:
            return
        # Start from None so that a file-id present in none of the trees
        # leaves the bit untouched instead of raising UnboundLocalError.
        executability = None
        if winner == "this":
            executability = this_executable
        elif file_id in self.other_tree:
            executability = other_executable
        elif file_id in self.this_tree:
            executability = this_executable
        elif file_id in self.base_tree:
            executability = base_executable
        if executability is not None:
            self.tt.set_executability(executability, trans_id)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
986
1534.7.172 by Aaron Bentley
Integrated fs conflicts with merge conflicts.
987
    def cook_conflicts(self, fs_conflicts):
        """Convert all conflicts into a form that doesn't depend on trans_id.

        The cooked form of fs_conflicts is added to self.cooked_conflicts
        first, followed by one Conflict per raw contents/text conflict and
        one 'path conflict' per trans_id that has a name and/or parent
        conflict.  self.cooked_conflicts is sorted by Conflict.sort_key
        before returning.
        """
        from conflicts import Conflict
        path_conflicts = {}
        self.cooked_conflicts.extend(cook_conflicts(fs_conflicts, self.tt))
        final_paths = FinalPaths(self.tt)
        for raw in self._raw_conflicts:
            kind = raw[0]
            if kind in ('name conflict', 'parent conflict'):
                # Collected per trans_id and reported together below as a
                # single path conflict.
                trans_id = raw[1]
                per_file = path_conflicts.setdefault(trans_id, {})
                unique_add(per_file, kind, raw[2:])
            elif kind == 'contents conflict':
                # Use the first trans_id in the group that has a file_id.
                for trans_id in raw[1]:
                    file_id = self.tt.final_file_id(trans_id)
                    if file_id is not None:
                        break
                path = final_paths.get_path(trans_id)
                # Report the path without its conflict-file suffix.
                for suffix in ('.BASE', '.THIS', '.OTHER'):
                    if path.endswith(suffix):
                        path = path[:-len(suffix)]
                        break
                self.cooked_conflicts.append(
                    Conflict.factory(kind, path=path, file_id=file_id))
            elif kind == 'text conflict':
                trans_id = raw[1]
                path = final_paths.get_path(trans_id)
                file_id = self.tt.final_file_id(trans_id)
                self.cooked_conflicts.append(
                    Conflict.factory(kind, path=path, file_id=file_id))

        for trans_id, conflicts in path_conflicts.iteritems():
            if 'parent conflict' in conflicts:
                this_parent, other_parent = conflicts['parent conflict']
                if this_parent == other_parent:
                    raise AssertionError()
            else:
                this_parent = other_parent = \
                    self.tt.final_file_id(self.tt.final_parent(trans_id))
            if 'name conflict' in conflicts:
                this_name, other_name = conflicts['name conflict']
                if this_name == other_name:
                    raise AssertionError()
            else:
                this_name = other_name = self.tt.final_name(trans_id)
            other_path = final_paths.get_path(trans_id)
            if this_parent is not None and this_name is not None:
                parent_path = final_paths.get_path(
                    self.tt.trans_id_file_id(this_parent))
                this_path = pathjoin(parent_path, this_name)
            else:
                this_path = "<deleted>"
            file_id = self.tt.final_file_id(trans_id)
            self.cooked_conflicts.append(
                Conflict.factory('path conflict', path=this_path,
                                 conflict_path=other_path, file_id=file_id))
        self.cooked_conflicts.sort(key=Conflict.sort_key)
1534.7.141 by Aaron Bentley
Added conflict reporting
1047
1048
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1049
class WeaveMerger(Merge3Merger):
    """Three-way tree merger, text weave merger."""
    supports_reprocess = True
    supports_show_base = False
    supports_reverse_cherrypick = False
    history_based = True

    def _generate_merge_plan(self, file_id, base):
        """Return the merge plan for file_id between THIS and OTHER.

        Subclasses override this to select a different planning algorithm;
        everything else in _merged_lines is shared.

        :param base: The base tree to plan against, or None.
        """
        return self.this_tree.plan_file_merge(file_id, self.other_tree,
                                              base=base)

    def _merged_lines(self, file_id):
        """Generate the merged lines.

        There is no distinction between lines that are meant to contain <<<<<<<
        and conflicts.

        :return: Whatever PlanWeaveMerge.merge_lines returns; text_merge
            unpacks it as (lines, conflicts).
        """
        # The base tree is only handed to the planner when cherrypicking.
        if self.cherrypick:
            base = self.base_tree
        else:
            base = None
        plan = self._generate_merge_plan(file_id, base)
        if 'merge' in debug.debug_flags:
            # Materialise the plan so it can be both dumped to a '.plan'
            # file next to the merged file and used for the merge itself.
            plan = list(plan)
            trans_id = self.tt.trans_id_file_id(file_id)
            name = self.tt.final_name(trans_id) + '.plan'
            contents = ('%10s|%s' % l for l in plan)
            self.tt.new_file(name, self.tt.final_parent(trans_id), contents)
        textmerge = PlanWeaveMerge(plan, '<<<<<<< TREE\n',
            '>>>>>>> MERGE-SOURCE\n')
        return textmerge.merge_lines(self.reprocess)

    def text_merge(self, file_id, trans_id):
        """Perform a (weave) text merge for a given file and file-id.

        If conflicts are encountered, .THIS and .OTHER files will be emitted,
        and a conflict will be noted.
        """
        lines, conflicts = self._merged_lines(file_id)
        lines = list(lines)
        # Note we're checking whether the OUTPUT is binary in this case,
        # because we don't want to get into weave merge guts.
        check_text_lines(lines)
        self.tt.create_file(lines, trans_id)
        if conflicts:
            self._raw_conflicts.append(('text conflict', trans_id))
            name = self.tt.final_name(trans_id)
            parent_id = self.tt.final_parent(trans_id)
            file_group = self._dump_conflicts(name, parent_id, file_id,
                                              no_base=True)
            file_group.append(trans_id)


class LCAMerger(WeaveMerger):
    """Weave-style merger whose plan comes from plan_file_lca_merge."""

    def _generate_merge_plan(self, file_id, base):
        """Return the LCA merge plan for file_id between THIS and OTHER.

        :param base: The base tree to plan against, or None.
        """
        return self.this_tree.plan_file_lca_merge(file_id, self.other_tree,
                                                  base=base)
1119
1120
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1121
class Diff3Merger(Merge3Merger):
    """Three-way merger using external diff3 for text merging"""

    def dump_file(self, temp_dir, name, tree, file_id):
        """Copy the contents of file_id in tree to the file temp_dir/name.

        :return: The path of the file that was written.
        """
        out_path = pathjoin(temp_dir, name)
        out_file = open(out_path, "wb")
        try:
            in_file = tree.get_file(file_id)
            try:
                for line in in_file:
                    out_file.write(line)
            finally:
                # Release the source as well; it was previously left open.
                in_file.close()
        finally:
            out_file.close()
        return out_path

    def text_merge(self, file_id, trans_id):
        """Perform a diff3 merge using a specified file-id and trans-id.

        If conflicts are encountered, .BASE, .THIS and .OTHER conflict files
        will be dumped, and a conflict will be noted.

        :raises BzrError: if diff3 exits with a status other than 0 or 1.
        """
        import bzrlib.patch
        temp_dir = osutils.mkdtemp(prefix="bzr-")
        try:
            new_file = pathjoin(temp_dir, "new")
            this = self.dump_file(temp_dir, "this", self.this_tree, file_id)
            base = self.dump_file(temp_dir, "base", self.base_tree, file_id)
            other = self.dump_file(temp_dir, "other", self.other_tree, file_id)
            status = bzrlib.patch.diff3(new_file, this, base, other)
            if status not in (0, 1):
                raise BzrError("Unhandled diff3 exit code")
            f = open(new_file, 'rb')
            try:
                self.tt.create_file(f, trans_id)
            finally:
                f.close()
            # Status 1 is treated as "merged, but with conflicts".
            if status == 1:
                name = self.tt.final_name(trans_id)
                parent_id = self.tt.final_parent(trans_id)
                self._dump_conflicts(name, parent_id, file_id)
                self._raw_conflicts.append(('text conflict', trans_id))
        finally:
            # The scratch directory is removed whether or not the merge
            # succeeded.
            osutils.rmtree(temp_dir)
1534.7.140 by Aaron Bentley
Moved the merge stuff into merge.py
1162
1163
1164
def merge_inner(this_branch, other_tree, base_tree, ignore_zero=False,
                backup_files=False,
                merge_type=Merge3Merger,
                interesting_ids=None,
                show_base=False,
                reprocess=False,
                other_rev_id=None,
                interesting_files=None,
                this_tree=None,
                pb=DummyProgress(),
                change_reporter=None):
    """Primary interface for merging.

    Typical use is probably
    'merge_inner(branch, branch.get_revision_tree(other_revision),
                 branch.get_revision_tree(base_revision))'

    A Merger is built from the arguments, configured, and run.

    :return: The result of Merger.do_merge().
    :raises BzrError: if this_tree is not supplied.
    :raises ValueError: if both interesting_ids and interesting_files are
        supplied.
    """
    if this_tree is None:
        raise BzrError("bzrlib.merge.merge_inner requires a this_tree "
                       "parameter as of bzrlib version 0.8.")
    merger = Merger(this_branch, other_tree, base_tree, this_tree=this_tree,
                    pb=pb, change_reporter=change_reporter)
    merger.backup_files = backup_files
    merger.merge_type = merge_type
    merger.interesting_ids = interesting_ids
    merger.ignore_zero = ignore_zero
    # The two ways of restricting the merge are mutually exclusive.
    if interesting_files and interesting_ids:
        raise ValueError('Only supply interesting_ids'
                         ' or interesting_files')
    if interesting_files:
        merger.interesting_files = interesting_files
    merger.show_base = show_base
    merger.reprocess = reprocess
    merger.other_rev_id = other_rev_id
    merger.other_basis = other_rev_id
    # Trees without get_revision_id are asked for last_revision instead.
    base_revision_getter = getattr(base_tree, 'get_revision_id', None)
    if base_revision_getter is None:
        base_revision_getter = base_tree.last_revision
    merger.set_base_revision(base_revision_getter(), this_branch)
    return merger.do_merge()
1204
2221.4.15 by Aaron Bentley
Use RegistryOption for merge type
1205
def get_merge_type_registry():
    """Return the registry of merge types.

    The registry lives in bzrlib.option to avoid circular imports; this
    function is the sanctioned way to retrieve it.
    """
    from bzrlib.option import _merge_type_registry
    return _merge_type_registry
1551.15.46 by Aaron Bentley
Move plan merge to tree
1212
1213
1214
def _plan_annotate_merge(annotated_a, annotated_b, ancestors_a, ancestors_b):
    """Yield a merge plan, as (state, text) pairs, from two annotated texts.

    :param annotated_a: Sequence of (revision, text) pairs for side A.
    :param annotated_b: Sequence of (revision, text) pairs for side B.
    :param ancestors_a: Container of revisions tested with `in` for side A.
    :param ancestors_b: Container of revisions tested with `in` for side B.

    Lines matched between the two texts are 'unchanged'.  An unmatched A
    line is 'killed-b' if its revision is in ancestors_b, else 'new-a'; an
    unmatched B line is 'killed-a' if its revision is in ancestors_a, else
    'new-b'.
    """
    texts_a = [text for (revision, text) in annotated_a]
    texts_b = [text for (revision, text) in annotated_b]
    matcher = patiencediff.PatienceSequenceMatcher(None, texts_a, texts_b)
    matching_blocks = matcher.get_matching_blocks()
    a_pos = 0
    b_pos = 0
    for a_start, b_start, length in matching_blocks:
        # Emit everything skipped since the previous matching block.  The
        # final mismatched section is covered because the blocks always end
        # with a zero-length block.
        for revision, text in annotated_a[a_pos:a_start]:
            if revision in ancestors_b:
                yield 'killed-b', text
            else:
                yield 'new-a', text
        for revision, text in annotated_b[b_pos:b_start]:
            if revision in ancestors_a:
                yield 'killed-a', text
            else:
                yield 'new-b', text
        # Then the matched section itself.
        a_pos = a_start + length
        b_pos = b_start + length
        for text in texts_a[a_start:a_pos]:
            yield "unchanged", text
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1246
1247
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1248
class _PlanMergeBase(object):
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1249
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1250
    def __init__(self, a_rev, b_rev, vf, key_prefix):
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1251
        """Contructor.
1252
1253
        :param a_rev: Revision-id of one revision to merge
1254
        :param b_rev: Revision-id of the other revision to merge
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1255
        :param vf: A VersionedFiles containing both revisions
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1256
        :param key_prefix: A prefix for accessing keys in vf, typically
1257
            (file_id,).
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1258
        """
1259
        self.a_rev = a_rev
1260
        self.b_rev = b_rev
1261
        self.vf = vf
3062.1.12 by Aaron Bentley
Implement simple text cache
1262
        self._last_lines = None
1263
        self._last_lines_revision_id = None
3144.3.7 by Aaron Bentley
Update from review
1264
        self._cached_matching_blocks = {}
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1265
        self._key_prefix = key_prefix
3514.2.2 by John Arbash Meinel
Restore a real weave merge to 'bzr merge --weave'.
1266
        self._precache_tip_lines()
1267
1268
    def _precache_tip_lines(self):
1269
        lines = self.get_lines([self.a_rev, self.b_rev])
1270
        self.lines_a = lines[self.a_rev]
1271
        self.lines_b = lines[self.b_rev]
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1272
1273
    def get_lines(self, revisions):
1274
        """Get lines for revisions from the backing VersionedFiles.
1275
        
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1276
        :raises RevisionNotPresent: on absent texts.
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1277
        """
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1278
        keys = [(self._key_prefix + (rev,)) for rev in revisions]
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1279
        result = {}
1280
        for record in self.vf.get_record_stream(keys, 'unordered', True):
1281
            if record.storage_kind == 'absent':
1282
                raise errors.RevisionNotPresent(record.key, self.vf)
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1283
            result[record.key[-1]] = osutils.split_lines(
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1284
                record.get_bytes_as('fulltext'))
1285
        return result
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1286
1287
    def plan_merge(self):
1288
        """Generate a 'plan' for merging the two revisions.
1289
1290
        This involves comparing their texts and determining the cause of
1291
        differences.  If text A has a line and text B does not, then either the
1292
        line was added to text A, or it was deleted from B.  Once the causes
1293
        are combined, they are written out in the format described in
1294
        VersionedFile.plan_merge
1295
        """
1296
        blocks = self._get_matching_blocks(self.a_rev, self.b_rev)
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1297
        unique_a, unique_b = self._unique_lines(blocks)
1298
        new_a, killed_b = self._determine_status(self.a_rev, unique_a)
1299
        new_b, killed_a = self._determine_status(self.b_rev, unique_b)
1300
        return self._iter_plan(blocks, new_a, killed_b, new_b, killed_a)
1301
1302
    def _iter_plan(self, blocks, new_a, killed_b, new_b, killed_a):
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1303
        last_i = 0
1304
        last_j = 0
1305
        for i, j, n in blocks:
1306
            for a_index in range(last_i, i):
1307
                if a_index in new_a:
3144.3.2 by Aaron Bentley
Get conflict handling working
1308
                    if a_index in killed_b:
1309
                        yield 'conflicted-a', self.lines_a[a_index]
1310
                    else:
1311
                        yield 'new-a', self.lines_a[a_index]
1312
                else:
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1313
                    yield 'killed-b', self.lines_a[a_index]
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1314
            for b_index in range(last_j, j):
1315
                if b_index in new_b:
3144.3.2 by Aaron Bentley
Get conflict handling working
1316
                    if b_index in killed_a:
3144.3.10 by Aaron Bentley
Use correct index when emitting conflicted-b
1317
                        yield 'conflicted-b', self.lines_b[b_index]
3144.3.2 by Aaron Bentley
Get conflict handling working
1318
                    else:
1319
                        yield 'new-b', self.lines_b[b_index]
1320
                else:
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1321
                    yield 'killed-a', self.lines_b[b_index]
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1322
            # handle common lines
1323
            for a_index in range(i, i+n):
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1324
                yield 'unchanged', self.lines_a[a_index]
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1325
            last_i = i+n
1326
            last_j = j+n
1327
1328
    def _get_matching_blocks(self, left_revision, right_revision):
1329
        """Return a description of which sections of two revisions match.
1330
1331
        See SequenceMatcher.get_matching_blocks
1332
        """
3144.3.7 by Aaron Bentley
Update from review
1333
        cached = self._cached_matching_blocks.get((left_revision,
1334
                                                   right_revision))
1335
        if cached is not None:
1336
            return cached
3062.1.12 by Aaron Bentley
Implement simple text cache
1337
        if self._last_lines_revision_id == left_revision:
1338
            left_lines = self._last_lines
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1339
            right_lines = self.get_lines([right_revision])[right_revision]
3062.1.12 by Aaron Bentley
Implement simple text cache
1340
        else:
3350.6.4 by Robert Collins
First cut at pluralised VersionedFiles. Some rather massive API incompatabilities, primarily because of the difficulty of coherence among competing stores.
1341
            lines = self.get_lines([left_revision, right_revision])
1342
            left_lines = lines[left_revision]
1343
            right_lines = lines[right_revision]
3062.1.12 by Aaron Bentley
Implement simple text cache
1344
        self._last_lines = right_lines
1345
        self._last_lines_revision_id = right_revision
3062.1.9 by Aaron Bentley
Move PlanMerge into merge and _PlanMergeVersionedFile into versionedfile
1346
        matcher = patiencediff.PatienceSequenceMatcher(None, left_lines,
1347
                                                       right_lines)
1348
        return matcher.get_matching_blocks()
1349
1350
    def _unique_lines(self, matching_blocks):
1351
        """Analyse matching_blocks to determine which lines are unique
1352
1353
        :return: a tuple of (unique_left, unique_right), where the values are
1354
            sets of line numbers of unique lines.
1355
        """
1356
        last_i = 0
1357
        last_j = 0
1358
        unique_left = []
1359
        unique_right = []
1360
        for i, j, n in matching_blocks:
1361
            unique_left.extend(range(last_i, i))
1362
            unique_right.extend(range(last_j, j))
1363
            last_i = i + n
1364
            last_j = j + n
1365
        return unique_left, unique_right
1366
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1367
    @staticmethod
1368
    def _subtract_plans(old_plan, new_plan):
3144.3.7 by Aaron Bentley
Update from review
1369
        """Remove changes from new_plan that came from old_plan.
1370
1371
        It is assumed that the difference between the old_plan and new_plan
1372
        is their choice of 'b' text.
1373
1374
        All lines from new_plan that differ from old_plan are emitted
1375
        verbatim.  All lines from new_plan that match old_plan but are
1376
        not about the 'b' revision are emitted verbatim.
1377
1378
        Lines that match and are about the 'b' revision are the lines we
1379
        don't want, so we convert 'killed-b' -> 'unchanged', and 'new-b'
1380
        is skipped entirely.
1381
        """
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1382
        matcher = patiencediff.PatienceSequenceMatcher(None, old_plan,
1383
                                                       new_plan)
1384
        last_j = 0
1385
        for i, j, n in matcher.get_matching_blocks():
1386
            for jj in range(last_j, j):
1387
                yield new_plan[jj]
1388
            for jj in range(j, j+n):
1389
                plan_line = new_plan[jj]
1390
                if plan_line[0] == 'new-b':
1391
                    pass
1392
                elif plan_line[0] == 'killed-b':
1393
                    yield 'unchanged', plan_line[1]
1394
                else:
1395
                    yield plan_line
1396
            last_j = j + n
1397
1398
1399
class _PlanMerge(_PlanMergeBase):
    """Plan an annotate merge using on-the-fly annotation"""

    def __init__(self, a_rev, b_rev, vf, key_prefix):
        """Set up the plan, building an in-memory weave when needed.

        When the graph reports a single head for the two tips, that head is
        remembered in self._head_key and no weave is built.  Otherwise
        self._head_key is None and self._weave is populated.

        :param a_rev: Revision-id of one revision to merge
        :param b_rev: Revision-id of the other revision to merge
        :param vf: A VersionedFiles containing both revisions
        :param key_prefix: A prefix for accessing keys in vf
        """
        super(_PlanMerge, self).__init__(a_rev, b_rev, vf, key_prefix)
        self.a_key = self._key_prefix + (self.a_rev,)
        self.b_key = self._key_prefix + (self.b_rev,)
        self.graph = Graph(self.vf)
        heads = self.graph.heads((self.a_key, self.b_key))
        if len(heads) != 1:
            self._head_key = None
            self._build_weave()
            return
        # One side dominates, so we can just return its values, yay for
        # per-file graphs.
        # Ideally we would know that before we get this far.
        self._head_key = heads.pop()
        if self._head_key == self.a_key:
            dominated = b_rev
        else:
            dominated = a_rev
        mutter('found dominating revision for %s\n%s > %s', self.vf,
               self._head_key[-1], dominated)
        self._weave = None

    def _precache_tip_lines(self):
        """Do nothing; the texts are fetched later on."""

    def _find_recursive_lcas(self):
        """Find all the ancestors back to a unique lca

        :return: A dict mapping each key visited to a tuple of its parents
            as ordered by graph.find_merge_order().
        """
        result = {}
        tips = (self.a_key, self.b_key)
        while True:
            # graph.find_lca(uncommon, keys) now returns plain
            # NULL_REVISION, rather than a key tuple. We just map that
            # directly to no common ancestors.
            lcas = self.graph.find_lca(*tips)
            if lcas == set([NULL_REVISION]):
                lcas = ()
            # Order the lca's based on when they were merged into the tip.
            # While the actual merge portion of weave merge uses a set() of
            # active revisions, the order of insertion *does* affect the
            # implicit ordering of the texts.
            for tip in tips:
                result[tip] = tuple(self.graph.find_merge_order(tip, lcas))
            lca_count = len(lcas)
            if lca_count == 2:
                # Exactly two LCAs: recurse one level further down.
                tips = lcas
                continue
            if lca_count == 1:
                result[list(lcas)[0]] = ()
            elif lca_count > 2:
                # More than 2 lca's, fall back to grabbing all nodes between
                # this and the unique lca.
                mutter('More than 2 LCAs, falling back to all nodes for:'
                       ' %s, %s\n=> %s', self.a_key, self.b_key, tips)
                remaining = lcas
                while len(remaining) > 1:
                    remaining = self.graph.find_lca(*remaining)
                # None means: no common base to find, use the full ancestry.
                unique_lca = None
                if len(remaining) != 0:
                    candidate = list(remaining)[0]
                    # find_lca will return a plain 'NULL_REVISION' rather
                    # than a key tuple when there is no common ancestor, we
                    # prefer to just use None, because it doesn't confuse
                    # _get_interesting_texts()
                    if candidate != NULL_REVISION:
                        unique_lca = candidate
                result.update(self._find_unique_parents(lcas, unique_lca))
            return result

    def _find_unique_parents(self, tip_keys, base_key):
        """Find ancestors of tip that aren't ancestors of base.

        :param tip_keys: Nodes that are interesting
        :param base_key: Cull all ancestors of this node
        :return: The parent map for all revisions between tip_keys and
            base_key. base_key will be included. References to nodes outside
            of the ancestor set will also be removed.
        """
        # TODO: this would be simpler if find_unique_ancestors took a list
        #       instead of a single tip, internally it supports it, but it
        #       isn't a "backwards compatible" api change.
        if base_key is not None:
            between = set()
            for tip in tip_keys:
                between.update(
                    self.graph.find_unique_ancestors(tip, [base_key]))
            parent_map = self.graph.get_parent_map(between)
            parent_map[base_key] = ()
        else:
            parent_map = dict(self.graph.iter_ancestry(tip_keys))
            # We remove NULL_REVISION because it isn't a proper tuple key,
            # and thus confuses things like _get_interesting_texts, and our
            # logic to add the texts into the memory weave.
            parent_map.pop(NULL_REVISION, None)
        culled, child_map, tails = self._remove_external_references(
            parent_map)
        if base_key is not None:
            # Remove all the tails but base_key
            tails.remove(base_key)
            self._prune_tails(culled, child_map, tails)
        # Now remove all the uninteresting 'linear' regions
        return _mod_graph.collapse_linear_regions(culled)

    @staticmethod
    def _remove_external_references(parent_map):
        """Remove references that go outside of the parent map.

        :param parent_map: Something returned from Graph.get_parent_map(keys)
        :return: (filtered_parent_map, child_map, tails)
            filtered_parent_map is parent_map without external references
            child_map is the {parent_key: [child_keys]} mapping
            tails is a list of nodes that do not have any parents in the map
        """
        # TODO: The basic effect of this function seems more generic than
        #       _PlanMerge. But the specific details of building a child_map,
        #       and computing tails seems very specific to _PlanMerge.
        #       Still, should this be in Graph land?
        internal_parents = {}
        children_of = {}
        parentless = []
        for key, parents in parent_map.iteritems():
            kept = []
            for parent in parents:
                if parent in parent_map:
                    kept.append(parent)
                    children_of.setdefault(parent, []).append(key)
            if not kept:
                parentless.append(key)
            # TODO: Do we want to do this, it adds overhead for every node,
            #       just to say that the node has no children
            children_of.setdefault(key, [])
            internal_parents[key] = kept
        return internal_parents, children_of, parentless

    @staticmethod
    def _prune_tails(parent_map, child_map, tails_to_remove):
        """Remove tails from the parent map.

        This will remove the supplied revisions until no more children have 0
        parents.

        :param parent_map: A dict of {child: [parents]}, this dictionary will
            be modified in place.
        :param tails_to_remove: A list of tips that should be removed,
            this list will be consumed
        :param child_map: The reverse dict of parent_map ({parent: [children]})
            this dict will be modified
        :return: None, parent_map will be modified in place.
        """
        while tails_to_remove:
            tail = tails_to_remove.pop()
            del parent_map[tail]
            for child in child_map.pop(tail):
                remaining_parents = parent_map[child]
                remaining_parents.remove(tail)
                if not remaining_parents:
                    # The child just lost its last parent, so it is a tail
                    # itself now.
                    tails_to_remove.append(child)

    def _get_interesting_texts(self, parent_map):
        """Return a dict of texts we are interested in.

        Note that the input is in key tuples, but the output is in plain
        revision ids.

        :param parent_map: The output from _find_recursive_lcas
        :return: A dict of {'revision_id':lines} as returned by
            _PlanMergeBase.get_lines()
        """
        wanted_keys = set(parent_map)
        wanted_keys.update((self.a_key, self.b_key))
        # Everything else is in 'keys' but get_lines is in 'revision_ids'
        return self.get_lines([key[-1] for key in wanted_keys])

    def _build_weave(self):
        """Fill self._weave with the texts named by _find_recursive_lcas()."""
        from bzrlib import weave
        self._weave = weave.Weave(weave_name='in_memory_weave',
                                  allow_reserved=True)
        parent_map = self._find_recursive_lcas()
        texts = self._get_interesting_texts(parent_map)

        # Note: Unfortunately, the order given by topo_sort will affect the
        # ordering resolution in the output. Specifically, if you add A then
        # B, then in the output text A lines will show up before B lines.
        # And, of course, topo_sort doesn't guarantee any real ordering.
        # So we use merge_sort, and add a fake node on the tip.
        # This ensures that left-hand parents will always be inserted into
        # the weave before right-hand parents.
        tip_key = self._key_prefix + (_mod_revision.CURRENT_REVISION,)
        parent_map[tip_key] = (self.a_key, self.b_key)

        ordered = tsort.merge_sort(parent_map, tip_key)
        for _seq_num, key, _depth, _eom in reversed(ordered):
            if key != tip_key:
                revision_id = key[-1]
                parent_ids = [parent[-1] for parent in parent_map[key]]
                self._weave.add_lines(revision_id, parent_ids,
                                      texts[revision_id])

    def plan_merge(self):
        """Generate a 'plan' for merging the two revisions.

        The two texts are compared and the reason for every difference is
        worked out: a line present in A but missing from B was either added
        on the A side or deleted on the B side.  The combined result is
        produced in the format described in VersionedFile.plan_merge.

        When a single head was found at construction time, every line of
        that head's text is reported as new on its side.
        """
        if self._head_key is None:
            return self._weave.plan_merge(self.a_rev, self.b_rev)
        # There was a single head
        if self._head_key == self.a_key:
            state = 'new-a'
        elif self._head_key == self.b_key:
            state = 'new-b'
        else:
            raise AssertionError('There was an invalid head: %s != %s'
                                 % (self.b_key, self._head_key))
        head_rev = self._head_key[-1]
        head_lines = self.get_lines([head_rev])[head_rev]
        return ((state, line) for line in head_lines)
3062.2.1 by Aaron Bentley
Add support for plan-merge with a base
1636
3144.3.1 by Aaron Bentley
Implement LCA merge, with problematic conflict markers
1637
1638
class _PlanLCAMerge(_PlanMergeBase):
    """Plan a merge by comparing the two tips against their LCAs.

    This merge algorithm differs from _PlanMerge in that:
    1. comparisons are done against LCAs only
    2. cases where a contested line is new versus one LCA but old versus
       another are marked as conflicts, by emitting the line as conflicted-a
       or conflicted-b.

    This is faster, and hopefully produces more useful output.
    """

    def __init__(self, a_rev, b_rev, vf, key_prefix, graph):
        """Find the LCAs and pre-compute the matching blocks against them.

        :param a_rev: Revision-id of one revision to merge
        :param b_rev: Revision-id of the other revision to merge
        :param vf: A VersionedFiles containing both revisions
        :param key_prefix: A prefix for accessing keys in vf
        :param graph: Object whose find_lca() is asked for the LCAs of the
            two tip keys
        """
        _PlanMergeBase.__init__(self, a_rev, b_rev, vf, key_prefix)
        found = graph.find_lca(key_prefix + (a_rev,), key_prefix + (b_rev,))
        # Store plain revision ids: NULL_REVISION is kept as is, key tuples
        # are reduced to their last element.
        self.lcas = set()
        for lca_key in found:
            if lca_key == NULL_REVISION:
                self.lcas.add(lca_key)
            else:
                self.lcas.add(lca_key[-1])
        tips = ((a_rev, self.lines_a), (b_rev, self.lines_b))
        for lca in self.lcas:
            if _mod_revision.is_null(lca):
                # The null revision is compared as an empty text.
                base_lines = []
            else:
                base_lines = self.get_lines([lca])[lca]
            for tip_rev, tip_lines in tips:
                matcher = patiencediff.PatienceSequenceMatcher(
                    None, tip_lines, base_lines)
                self._cached_matching_blocks[(tip_rev, lca)] = list(
                    matcher.get_matching_blocks())

    def _determine_status(self, revision_id, unique_line_numbers):
        """Determines the status unique lines versus all lcas.

        Basically, determines why the line is unique to this revision.

        A line may be determined new, killed, or both.

        If a line is determined new, that means it was not present in at
        least one LCA, and is not present in the other merge revision.

        If a line is determined killed, that means the line was present in
        at least one LCA.

        If a line is killed and new, this indicates that the two merge
        revisions contain differing conflict resolutions.

        :param revision_id: The id of the revision in which the lines are
            unique
        :param unique_line_numbers: The line numbers of unique lines.
        :return: a tuple of (new_this, killed_other), both sets of line
            numbers
        """
        candidates = set(unique_line_numbers)
        new_this = set()
        killed_other = set()
        for lca in self.lcas:
            matching = self._get_matching_blocks(revision_id, lca)
            absent_from_lca, _unused = self._unique_lines(matching)
            new_this.update(candidates.intersection(absent_from_lca))
            killed_other.update(candidates.difference(absent_from_lca))
        return new_this, killed_other