~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/missing.py

  • Committer: John Arbash Meinel
  • Date: 2009-11-07 01:58:11 UTC
  • mto: This revision was merged to the branch mainline in revision 4842.
  • Revision ID: john@arbash-meinel.com-20091107015811-apybkqd40koa4b98
Get rid of the GraphIndexBuilder/BTreeBuilder._keys attribute.

This removes a set that grows O(N). We used it for some performance
stuff, because set.intersection is not efficient if other is not
a set. But we can work around that differently. It saves about 2MB
for a set with 100k items in it.

Show diffs side-by-side

added added

removed removed

Lines of Context:
12
12
#
13
13
# You should have received a copy of the GNU General Public License
14
14
# along with this program; if not, write to the Free Software
15
 
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
16
16
 
17
17
"""Display what revisions are missing in 'other' from 'this' and vice versa."""
18
18
 
19
 
import bzrlib.ui as ui
20
 
 
21
 
 
22
 
def iter_log_data(revisions, revision_source, verbose):
23
 
    last_tree = revision_source.revision_tree(None)
 
19
from bzrlib import (
 
20
    log,
 
21
    repository as _mod_repository,
 
22
    tsort,
 
23
    )
 
24
import bzrlib.revision as _mod_revision
 
25
 
 
26
 
 
27
def iter_log_revisions(revisions, revision_source, verbose):
 
28
    last_tree = revision_source.revision_tree(_mod_revision.NULL_REVISION)
24
29
    last_rev_id = None
25
 
    for revno, rev_id in revisions:
 
30
    for rev in revisions:
 
31
        # We need the following for backward compatibility (hopefully
 
32
        # this will be deprecated soon :-/) -- vila 080911
 
33
        if len(rev) == 2:
 
34
            revno, rev_id = rev
 
35
            merge_depth = 0
 
36
        else:
 
37
            revno, rev_id, merge_depth = rev
26
38
        rev = revision_source.get_revision(rev_id)
27
39
        if verbose:
28
 
            remote_tree = revision_source.revision_tree(rev_id)
29
 
            parent_rev_id = rev.parent_ids[0]
30
 
            if last_rev_id == parent_rev_id:
31
 
                parent_tree = last_tree
32
 
            else:
33
 
                parent_tree = revision_source.revision_tree(parent_rev_id)
34
 
            revision_tree = revision_source.revision_tree(rev_id)
35
 
            last_rev_id = rev_id
36
 
            last_tree = revision_tree
37
 
            delta = revision_tree.changes_from(parent_tree)
 
40
            delta = revision_source.get_revision_delta(rev_id)
38
41
        else:
39
42
            delta = None
40
 
        yield revno, rev, delta
41
 
 
42
 
 
43
 
def find_unmerged(local_branch, remote_branch):
44
 
    progress = ui.ui_factory.nested_progress_bar()
 
43
        yield log.LogRevision(rev, revno, merge_depth, delta=delta)
 
44
 
 
45
 
 
46
def find_unmerged(local_branch, remote_branch, restrict='all',
 
47
                  include_merges=False, backward=False,
 
48
                  local_revid_range=None, remote_revid_range=None):
 
49
    """Find revisions from each side that have not been merged.
 
50
 
 
51
    :param local_branch: Compare the history of local_branch
 
52
    :param remote_branch: versus the history of remote_branch, and determine
 
53
        mainline revisions which have not been merged.
 
54
    :param restrict: ('all', 'local', 'remote') If 'all', we will return the
 
55
        unique revisions from both sides. If 'local', we will return None
 
56
        for the remote revisions, similarly if 'remote' we will return None for
 
57
        the local revisions.
 
58
    :param include_merges: Show mainline revisions only if False,
 
59
        all revisions otherwise.
 
60
    :param backward: Show oldest versions first when True, newest versions
 
61
        first when False.
 
62
    :param local_revid_range: Revision-id range for filtering local_branch
 
63
        revisions (lower bound, upper bound)
 
64
    :param remote_revid_range: Revision-id range for filtering remote_branch
 
65
        revisions (lower bound, upper bound)
 
66
 
 
67
    :return: A list of [(revno, revision_id)] for the mainline revisions on
 
68
        each side.
 
69
    """
45
70
    local_branch.lock_read()
46
71
    try:
47
72
        remote_branch.lock_read()
48
73
        try:
49
 
            local_rev_history, local_rev_history_map = \
50
 
                _get_history(local_branch, progress, "local", 0)
51
 
            remote_rev_history, remote_rev_history_map = \
52
 
                _get_history(remote_branch, progress, "remote", 1)
53
 
            result = _shortcut(local_rev_history, remote_rev_history)
54
 
            if result is not None:
55
 
                local_extra, remote_extra = result
56
 
                local_extra = sorted_revisions(local_extra, 
57
 
                                               local_rev_history_map)
58
 
                remote_extra = sorted_revisions(remote_extra, 
59
 
                                                remote_rev_history_map)
60
 
                return local_extra, remote_extra
61
 
 
62
 
            local_ancestry = _get_ancestry(local_branch.repository, progress, 
63
 
                                           "local", 2, local_rev_history)
64
 
            remote_ancestry = _get_ancestry(remote_branch.repository, progress,
65
 
                                            "remote", 3, remote_rev_history)
66
 
            progress.update('pondering', 4, 5)
67
 
            extras = local_ancestry.symmetric_difference(remote_ancestry) 
68
 
            local_extra = extras.intersection(set(local_rev_history))
69
 
            remote_extra = extras.intersection(set(remote_rev_history))
70
 
            local_extra = sorted_revisions(local_extra, local_rev_history_map)
71
 
            remote_extra = sorted_revisions(remote_extra, 
72
 
                                            remote_rev_history_map)
73
 
                    
 
74
            return _find_unmerged(
 
75
                local_branch, remote_branch, restrict=restrict,
 
76
                include_merges=include_merges, backward=backward,
 
77
                local_revid_range=local_revid_range,
 
78
                remote_revid_range=remote_revid_range)
74
79
        finally:
75
80
            remote_branch.unlock()
76
81
    finally:
77
82
        local_branch.unlock()
78
 
        progress.finished()
79
 
    return (local_extra, remote_extra)
80
 
 
81
 
def _shortcut(local_rev_history, remote_rev_history):
82
 
    local_history = set(local_rev_history)
83
 
    remote_history = set(remote_rev_history)
84
 
    if len(local_rev_history) == 0:
85
 
        return set(), remote_history
86
 
    elif len(remote_rev_history) == 0:
87
 
        return local_history, set()
88
 
    elif local_rev_history[-1] in remote_history:
89
 
        return set(), _after(remote_rev_history, local_rev_history)
90
 
    elif remote_rev_history[-1] in local_history:
91
 
        return _after(local_rev_history, remote_rev_history), set()
92
 
    else:
93
 
        return None
94
 
 
95
 
def _after(larger_history, smaller_history):
96
 
    return set(larger_history[larger_history.index(smaller_history[-1])+1:])
97
 
 
98
 
def _get_history(branch, progress, label, step):
99
 
    progress.update('%s history' % label, step, 5)
100
 
    rev_history = branch.revision_history()
101
 
    rev_history_map = dict(
102
 
        [(rev, rev_history.index(rev) + 1)
103
 
         for rev in rev_history])
104
 
    return rev_history, rev_history_map
105
 
 
106
 
def _get_ancestry(repository, progress, label, step, rev_history):
107
 
    progress.update('%s ancestry' % label, step, 5)
108
 
    if len(rev_history) > 0:
109
 
        ancestry = set(repository.get_ancestry(rev_history[-1]))
110
 
    else:
111
 
        ancestry = set()
112
 
    return ancestry
113
 
    
 
83
 
 
84
 
 
85
def _enumerate_mainline(ancestry, graph, tip_revno, tip, backward=True):
 
86
    """Enumerate the mainline revisions for these revisions.
 
87
 
 
88
    :param ancestry: A set of revisions that we care about
 
89
    :param graph: A Graph which lets us find the parents for a revision
 
90
    :param tip_revno: The revision number for the tip revision
 
91
    :param tip: The tip of mainline
 
92
    :param backward: Show oldest versions first when True, newest versions
 
93
        first when False.
 
94
    :return: [(revno, revision_id)] for all revisions in ancestry that
 
95
        are left-hand parents from tip, or None if ancestry is None.
 
96
    """
 
97
    if ancestry is None:
 
98
        return None
 
99
    if not ancestry: #Empty ancestry, no need to do any work
 
100
        return []
 
101
 
 
102
    # Optionally, we could make 1 call to graph.get_parent_map with all
 
103
    # ancestors. However that will often check many more parents than we
 
104
    # actually need, and the Graph is likely to already have the parents cached
 
105
    # anyway.
 
106
    mainline = []
 
107
    cur = tip
 
108
    cur_revno = tip_revno
 
109
    while cur in ancestry:
 
110
        parent_map = graph.get_parent_map([cur])
 
111
        parents = parent_map.get(cur)
 
112
        if not parents:
 
113
            break # Ghost, we are done
 
114
        mainline.append((str(cur_revno), cur))
 
115
        cur = parents[0]
 
116
        cur_revno -= 1
 
117
    if not backward:
 
118
        mainline.reverse()
 
119
    return mainline
 
120
 
 
121
 
 
122
def _enumerate_with_merges(branch, ancestry, graph, tip_revno, tip,
 
123
                           backward=True):
 
124
    """Enumerate the revisions for the ancestry.
 
125
 
 
126
    :param branch: The branch we care about
 
127
    :param ancestry: A set of revisions that we care about
 
128
    :param graph: A Graph which lets us find the parents for a revision
 
129
    :param tip_revno: The revision number for the tip revision
 
130
    :param tip: The tip of the ancestry
 
131
    :param backward: Show oldest versions first when True, newest versions
 
132
        first when False.
 
133
    :return: [(revno, revision_id)] for all revisions in ancestry that
 
134
        are parents from tip, or None if ancestry is None.
 
135
    """
 
136
    if ancestry is None:
 
137
        return None
 
138
    if not ancestry: #Empty ancestry, no need to do any work
 
139
        return []
 
140
 
 
141
    merge_sorted_revisions = branch.iter_merge_sorted_revisions()
 
142
    # Now that we got the correct revnos, keep only the relevant
 
143
    # revisions.
 
144
    merge_sorted_revisions = [
 
145
        # log.reverse_by_depth expects seq_num to be present, but it is
 
146
        # stripped by iter_merge_sorted_revisions()
 
147
        (0, revid, n, d, e) for revid, n, d, e in merge_sorted_revisions
 
148
        if revid in ancestry]
 
149
    if not backward:
 
150
        merge_sorted_revisions = log.reverse_by_depth(merge_sorted_revisions)
 
151
    revline = []
 
152
    for seq, rev_id, merge_depth, revno, end_of_merge in merge_sorted_revisions:
 
153
        revline.append(('.'.join(map(str, revno)), rev_id, merge_depth))
 
154
    return revline
 
155
 
 
156
 
 
157
def _filter_revs(graph, revs, revid_range):
 
158
    if revid_range is None or revs is None:
 
159
        return revs
 
160
    return [rev for rev in revs
 
161
        if graph.is_between(rev[1], revid_range[0], revid_range[1])]
 
162
 
 
163
 
 
164
def _find_unmerged(local_branch, remote_branch, restrict,
 
165
                   include_merges, backward,
 
166
                   local_revid_range=None, remote_revid_range=None):
 
167
    """See find_unmerged.
 
168
 
 
169
    The branches should already be locked before entering.
 
170
    """
 
171
    local_revno, local_revision_id = local_branch.last_revision_info()
 
172
    remote_revno, remote_revision_id = remote_branch.last_revision_info()
 
173
    if local_revno == remote_revno and local_revision_id == remote_revision_id:
 
174
        # A simple shortcut when the tips are at the same point
 
175
        return [], []
 
176
    graph = local_branch.repository.get_graph(remote_branch.repository)
 
177
    if restrict == 'remote':
 
178
        local_extra = None
 
179
        remote_extra = graph.find_unique_ancestors(remote_revision_id,
 
180
                                                   [local_revision_id])
 
181
    elif restrict == 'local':
 
182
        remote_extra = None
 
183
        local_extra = graph.find_unique_ancestors(local_revision_id,
 
184
                                                  [remote_revision_id])
 
185
    else:
 
186
        if restrict != 'all':
 
187
            raise ValueError('param restrict not one of "all", "local",'
 
188
                             ' "remote": %r' % (restrict,))
 
189
        local_extra, remote_extra = graph.find_difference(local_revision_id,
 
190
                                                          remote_revision_id)
 
191
    if include_merges:
 
192
        locals = _enumerate_with_merges(local_branch, local_extra,
 
193
                                        graph, local_revno,
 
194
                                        local_revision_id, backward)
 
195
        remotes = _enumerate_with_merges(remote_branch, remote_extra,
 
196
                                         graph, remote_revno,
 
197
                                         remote_revision_id, backward)
 
198
    else:
 
199
        # Now that we have unique ancestors, compute just the mainline, and
 
200
        # generate revnos for them.
 
201
        locals = _enumerate_mainline(local_extra, graph, local_revno,
 
202
                                     local_revision_id, backward)
 
203
        remotes = _enumerate_mainline(remote_extra, graph, remote_revno,
 
204
                                      remote_revision_id, backward)
 
205
    return _filter_revs(graph, locals, local_revid_range), _filter_revs(graph,
 
206
        remotes, remote_revid_range)
 
207
 
114
208
 
115
209
def sorted_revisions(revisions, history_map):
116
210
    revisions = [(history_map[r],r) for r in revisions]