~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/graph.py

Committer: Patch Queue Manager
Date: 2011-10-09 13:52:06 UTC
mfrom: (6202.1.3 revno-revision)
Revision ID: pqm@pqm.ubuntu.com-20111009135206-t3utsln6mtzv9eut

(jelmer) Add a --revision argument to 'bzr revno'. (Jelmer Vernooij)

files added:
bzrlib/estimate_compressed_size.py

bzrlib/filter_tree.py

bzrlib/help_topics/en/url-special-chars.txt

bzrlib/smart/signals.py

bzrlib/tests/blackbox/test_branches.py

bzrlib/tests/blackbox/test_export_pot.py

bzrlib/tests/per_intertree/test_file_content_matches.py

bzrlib/tests/per_repository_vf/test_fileid_involved.py

bzrlib/tests/per_repository_vf/test_refresh_data.py

bzrlib/tests/test_estimate_compressed_size.py

bzrlib/tests/test_features.py

bzrlib/tests/test_filter_tree.py

bzrlib/tests/test_smart_signals.py

doc/en/release-notes/bzr-2.5.txt

doc/en/whats-new/template.txt

doc/en/whats-new/whats-new-in-2.5.txt

po/bzr.pot

files removed:
bzrlib/tests/per_repository/test_fileid_involved.py

files renamed:
tools/build_mo.py => bzrlib/bzr_distutils.py

bzrlib/tests/per_repository/test_merge_directive.py => bzrlib/tests/per_repository_vf/test_merge_directive.py

files modified:
bzr

bzrlib/__init__.py

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/commit_signature_commands.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/controldir.py

bzrlib/debug.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/export_pot.py

bzrlib/fetch.py

bzrlib/foreign.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/hooks.py

bzrlib/i18n.py

bzrlib/info.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/library_state.py

bzrlib/lock.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/launchpad/test_lp_api_lite.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/weave_fmt/branch.py

bzrlib/plugins/weave_fmt/bzrdir.py

bzrlib/plugins/weave_fmt/repository.py

bzrlib/plugins/weave_fmt/workingtree.py

bzrlib/push.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/send.py

bzrlib/shelf_ui.py

bzrlib/smart/__init__.py

bzrlib/smart/bzrdir.py

bzrlib/smart/medium.py

bzrlib/smart/repository.py

bzrlib/smart/server.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/tag.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_resolve.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/features.py

bzrlib/tests/fixtures.py

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/http_utils.py

bzrlib/tests/matchers.py

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_controldir/__init__.py

bzrlib/tests/per_controldir/test_controldir.py

bzrlib/tests/per_controldir_colo/test_unsupported.py

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository_reference/test_graph.py

bzrlib/tests/per_repository_vf/__init__.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_export.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_is_executable.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_symlinks.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/script.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_export.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_http.py

bzrlib/tests/test_i18n.py

bzrlib/tests/test_import_tariff.py

bzrlib/tests/test_index.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_matchers.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_script.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_server.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_test_server.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_treeshape.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/transport_util.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/gio_transport.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/pathfilter.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/ui/__init__.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/version_info_formats/__init__.py

bzrlib/vf_repository.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_3.py

bzrlib/workingtree_4.py

doc/developers/HACKING.txt

doc/developers/configuration.txt

doc/developers/contribution-quickstart.txt

doc/developers/releasing.txt

doc/developers/testing.txt

doc/en/_templates/index.html

doc/en/index.txt

doc/en/mini-tutorial/index.txt

doc/en/release-notes/bzr-2.4.txt

doc/en/user-guide/gpg_signatures.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/undoing_mistakes.txt

setup.py

tools/generate_docs.py

Show diffs side-by-side

added added

removed removed

bzrlib/graph.py

def __repr__(self):

return 'DictParentsProvider(%r)' % self.ancestry

# Note: DictParentsProvider does not implement get_cached_parent_map

# Arguably, the data is clearly cached in memory. However, this class

# is mostly used for testing, and it keeps the tests clean to not

# change it.

def get_parent_map(self, keys):

"""See StackedParentsProvider.get_parent_map"""

ancestry = self.ancestry

return dict((k, ancestry[k]) for k in keys if k in ancestry)

return dict([(k, ancestry[k]) for k in keys if k in ancestry])

class StackedParentsProvider(object):

"""A parents provider which stacks (or unions) multiple providers.

The providers are queried in the order of the provided parent_providers.

"""

def __init__(self, parent_providers):

self._parent_providers = parent_providers

"""

found = {}

remaining = set(keys)

# This adds getattr() overhead to each get_parent_map call. However,

100

# this is StackedParentsProvider, which means we're dealing with I/O

101

# (either local indexes, or remote RPCs), so CPU overhead should be

102

# minimal.

103

for parents_provider in self._parent_providers:

104

get_cached = getattr(parents_provider, 'get_cached_parent_map',

105

None)

106

if get_cached is None:

107

continue

108

new_found = get_cached(remaining)

109

found.update(new_found)

110

remaining.difference_update(new_found)

111

if not remaining:

112

break

113

if not remaining:

114

return found

115

for parents_provider in self._parent_providers:

116

new_found = parents_provider.get_parent_map(remaining)

117

found.update(new_found)

150

171

return None

151

172

return dict(self._cache)

152

173

174

def get_cached_parent_map(self, keys):

175

"""Return items from the cache.

176

177

This returns the same info as get_parent_map, but explicitly does not

178

invoke the supplied ParentsProvider to search for uncached values.

179

"""

180

cache = self._cache

181

if cache is None:

182

return {}

183

return dict([(key, cache[key]) for key in keys if key in cache])

184

153

185

def get_parent_map(self, keys):

154

186

"""See StackedParentsProvider.get_parent_map."""

155

187

cache = self._cache

1419

1451

parents_of_found = set()

1420

1452

# revisions may contain nodes that point to other nodes in revisions:

1421

1453

# we want to filter them out.

1422

self.seen.update(revisions)

1454

seen = self.seen

1455

seen.update(revisions)

1423

1456

parent_map = self._parents_provider.get_parent_map(revisions)

1424

1457

found_revisions.update(parent_map)

1425

1458

for rev_id, parents in parent_map.iteritems():

1426

1459

if parents is None:

1427

1460

continue

1428

new_found_parents = [p for p in parents if p not in self.seen]

1461

new_found_parents = [p for p in parents if p not in seen]

1429

1462

if new_found_parents:

1430

1463

# Calling set.update() with an empty generator is actually

1431

1464

# rather expensive.

1891

1924

limit=self.limit)

1892

1925

1893

1926

1927

def invert_parent_map(parent_map):

1928

"""Given a map from child => parents, create a map of parent=>children"""

1929

child_map = {}

1930

for child, parents in parent_map.iteritems():

1931

for p in parents:

1932

# Any given parent is likely to have only a small handful

1933

# of children, many will have only one. So we avoid mem overhead of

1934

# a list, in exchange for extra copying of tuples

1935

if p not in child_map:

1936

child_map[p] = (child,)

1937

else:

1938

child_map[p] = child_map[p] + (child,)

1939

return child_map

1940

1941

1942

def _find_possible_heads(parent_map, tip_keys, depth):

1943

"""Walk backwards (towards children) through the parent_map.

1944

1945

This finds 'heads' that will hopefully succinctly describe our search

1946

graph.

1947

"""

1948

child_map = invert_parent_map(parent_map)

1949

heads = set()

1950

current_roots = tip_keys

1951

walked = set(current_roots)

1952

while current_roots and depth > 0:

1953

depth -= 1

1954

children = set()

1955

children_update = children.update

1956

for p in current_roots:

1957

# Is it better to pre- or post- filter the children?

1958

try:

1959

children_update(child_map[p])

1960

except KeyError:

1961

heads.add(p)

1962

# If we've seen a key before, we don't want to walk it again. Note that

1963

# 'children' stays relatively small while 'walked' grows large. So

1964

# don't use 'difference_update' here which has to walk all of 'walked'.

1965

# '.difference' is smart enough to walk only children and compare it to

1966

# walked.

1967

children = children.difference(walked)

1968

walked.update(children)

1969

current_roots = children

1970

if current_roots:

1971

# We walked to the end of depth, so these are the new tips.

1972

heads.update(current_roots)

1973

return heads

1974

1975

1976

def _run_search(parent_map, heads, exclude_keys):

1977

"""Given a parent map, run a _BreadthFirstSearcher on it.

1978

1979

Start at heads, walk until you hit exclude_keys. As a further improvement,

1980

watch for any heads that you encounter while walking, which means they were

1981

not heads of the search.

1982

1983

This is mostly used to generate a succinct recipe for how to walk through

1984

most of parent_map.

1985

1986

:return: (_BreadthFirstSearcher, set(heads_encountered_by_walking))

1987

"""

1988

g = Graph(DictParentsProvider(parent_map))

1989

s = g._make_breadth_first_searcher(heads)

1990

found_heads = set()

1991

while True:

1992

try:

1993

next_revs = s.next()

1994

except StopIteration:

1995

break

1996

for parents in s._current_parents.itervalues():

1997

f_heads = heads.intersection(parents)

1998

if f_heads:

1999

found_heads.update(f_heads)

2000

stop_keys = exclude_keys.intersection(next_revs)

2001

if stop_keys:

2002

s.stop_searching_any(stop_keys)

2003

for parents in s._current_parents.itervalues():

2004

f_heads = heads.intersection(parents)

2005

if f_heads:

2006

found_heads.update(f_heads)

2007

return s, found_heads

2008

2009

2010

def limited_search_result_from_parent_map(parent_map, missing_keys, tip_keys,

2011

depth):

2012

"""Transform a parent_map that is searching 'tip_keys' into an

2013

approximate SearchResult.

2014

2015

We should be able to generate a SearchResult from a given set of starting

2016

keys, that covers a subset of parent_map that has the last step pointing at

2017

tip_keys. This is to handle the case that really-long-searches shouldn't be

2018

started from scratch on each get_parent_map request, but we *do* want to

2019

filter out some of the keys that we've already seen, so we don't get

2020

information that we already know about on every request.

2021

2022

The server will validate the search (that starting at start_keys and

2023

stopping at stop_keys yields the exact key_count), so we have to be careful

2024

to give an exact recipe.

2025

2026

Basic algorithm is:

2027

1) Invert parent_map to get child_map (todo: have it cached and pass it

2028

in)

2029

2) Starting at tip_keys, walk towards children for 'depth' steps.

2030

3) At that point, we have the 'start' keys.

2031

4) Start walking parent_map from 'start' keys, counting how many keys

2032

are seen, and generating stop_keys for anything that would walk

2033

outside of the parent_map.

2034

2035

:param parent_map: A map from {child_id: (parent_ids,)}

2036

:param missing_keys: parent_ids that we know are unavailable

2037

:param tip_keys: the revision_ids that we are searching

2038

:param depth: How far back to walk.

2039

"""

2040

if not parent_map:

2041

# No search to send, because we haven't done any searching yet.

2042

return [], [], 0

2043

heads = _find_possible_heads(parent_map, tip_keys, depth)

2044

s, found_heads = _run_search(parent_map, heads, set(tip_keys))

2045

_, start_keys, exclude_keys, key_count = s.get_result().get_recipe()

2046

if found_heads:

2047

# Anything in found_heads are redundant start_keys, we hit them while

2048

# walking, so we can exclude them from the start list.

2049

start_keys = set(start_keys).difference(found_heads)

2050

return start_keys, exclude_keys, key_count

2051

2052

2053

def search_result_from_parent_map(parent_map, missing_keys):

2054

"""Transform a parent_map into SearchResult information."""

2055

if not parent_map:

2056

# parent_map is empty or None, simple search result

2057

return [], [], 0

2058

# start_set is all the keys in the cache

2059

start_set = set(parent_map)

2060

# result set is all the references to keys in the cache

2061

result_parents = set()

2062

for parents in parent_map.itervalues():

2063

result_parents.update(parents)

2064

stop_keys = result_parents.difference(start_set)

2065

# We don't need to send ghosts back to the server as a position to

2066

# stop either.

2067

stop_keys.difference_update(missing_keys)

2068

key_count = len(parent_map)

2069

if (revision.NULL_REVISION in result_parents

2070

and revision.NULL_REVISION in missing_keys):

2071

# If we pruned NULL_REVISION from the stop_keys because it's also

2072

# in our cache of "missing" keys we need to increment our key count

2073

# by 1, because the reconstituted SearchResult on the server will

2074

# still consider NULL_REVISION to be an included key.

2075

key_count += 1

2076

included_keys = start_set.intersection(result_parents)

2077

start_set.difference_update(included_keys)

2078

return start_set, stop_keys, key_count

2079

2080

1894

2081

def collapse_linear_regions(parent_map):

1895

2082

"""Collapse regions of the graph that are 'linear'.

1896

2083

Older »