~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/graph.py

Committer: Martin Packman
Date: 2011-12-08 19:00:14 UTC
mto: This revision was merged to the branch mainline in revision 6359.
Revision ID: martin.packman@canonical.com-20111208190014-mi8jm6v7jygmhb0r

Use --include-duplicates for make update-pot which already combines multiple msgid strings prettily

files added:
bzrlib/plugins/po_merge

bzrlib/plugins/po_merge/README

bzrlib/plugins/po_merge/__init__.py

bzrlib/plugins/po_merge/po_merge.py

bzrlib/plugins/po_merge/tests

bzrlib/plugins/po_merge/tests/__init__.py

bzrlib/plugins/po_merge/tests/test_po_merge.py

bzrlib/tests/test_vf_search.py

bzrlib/vf_search.py

doc/developers/new-config-rationale.txt

files removed:
bzrlib/help_topics/en/location-alias.txt

files modified:
Makefile

bzrlib/__init__.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bzrdir.py

bzrlib/config.py

bzrlib/directory_service.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/export_pot.py

bzrlib/fetch.py

bzrlib/foreign.py

bzrlib/graph.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/debug-flags.txt

bzrlib/hooks.py

bzrlib/merge.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/remote.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/status.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/features.py

bzrlib/tests/fixtures.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_vf/test_fetch.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export_pot.py

bzrlib/tests/test_features.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_server.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_test_server.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_workingtree_4.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/local.py

bzrlib/transport/ssh.py

bzrlib/vf_repository.py

bzrlib/win32utils.py

bzrlib/workingtree_4.py

doc/developers/configuration.txt

doc/developers/network-protocol.txt

doc/developers/plans.txt

doc/en/release-notes/bzr-2.4.txt

doc/en/release-notes/bzr-2.5.txt

po/bzr.pot

Show diffs side-by-side

added added

removed removed

bzrlib/graph.py

1346

return ('_BreadthFirstSearcher(iterations=%d, %s,'

1347

' seen=%r)' % (self._iterations, search, list(self.seen)))

1348

1349

def get_result(self):

1350

"""Get a SearchResult for the current state of this searcher.

1349

def get_state(self):

1350

"""Get the current state of this searcher.

1351

1352

:return: A SearchResult for this search so far. The SearchResult is

1353

static - the search can be advanced and the search result will not

1354

be invalidated or altered.

1352

:return: Tuple with started keys, excludes and included keys

1355

1353

"""

1356

1354

if self._returning == 'next':

1357

1355

# We have to know the current nodes children to be able to list the

1368

1366

next_query = self._next_query

1369

1367

excludes = self._stopped_keys.union(next_query)

1370

1368

included_keys = self.seen.difference(excludes)

1371

return SearchResult(self._started_keys, excludes, len(included_keys),

1369

return self._started_keys, excludes, included_keys

1370

1371

def _get_result(self):

1372

"""Get a SearchResult for the current state of this searcher.

1373

1374

:return: A SearchResult for this search so far. The SearchResult is

1375

static - the search can be advanced and the search result will not

1376

be invalidated or altered.

1377

"""

1378

from bzrlib.vf_search import SearchResult

1379

(started_keys, excludes, included_keys) = self.get_state()

1380

return SearchResult(started_keys, excludes, len(included_keys),

1372

1381

included_keys)

1373

1382

1374

1383

def step(self):

1583

1592

return revs, ghosts

1584

1593

1585

1594

1586

class AbstractSearchResult(object):

1587

"""The result of a search, describing a set of keys.

1588

1589

Search results are typically used as the 'fetch_spec' parameter when

1590

fetching revisions.

1591

1592

:seealso: AbstractSearch

1593

"""

1594

1595

def get_recipe(self):

1596

"""Return a recipe that can be used to replay this search.

1597

1598

The recipe allows reconstruction of the same results at a later date.

1599

1600

:return: A tuple of `(search_kind_str, *details)`. The details vary by

1601

kind of search result.

1602

"""

1603

raise NotImplementedError(self.get_recipe)

1604

1605

def get_network_struct(self):

1606

"""Return a tuple that can be transmitted via the HPSS protocol."""

1607

raise NotImplementedError(self.get_network_struct)

1608

1609

def get_keys(self):

1610

"""Return the keys found in this search.

1611

1612

:return: A set of keys.

1613

"""

1614

raise NotImplementedError(self.get_keys)

1615

1616

def is_empty(self):

1617

"""Return false if the search lists 1 or more revisions."""

1618

raise NotImplementedError(self.is_empty)

1619

1620

def refine(self, seen, referenced):

1621

"""Create a new search by refining this search.

1622

1623

:param seen: Revisions that have been satisfied.

1624

:param referenced: Revision references observed while satisfying some

1625

of this search.

1626

:return: A search result.

1627

"""

1628

raise NotImplementedError(self.refine)

1629

1630

1631

class AbstractSearch(object):

1632

"""A search that can be executed, producing a search result.

1633

1634

:seealso: AbstractSearchResult

1635

"""

1636

1637

def execute(self):

1638

"""Construct a network-ready search result from this search description.

1639

1640

This may take some time to search repositories, etc.

1641

1642

:return: A search result (an object that implements

1643

AbstractSearchResult's API).

1644

"""

1645

raise NotImplementedError(self.execute)

1646

1647

1648

class SearchResult(AbstractSearchResult):

1649

"""The result of a breadth first search.

1650

1651

A SearchResult provides the ability to reconstruct the search or access a

1652

set of the keys the search found.

1653

"""

1654

1655

def __init__(self, start_keys, exclude_keys, key_count, keys):

1656

"""Create a SearchResult.

1657

1658

:param start_keys: The keys the search started at.

1659

:param exclude_keys: The keys the search excludes.

1660

:param key_count: The total number of keys (from start to but not

1661

including exclude).

1662

:param keys: The keys the search found. Note that in future we may get

1663

a SearchResult from a smart server, in which case the keys list is

1664

not necessarily immediately available.

1665

"""

1666

self._recipe = ('search', start_keys, exclude_keys, key_count)

1667

self._keys = frozenset(keys)

1668

1669

def __repr__(self):

1670

kind, start_keys, exclude_keys, key_count = self._recipe

1671

if len(start_keys) > 5:

1672

start_keys_repr = repr(list(start_keys)[:5])[:-1] + ', ...]'

1673

else:

1674

start_keys_repr = repr(start_keys)

1675

if len(exclude_keys) > 5:

1676

exclude_keys_repr = repr(list(exclude_keys)[:5])[:-1] + ', ...]'

1677

else:

1678

exclude_keys_repr = repr(exclude_keys)

1679

return '<%s %s:(%s, %s, %d)>' % (self.__class__.__name__,

1680

kind, start_keys_repr, exclude_keys_repr, key_count)

1681

1682

def get_recipe(self):

1683

"""Return a recipe that can be used to replay this search.

1684

1685

The recipe allows reconstruction of the same results at a later date

1686

without knowing all the found keys. The essential elements are a list

1687

of keys to start and to stop at. In order to give reproducible

1688

results when ghosts are encountered by a search they are automatically

1689

added to the exclude list (or else ghost filling may alter the

1690

results).

1691

1692

:return: A tuple ('search', start_keys_set, exclude_keys_set,

1693

revision_count). To recreate the results of this search, create a

1694

breadth first searcher on the same graph starting at start_keys.

1695

Then call next() (or next_with_ghosts()) repeatedly, and on every

1696

result, call stop_searching_any on any keys from the exclude_keys

1697

set. The revision_count value acts as a trivial cross-check - the

1698

found revisions of the new search should have as many elements as

1699

revision_count. If it does not, then additional revisions have been

1700

ghosted since the search was executed the first time and the second

1701

time.

1702

"""

1703

return self._recipe

1704

1705

def get_network_struct(self):

1706

start_keys = ' '.join(self._recipe[1])

1707

stop_keys = ' '.join(self._recipe[2])

1708

count = str(self._recipe[3])

1709

return (self._recipe[0], '\n'.join((start_keys, stop_keys, count)))

1710

1711

def get_keys(self):

1712

"""Return the keys found in this search.

1713

1714

:return: A set of keys.

1715

"""

1716

return self._keys

1717

1718

def is_empty(self):

1719

"""Return false if the search lists 1 or more revisions."""

1720

return self._recipe[3] == 0

1721

1722

def refine(self, seen, referenced):

1723

"""Create a new search by refining this search.

1724

1725

:param seen: Revisions that have been satisfied.

1726

:param referenced: Revision references observed while satisfying some

1727

of this search.

1728

"""

1729

start = self._recipe[1]

1730

exclude = self._recipe[2]

1731

count = self._recipe[3]

1732

keys = self.get_keys()

1733

# New heads = referenced + old heads - seen things - exclude

1734

pending_refs = set(referenced)

1735

pending_refs.update(start)

1736

pending_refs.difference_update(seen)

1737

pending_refs.difference_update(exclude)

1738

# New exclude = old exclude + satisfied heads

1739

seen_heads = start.intersection(seen)

1740

exclude.update(seen_heads)

1741

# keys gets seen removed

1742

keys = keys - seen

1743

# length is reduced by len(seen)

1744

count -= len(seen)

1745

return SearchResult(pending_refs, exclude, count, keys)

1746

1747

1748

class PendingAncestryResult(AbstractSearchResult):

1749

"""A search result that will reconstruct the ancestry for some graph heads.

1750

1751

Unlike SearchResult, this doesn't hold the complete search result in

1752

memory, it just holds a description of how to generate it.

1753

"""

1754

1755

def __init__(self, heads, repo):

1756

"""Constructor.

1757

1758

:param heads: an iterable of graph heads.

1759

:param repo: a repository to use to generate the ancestry for the given

1760

heads.

1761

"""

1762

self.heads = frozenset(heads)

1763

self.repo = repo

1764

1765

def __repr__(self):

1766

if len(self.heads) > 5:

1767

heads_repr = repr(list(self.heads)[:5])[:-1]

1768

heads_repr += ', <%d more>...]' % (len(self.heads) - 5,)

1769

else:

1770

heads_repr = repr(self.heads)

1771

return '<%s heads:%s repo:%r>' % (

1772

self.__class__.__name__, heads_repr, self.repo)

1773

1774

def get_recipe(self):

1775

"""Return a recipe that can be used to replay this search.

1776

1777

The recipe allows reconstruction of the same results at a later date.

1778

1779

:seealso: SearchResult.get_recipe

1780

1781

:return: A tuple ('proxy-search', start_keys_set, set(), -1)

1782

To recreate this result, create a PendingAncestryResult with the

1783

start_keys_set.

1784

"""

1785

return ('proxy-search', self.heads, set(), -1)

1786

1787

def get_network_struct(self):

1788

parts = ['ancestry-of']

1789

parts.extend(self.heads)

1790

return parts

1791

1792

def get_keys(self):

1793

"""See SearchResult.get_keys.

1794

1795

Returns all the keys for the ancestry of the heads, excluding

1796

NULL_REVISION.

1797

"""

1798

return self._get_keys(self.repo.get_graph())

1799

1800

def _get_keys(self, graph):

1801

NULL_REVISION = revision.NULL_REVISION

1802

keys = [key for (key, parents) in graph.iter_ancestry(self.heads)

1803

if key != NULL_REVISION and parents is not None]

1804

return keys

1805

1806

def is_empty(self):

1807

"""Return false if the search lists 1 or more revisions."""

1808

if revision.NULL_REVISION in self.heads:

1809

return len(self.heads) == 1

1810

else:

1811

return len(self.heads) == 0

1812

1813

def refine(self, seen, referenced):

1814

"""Create a new search by refining this search.

1815

1816

:param seen: Revisions that have been satisfied.

1817

:param referenced: Revision references observed while satisfying some

1818

of this search.

1819

"""

1820

referenced = self.heads.union(referenced)

1821

return PendingAncestryResult(referenced - seen, self.repo)

1822

1823

1824

class EmptySearchResult(AbstractSearchResult):

1825

"""An empty search result."""

1826

1827

def is_empty(self):

1828

return True

1829

1830

1831

class EverythingResult(AbstractSearchResult):

1832

"""A search result that simply requests everything in the repository."""

1833

1834

def __init__(self, repo):

1835

self._repo = repo

1836

1837

def __repr__(self):

1838

return '%s(%r)' % (self.__class__.__name__, self._repo)

1839

1840

def get_recipe(self):

1841

raise NotImplementedError(self.get_recipe)

1842

1843

def get_network_struct(self):

1844

return ('everything',)

1845

1846

def get_keys(self):

1847

if 'evil' in debug.debug_flags:

1848

from bzrlib import remote

1849

if isinstance(self._repo, remote.RemoteRepository):

1850

# warn developers (not users) not to do this

1851

trace.mutter_callsite(

1852

2, "EverythingResult(RemoteRepository).get_keys() is slow.")

1853

return self._repo.all_revision_ids()

1854

1855

def is_empty(self):

1856

# It's ok for this to wrongly return False: the worst that can happen

1857

# is that RemoteStreamSource will initiate a get_stream on an empty

1858

# repository. And almost all repositories are non-empty.

1859

return False

1860

1861

def refine(self, seen, referenced):

1862

heads = set(self._repo.all_revision_ids())

1863

heads.difference_update(seen)

1864

heads.update(referenced)

1865

return PendingAncestryResult(heads, self._repo)

1866

1867

1868

class EverythingNotInOther(AbstractSearch):

1869

"""Find all revisions that are in one repo but not the other."""

1870

1871

def __init__(self, to_repo, from_repo, find_ghosts=False):

1872

self.to_repo = to_repo

1873

self.from_repo = from_repo

1874

self.find_ghosts = find_ghosts

1875

1876

def execute(self):

1877

return self.to_repo.search_missing_revision_ids(

1878

self.from_repo, find_ghosts=self.find_ghosts)

1879

1880

1881

class NotInOtherForRevs(AbstractSearch):

1882

"""Find all revisions missing in one repo for some specific heads."""

1883

1884

def __init__(self, to_repo, from_repo, required_ids, if_present_ids=None,

1885

find_ghosts=False, limit=None):

1886

"""Constructor.

1887

1888

:param required_ids: revision IDs of heads that must be found, or else

1889

the search will fail with NoSuchRevision. All revisions in their

1890

ancestry not already in the other repository will be included in

1891

the search result.

1892

:param if_present_ids: revision IDs of heads that may be absent in the

1893

source repository. If present, then their ancestry not already

1894

found in other will be included in the search result.

1895

:param limit: maximum number of revisions to fetch

1896

"""

1897

self.to_repo = to_repo

1898

self.from_repo = from_repo

1899

self.find_ghosts = find_ghosts

1900

self.required_ids = required_ids

1901

self.if_present_ids = if_present_ids

1902

self.limit = limit

1903

1904

def __repr__(self):

1905

if len(self.required_ids) > 5:

1906

reqd_revs_repr = repr(list(self.required_ids)[:5])[:-1] + ', ...]'

1907

else:

1908

reqd_revs_repr = repr(self.required_ids)

1909

if self.if_present_ids and len(self.if_present_ids) > 5:

1910

ifp_revs_repr = repr(list(self.if_present_ids)[:5])[:-1] + ', ...]'

1911

else:

1912

ifp_revs_repr = repr(self.if_present_ids)

1913

1914

return ("<%s from:%r to:%r find_ghosts:%r req'd:%r if-present:%r"

1915

"limit:%r>") % (

1916

self.__class__.__name__, self.from_repo, self.to_repo,

1917

self.find_ghosts, reqd_revs_repr, ifp_revs_repr,

1918

self.limit)

1919

1920

def execute(self):

1921

return self.to_repo.search_missing_revision_ids(

1922

self.from_repo, revision_ids=self.required_ids,

1923

if_present_ids=self.if_present_ids, find_ghosts=self.find_ghosts,

1924

limit=self.limit)

1925

1926

1927

1595

def invert_parent_map(parent_map):

1928

1596

"""Given a map from child => parents, create a map of parent=>children"""

1929

1597

child_map = {}

1939

1607

return child_map

1940

1608

1941

1609

1942

def _find_possible_heads(parent_map, tip_keys, depth):

1943

"""Walk backwards (towards children) through the parent_map.

1944

1945

This finds 'heads' that will hopefully succinctly describe our search

1946

graph.

1947

"""

1948

child_map = invert_parent_map(parent_map)

1949

heads = set()

1950

current_roots = tip_keys

1951

walked = set(current_roots)

1952

while current_roots and depth > 0:

1953

depth -= 1

1954

children = set()

1955

children_update = children.update

1956

for p in current_roots:

1957

# Is it better to pre- or post- filter the children?

1958

try:

1959

children_update(child_map[p])

1960

except KeyError:

1961

heads.add(p)

1962

# If we've seen a key before, we don't want to walk it again. Note that

1963

# 'children' stays relatively small while 'walked' grows large. So

1964

# don't use 'difference_update' here which has to walk all of 'walked'.

1965

# '.difference' is smart enough to walk only children and compare it to

1966

# walked.

1967

children = children.difference(walked)

1968

walked.update(children)

1969

current_roots = children

1970

if current_roots:

1971

# We walked to the end of depth, so these are the new tips.

1972

heads.update(current_roots)

1973

return heads

1974

1975

1976

def _run_search(parent_map, heads, exclude_keys):

1977

"""Given a parent map, run a _BreadthFirstSearcher on it.

1978

1979

Start at heads, walk until you hit exclude_keys. As a further improvement,

1980

watch for any heads that you encounter while walking, which means they were

1981

not heads of the search.

1982

1983

This is mostly used to generate a succinct recipe for how to walk through

1984

most of parent_map.

1985

1986

:return: (_BreadthFirstSearcher, set(heads_encountered_by_walking))

1987

"""

1988

g = Graph(DictParentsProvider(parent_map))

1989

s = g._make_breadth_first_searcher(heads)

1990

found_heads = set()

1991

while True:

1992

try:

1993

next_revs = s.next()

1994

except StopIteration:

1995

break

1996

for parents in s._current_parents.itervalues():

1997

f_heads = heads.intersection(parents)

1998

if f_heads:

1999

found_heads.update(f_heads)

2000

stop_keys = exclude_keys.intersection(next_revs)

2001

if stop_keys:

2002

s.stop_searching_any(stop_keys)

2003

for parents in s._current_parents.itervalues():

2004

f_heads = heads.intersection(parents)

2005

if f_heads:

2006

found_heads.update(f_heads)

2007

return s, found_heads

2008

2009

2010

def limited_search_result_from_parent_map(parent_map, missing_keys, tip_keys,

2011

depth):

2012

"""Transform a parent_map that is searching 'tip_keys' into an

2013

approximate SearchResult.

2014

2015

We should be able to generate a SearchResult from a given set of starting

2016

keys, that covers a subset of parent_map that has the last step pointing at

2017

tip_keys. This is to handle the case that really-long-searches shouldn't be

2018

started from scratch on each get_parent_map request, but we *do* want to

2019

filter out some of the keys that we've already seen, so we don't get

2020

information that we already know about on every request.

2021

2022

The server will validate the search (that starting at start_keys and

2023

stopping at stop_keys yields the exact key_count), so we have to be careful

2024

to give an exact recipe.

2025

2026

Basic algorithm is:

2027

1) Invert parent_map to get child_map (todo: have it cached and pass it

2028

in)

2029

2) Starting at tip_keys, walk towards children for 'depth' steps.

2030

3) At that point, we have the 'start' keys.

2031

4) Start walking parent_map from 'start' keys, counting how many keys

2032

are seen, and generating stop_keys for anything that would walk

2033

outside of the parent_map.

2034

2035

:param parent_map: A map from {child_id: (parent_ids,)}

2036

:param missing_keys: parent_ids that we know are unavailable

2037

:param tip_keys: the revision_ids that we are searching

2038

:param depth: How far back to walk.

2039

"""

2040

if not parent_map:

2041

# No search to send, because we haven't done any searching yet.

2042

return [], [], 0

2043

heads = _find_possible_heads(parent_map, tip_keys, depth)

2044

s, found_heads = _run_search(parent_map, heads, set(tip_keys))

2045

_, start_keys, exclude_keys, key_count = s.get_result().get_recipe()

2046

if found_heads:

2047

# Anything in found_heads are redundant start_keys, we hit them while

2048

# walking, so we can exclude them from the start list.

2049

start_keys = set(start_keys).difference(found_heads)

2050

return start_keys, exclude_keys, key_count

2051

2052

2053

def search_result_from_parent_map(parent_map, missing_keys):

2054

"""Transform a parent_map into SearchResult information."""

2055

if not parent_map:

2056

# parent_map is empty or None, simple search result

2057

return [], [], 0

2058

# start_set is all the keys in the cache

2059

start_set = set(parent_map)

2060

# result set is all the references to keys in the cache

2061

result_parents = set()

2062

for parents in parent_map.itervalues():

2063

result_parents.update(parents)

2064

stop_keys = result_parents.difference(start_set)

2065

# We don't need to send ghosts back to the server as a position to

2066

# stop either.

2067

stop_keys.difference_update(missing_keys)

2068

key_count = len(parent_map)

2069

if (revision.NULL_REVISION in result_parents

2070

and revision.NULL_REVISION in missing_keys):

2071

# If we pruned NULL_REVISION from the stop_keys because it's also

2072

# in our cache of "missing" keys we need to increment our key count

2073

# by 1, because the reconstituted SearchResult on the server will

2074

# still consider NULL_REVISION to be an included key.

2075

key_count += 1

2076

included_keys = start_set.intersection(result_parents)

2077

start_set.difference_update(included_keys)

2078

return start_set, stop_keys, key_count

2079

2080

2081

1610

def collapse_linear_regions(parent_map):

2082

1611

"""Collapse regions of the graph that are 'linear'.

2083

1612

Older »