~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/repository.py

Committer: Martin Pool
Date: 2009-06-19 09:06:56 UTC
mfrom: (4463 +trunk)
mto: This revision was merged to the branch mainline in revision 4464.
Revision ID: mbp@sourcefrog.net-20090619090656-d5weqeecyscv8kqp

merge news

files added:
bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/test__known_graph.py

doc/developers/bug-handling.txt

doc/index.ru.txt

doc/ru

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/Makefile

doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/quick-reference/quick-start-summary.png

doc/ru/quick-reference/quick-start-summary.svg

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

tools/time_graph.py

files removed:
doc/developers/performance-contributing.txt

files modified:
.bzrignore

Makefile

NEWS

bzrlib/__init__.py

bzrlib/_dirstate_helpers_c.pyx

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bzrdir.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/dirstate.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/filters/__init__.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/eol.txt

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/osutils.py

bzrlib/push.py

bzrlib/remote.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisiontree.py

bzrlib/serializer.py

bzrlib/shellcomplete.py

bzrlib/smart/bzrdir.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_options.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_ui.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/workingtree_implementations/test_content_filters.py

bzrlib/tests/workingtree_implementations/test_eol_conversion.py

bzrlib/transform.py

bzrlib/ui/text.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/developers/cycle.txt

doc/developers/index.txt

doc/developers/performance-roadmap.txt

doc/developers/planned-change-integration.txt

doc/developers/releasing.txt

doc/en/developer-guide/HACKING.txt

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.png

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/introducing_bazaar.txt

doc/index.txt

generate_docs.py

setup.py

tools/win32/build_release.py

Show diffs side-by-side

added added

removed removed

bzrlib/repository.py

1919

yield line, revid

1920

1921

def _find_file_ids_from_xml_inventory_lines(self, line_iterator,

1922

revision_ids):

1922

revision_keys):

1923

"""Helper routine for fileids_altered_by_revision_ids.

1924

1925

This performs the translation of xml lines to revision ids.

1926

1927

:param line_iterator: An iterator of lines, origin_version_id

1928

:param revision_ids: The revision ids to filter for. This should be a

1928

:param revision_keys: The revision keys to filter for. This should be a

1929

set or other type which supports efficient __contains__ lookups, as

1930

the revision id from each parsed line will be looked up in the

1931

revision_ids filter.

1930

the revision key from each parsed line will be looked up in the

1931

revision_keys filter.

1932

:return: a dictionary mapping altered file-ids to an iterable of

1933

revision_ids. Each altered file-id has the exact revision_ids that

1934

altered it listed explicitly.

1935

"""

1936

seen = set(self._find_text_key_references_from_xml_inventory_lines(

1937

line_iterator).iterkeys())

1938

# Note that revision_ids are revision keys.

1939

parent_maps = self.revisions.get_parent_map(revision_ids)

1940

parents = set()

1941

map(parents.update, parent_maps.itervalues())

1942

parents.difference_update(revision_ids)

1938

parent_keys = self._find_parent_keys_of_revisions(revision_keys)

1943

1939

parent_seen = set(self._find_text_key_references_from_xml_inventory_lines(

1944

self._inventory_xml_lines_for_keys(parents)))

1940

self._inventory_xml_lines_for_keys(parent_keys)))

1945

1941

new_keys = seen - parent_seen

1946

1942

result = {}

1947

1943

setdefault = result.setdefault

1949

1945

setdefault(key[0], set()).add(key[-1])

1950

1946

return result

1951

1947

1948

def _find_parent_ids_of_revisions(self, revision_ids):

1949

"""Find all parent ids that are mentioned in the revision graph.

1950

1951

:return: set of revisions that are parents of revision_ids which are

1952

not part of revision_ids themselves

1953

"""

1954

parent_map = self.get_parent_map(revision_ids)

1955

parent_ids = set()

1956

map(parent_ids.update, parent_map.itervalues())

1957

parent_ids.difference_update(revision_ids)

1958

parent_ids.discard(_mod_revision.NULL_REVISION)

1959

return parent_ids

1960

1961

def _find_parent_keys_of_revisions(self, revision_keys):

1962

"""Similar to _find_parent_ids_of_revisions, but used with keys.

1963

1964

:param revision_keys: An iterable of revision_keys.

1965

:return: The parents of all revision_keys that are not already in

1966

revision_keys

1967

"""

1968

parent_map = self.revisions.get_parent_map(revision_keys)

1969

parent_keys = set()

1970

map(parent_keys.update, parent_map.itervalues())

1971

parent_keys.difference_update(revision_keys)

1972

parent_keys.discard(_mod_revision.NULL_REVISION)

1973

return parent_keys

1974

1952

1975

def fileids_altered_by_revision_ids(self, revision_ids, _inv_weave=None):

1953

1976

"""Find the file ids and versions affected by revisions.

1954

1977

2234

2257

"""

2235

2258

return self.get_revision(revision_id).inventory_sha1

2236

2259

2260

def get_rev_id_for_revno(self, revno, known_pair):

2261

"""Return the revision id of a revno, given a later (revno, revid)

2262

pair in the same history.

2263

2264

:return: if found (True, revid). If the available history ran out

2265

before reaching the revno, then this returns

2266

(False, (closest_revno, closest_revid)).

2267

"""

2268

known_revno, known_revid = known_pair

2269

partial_history = [known_revid]

2270

distance_from_known = known_revno - revno

2271

if distance_from_known < 0:

2272

raise ValueError(

2273

'requested revno (%d) is later than given known revno (%d)'

2274

% (revno, known_revno))

2275

try:

2276

_iter_for_revno(

2277

self, partial_history, stop_index=distance_from_known)

2278

except errors.RevisionNotPresent, err:

2279

if err.revision_id == known_revid:

2280

# The start revision (known_revid) wasn't found.

2281

raise

2282

# This is a stacked repository with no fallbacks, or there's a

2283

# left-hand ghost. Either way, even though the revision named in

2284

# the error isn't in this repo, we know it's the next step in this

2285

# left-hand history.

2286

partial_history.append(err.revision_id)

2287

if len(partial_history) <= distance_from_known:

2288

# Didn't find enough history to get a revid for the revno.

2289

earliest_revno = known_revno - len(partial_history) + 1

2290

return (False, (earliest_revno, partial_history[-1]))

2291

if len(partial_history) - 1 > distance_from_known:

2292

raise AssertionError('_iter_for_revno returned too much history')

2293

return (True, partial_history[-1])

2294

2237

2295

def iter_reverse_revision_history(self, revision_id):

2238

2296

"""Iterate backwards through revision ids in the lefthand history

2239

2297

3062

3120

3063

3121

format_registry.register_lazy(

3064

3122

'Bazaar development format - chk repository with bencode revision '

3065

'serialization (needs bzr.dev from 1.15)\n',

3123

'serialization (needs bzr.dev from 1.16)\n',

3066

3124

'bzrlib.repofmt.groupcompress_repo',

3067

3125

'RepositoryFormatCHK2',

3068

3126

)

3127

format_registry.register_lazy(

3128

'Bazaar repository format 2a (needs bzr 1.16 or later)\n',

3129

'bzrlib.repofmt.groupcompress_repo',

3130

'RepositoryFormat2a',

3131

)

3069

3132

3070

3133

3071

3134

class InterRepository(InterObject):

3413

3476

return self.source.revision_ids_to_search_result(result_set)

3414

3477

3415

3478

3416

class InterPackRepo(InterSameDataRepository):

3417

"""Optimised code paths between Pack based repositories."""

3418

3419

@classmethod

3420

def _get_repo_format_to_test(self):

3421

from bzrlib.repofmt import pack_repo

3422

return pack_repo.RepositoryFormatKnitPack6RichRoot()

3423

3424

@staticmethod

3425

def is_compatible(source, target):

3426

"""Be compatible with known Pack formats.

3427

3428

We don't test for the stores being of specific types because that

3429

could lead to confusing results, and there is no need to be

3430

overly general.

3431

3432

InterPackRepo does not support CHK based repositories.

3433

"""

3434

from bzrlib.repofmt.pack_repo import RepositoryFormatPack

3435

from bzrlib.repofmt.groupcompress_repo import RepositoryFormatCHK1

3436

try:

3437

are_packs = (isinstance(source._format, RepositoryFormatPack) and

3438

isinstance(target._format, RepositoryFormatPack))

3439

not_packs = (isinstance(source._format, RepositoryFormatCHK1) or

3440

isinstance(target._format, RepositoryFormatCHK1))

3441

except AttributeError:

3442

return False

3443

if not_packs or not are_packs:

3444

return False

3445

return InterRepository._same_model(source, target)

3446

3447

@needs_write_lock

3448

def fetch(self, revision_id=None, pb=None, find_ghosts=False,

3449

fetch_spec=None):

3450

"""See InterRepository.fetch()."""

3451

if (len(self.source._fallback_repositories) > 0 or

3452

len(self.target._fallback_repositories) > 0):

3453

# The pack layer is not aware of fallback repositories, so when

3454

# fetching from a stacked repository or into a stacked repository

3455

# we use the generic fetch logic which uses the VersionedFiles

3456

# attributes on repository.

3457

from bzrlib.fetch import RepoFetcher

3458

fetcher = RepoFetcher(self.target, self.source, revision_id,

3459

pb, find_ghosts, fetch_spec=fetch_spec)

3460

if fetch_spec is not None:

3461

if len(list(fetch_spec.heads)) != 1:

3462

raise AssertionError(

3463

"InterPackRepo.fetch doesn't support "

3464

"fetching multiple heads yet.")

3465

revision_id = list(fetch_spec.heads)[0]

3466

fetch_spec = None

3467

if revision_id is None:

3468

# TODO:

3469

# everything to do - use pack logic

3470

# to fetch from all packs to one without

3471

# inventory parsing etc, IFF nothing to be copied is in the target.

3472

# till then:

3473

source_revision_ids = frozenset(self.source.all_revision_ids())

3474

revision_ids = source_revision_ids - \

3475

frozenset(self.target.get_parent_map(source_revision_ids))

3476

revision_keys = [(revid,) for revid in revision_ids]

3477

index = self.target._pack_collection.revision_index.combined_index

3478

present_revision_ids = set(item[1][0] for item in

3479

index.iter_entries(revision_keys))

3480

revision_ids = set(revision_ids) - present_revision_ids

3481

# implementing the TODO will involve:

3482

# - detecting when all of a pack is selected

3483

# - avoiding as much as possible pre-selection, so the

3484

# more-core routines such as create_pack_from_packs can filter in

3485

# a just-in-time fashion. (though having a HEADS list on a

3486

# repository might make this a lot easier, because we could

3487

# sensibly detect 'new revisions' without doing a full index scan.

3488

elif _mod_revision.is_null(revision_id):

3489

# nothing to do:

3490

return (0, [])

3491

else:

3492

revision_ids = self.search_missing_revision_ids(revision_id,

3493

find_ghosts=find_ghosts).get_keys()

3494

if len(revision_ids) == 0:

3495

return (0, [])

3496

return self._pack(self.source, self.target, revision_ids)

3497

3498

def _pack(self, source, target, revision_ids):

3499

from bzrlib.repofmt.pack_repo import Packer

3500

packs = source._pack_collection.all_packs()

3501

pack = Packer(self.target._pack_collection, packs, '.fetch',

3502

revision_ids).pack()

3503

if pack is not None:

3504

self.target._pack_collection._save_pack_names()

3505

copied_revs = pack.get_revision_count()

3506

# Trigger an autopack. This may duplicate effort as we've just done

3507

# a pack creation, but for now it is simpler to think about as

3508

# 'upload data, then repack if needed'.

3509

self.target._pack_collection.autopack()

3510

return (copied_revs, [])

3511

else:

3512

return (0, [])

3513

3514

@needs_read_lock

3515

def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):

3516

"""See InterRepository.missing_revision_ids().

3517

3518

:param find_ghosts: Find ghosts throughout the ancestry of

3519

revision_id.

3520

"""

3521

if not find_ghosts and revision_id is not None:

3522

return self._walk_to_common_revisions([revision_id])

3523

elif revision_id is not None:

3524

# Find ghosts: search for revisions pointing from one repository to

3525

# the other, and vice versa, anywhere in the history of revision_id.

3526

graph = self.target.get_graph(other_repository=self.source)

3527

searcher = graph._make_breadth_first_searcher([revision_id])

3528

found_ids = set()

3529

while True:

3530

try:

3531

next_revs, ghosts = searcher.next_with_ghosts()

3532

except StopIteration:

3533

break

3534

if revision_id in ghosts:

3535

raise errors.NoSuchRevision(self.source, revision_id)

3536

found_ids.update(next_revs)

3537

found_ids.update(ghosts)

3538

found_ids = frozenset(found_ids)

3539

# Double query here: should be able to avoid this by changing the

3540

# graph api further.

3541

result_set = found_ids - frozenset(

3542

self.target.get_parent_map(found_ids))

3543

else:

3544

source_ids = self.source.all_revision_ids()

3545

# source_ids is the worst possible case we may need to pull.

3546

# now we want to filter source_ids against what we actually

3547

# have in target, but don't try to check for existence where we know

3548

# we do not have a revision as that would be pointless.

3549

target_ids = set(self.target.all_revision_ids())

3550

result_set = set(source_ids).difference(target_ids)

3551

return self.source.revision_ids_to_search_result(result_set)

3552

3553

3554

3479

class InterDifferingSerializer(InterRepository):

3555

3480

3556

3481

@classmethod

3831

3756

InterRepository.register_optimiser(InterSameDataRepository)

3832

3757

InterRepository.register_optimiser(InterWeaveRepo)

3833

3758

InterRepository.register_optimiser(InterKnitRepo)

3834

InterRepository.register_optimiser(InterPackRepo)

3835

3759

3836

3760

3837

3761

class CopyConverter(object):

4412

4336

yield versionedfile.FulltextContentFactory(

4413

4337

key, parent_keys, None, as_bytes)

4414

4338

4339

4340

def _iter_for_revno(repo, partial_history_cache, stop_index=None,

4341

stop_revision=None):

4342

"""Extend the partial history to include a given index

4343

4344

If a stop_index is supplied, stop when that index has been reached.

4345

If a stop_revision is supplied, stop when that revision is

4346

encountered. Otherwise, stop when the beginning of history is

4347

reached.

4348

4349

:param stop_index: The index which should be present. When it is

4350

present, history extension will stop.

4351

:param stop_revision: The revision id which should be present. When

4352

it is encountered, history extension will stop.

4353

"""

4354

start_revision = partial_history_cache[-1]

4355

iterator = repo.iter_reverse_revision_history(start_revision)

4356

try:

4357

#skip the last revision in the list

4358

iterator.next()

4359

while True:

4360

if (stop_index is not None and

4361

len(partial_history_cache) > stop_index):

4362

break

4363

if partial_history_cache[-1] == stop_revision:

4364

break

4365

revision_id = iterator.next()

4366

partial_history_cache.append(revision_id)

4367

except StopIteration:

4368

# No more history

4369

return

4370

Older »