~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/repository.py

Committer: Robert Collins
Date: 2009-05-11 01:59:06 UTC
mto: This revision was merged to the branch mainline in revision 4593.
Revision ID: robertc@robertcollins.net-20090511015906-6zi6a9b8tuuhipc8

Less lock thrashing in check.py.

files added:
bzrlib/tests/test_http_implementations.py

bzrlib/util/tests/test_bencode.py

doc/developers/performance-contributing.txt

files removed:
bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/benchmarks/bench_tags.py

bzrlib/bencode.py

bzrlib/crash.py

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/send.py

bzrlib/tests/features.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_lock.py

bzrlib/util/bencode.py

doc/BUILD-NOTES

doc/Makefile

doc/_static

doc/_static/bzr icon 16.png

doc/_static/bzr.ico

doc/_static/en

doc/_static/en/quick-reference

doc/_templates

doc/_templates/index.html

doc/_templates/layout.html

doc/conf.py

doc/contents.txt

doc/developers/apport.txt

doc/developers/bug-handling.txt

doc/developers/content-filtering.txt

doc/en/quick-reference/index.txt

doc/en/tutorials/index.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide/index-for-2x.txt

doc/es/quick-reference/quick-start-summary.pdf

doc/es/quick-reference/quick-start-summary.png

doc/index.ru.txt

doc/make.bat

doc/ru

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/Makefile

doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/quick-reference/quick-start-summary.png

doc/ru/quick-reference/quick-start-summary.svg

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

tools/time_graph.py

tools/win32/bootstrap.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

files renamed:
bzrlib/_btree_serializer_pyx.pyx => bzrlib/_btree_serializer_c.pyx

bzrlib/_dirstate_helpers_pyx.h => bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_pyx.pyx => bzrlib/_dirstate_helpers_c.pyx

bzrlib/_knit_load_data_pyx.pyx => bzrlib/_knit_load_data_c.pyx

bzrlib/tests/per_branch/ => bzrlib/tests/branch_implementations/

bzrlib/tests/per_bzrdir/ => bzrlib/tests/bzrdir_implementations/

bzrlib/tests/per_interrepository/ => bzrlib/tests/interrepository_implementations/

bzrlib/tests/per_intertree/ => bzrlib/tests/intertree_implementations/

bzrlib/tests/per_inventory/ => bzrlib/tests/inventory_implementations/

bzrlib/tests/per_pack_repository.py => bzrlib/tests/test_pack_repository.py

bzrlib/tests/per_transport.py => bzrlib/tests/test_transport_implementations.py

bzrlib/tests/per_versionedfile.py => bzrlib/tests/test_versionedfile.py

bzrlib/tests/per_tree/ => bzrlib/tests/tree_implementations/

bzrlib/tests/per_workingtree/ => bzrlib/tests/workingtree_implementations/

bzrlib/tests/per_tree/test_get_file_with_stat.py => bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py

bzrlib/util/_bencode_py.py => bzrlib/util/bencode.py

doc/en/developer-guide/HACKING.txt => doc/developers/HACKING.txt

doc/_static/en/quick-reference/Makefile => doc/en/quick-reference/Makefile

doc/_static/en/quick-reference/bzr-quick-reference.pdf => doc/en/quick-reference/quick-start-summary.pdf

doc/_static/en/quick-reference/bzr-quick-reference.png => doc/en/quick-reference/quick-start-summary.png

doc/_static/en/quick-reference/bzr-quick-reference.svg => doc/en/quick-reference/quick-start-summary.svg

doc/es/developer-guide/ => doc/es/guia-desarrollador/

doc/es/user-guide/ => doc/es/guia-usuario/

doc/es/release-notes/ => doc/es/notas-version/

doc/es/quick-reference/ => doc/es/referencia-rapida/

doc/es/quick-reference/quick-start-summary.svg => doc/es/referencia-rapida/referencia-rapida.svg

doc/es/user-reference/ => doc/es/referencia/

tools/generate_docs.py => generate_docs.py

bzrlib/doc_generate/ => tools/doc_generate/

files modified:
.bzrignore

Makefile

NEWS

bzrlib/__init__.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_readdir_pyx.pyx

bzrlib/annotate.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_knit.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/counted_lock.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/errors.py

bzrlib/export/dir_exporter.py

bzrlib/fetch.py

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/eol.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/merge.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/remote.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/switch.py

bzrlib/tag.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_create_clone.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_iter_merge_sorted_revisions.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_dotted_revno.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/bzrdir_implementations/test_push.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_http.py

bzrlib/tests/test_index.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_check.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_content_filters.py

bzrlib/tests/workingtree_implementations/test_eol_conversion.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_views.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/urlutils.py

bzrlib/version.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/developers/check.txt

doc/developers/cycle.txt

doc/developers/index.txt

doc/developers/inventory.txt

doc/developers/performance-roadmap.txt

doc/developers/planned-change-integration.txt

doc/developers/plugin-api.txt

doc/developers/releasing.txt

doc/developers/testing.txt

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/index.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/writing_a_plugin.txt

doc/es/mini-tutorial/index.txt

doc/es/referencia-rapida/Makefile

doc/index.es.txt

doc/index.txt

setup.py

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/win32/build_release.py

tools/win32/bzr.iss.cog

tools/win32/ostools.py

Show diffs side-by-side

added added

removed removed

bzrlib/repository.py

gpg,

graph,

inventory,

inventory_delta,

lazy_regex,

lockable_files,

lockdir,

entry_factory,

)

from bzrlib import registry

from bzrlib.symbol_versioning import (

deprecated_method,

)

from bzrlib.trace import (

log_exception_quietly, note, mutter, mutter_callsite, warning)

465

467

if content_summary[2] is None:

466

468

raise ValueError("Files must not have executable = None")

467

469

if not store:

468

# We can't trust a check of the file length because of content

469

# filtering...

470

if (# if the exec bit has changed we have to store:

470

if (# if the file length changed we have to store:

471

parent_entry.text_size != content_summary[1] or

472

# if the exec bit has changed we have to store:

471

473

parent_entry.executable != content_summary[2]):

472

474

store = True

473

475

elif parent_entry.text_sha1 == content_summary[3]:

492

494

ie.executable = content_summary[2]

493

495

file_obj, stat_value = tree.get_file_with_stat(ie.file_id, path)

494

496

try:

495

text = file_obj.read()

497

lines = file_obj.readlines()

496

498

finally:

497

499

file_obj.close()

498

500

try:

499

501

ie.text_sha1, ie.text_size = self._add_text_to_weave(

500

ie.file_id, text, heads, nostore_sha)

502

ie.file_id, lines, heads, nostore_sha)

501

503

# Let the caller know we generated a stat fingerprint.

502

504

fingerprint = (ie.text_sha1, stat_value)

503

505

except errors.ExistingContent:

515

517

# carry over:

516

518

ie.revision = parent_entry.revision

517

519

return self._get_delta(ie, basis_inv, path), False, None

518

self._add_text_to_weave(ie.file_id, '', heads, None)

520

lines = []

521

self._add_text_to_weave(ie.file_id, lines, heads, None)

519

522

elif kind == 'symlink':

520

523

current_link_target = content_summary[3]

521

524

if not store:

529

532

ie.symlink_target = parent_entry.symlink_target

530

533

return self._get_delta(ie, basis_inv, path), False, None

531

534

ie.symlink_target = current_link_target

532

self._add_text_to_weave(ie.file_id, '', heads, None)

535

lines = []

536

self._add_text_to_weave(ie.file_id, lines, heads, None)

533

537

elif kind == 'tree-reference':

534

538

if not store:

535

539

if content_summary[3] != parent_entry.reference_revision:

540

544

ie.revision = parent_entry.revision

541

545

return self._get_delta(ie, basis_inv, path), False, None

542

546

ie.reference_revision = content_summary[3]

543

if ie.reference_revision is None:

544

raise AssertionError("invalid content_summary for nested tree: %r"

545

% (content_summary,))

546

self._add_text_to_weave(ie.file_id, '', heads, None)

547

lines = []

548

self._add_text_to_weave(ie.file_id, lines, heads, None)

547

549

else:

548

550

raise NotImplementedError('unknown kind')

549

551

ie.revision = self._new_revision_id

743

745

entry.executable = True

744

746

else:

745

747

entry.executable = False

746

if (carry_over_possible and

748

if (carry_over_possible and

747

749

parent_entry.executable == entry.executable):

748

750

# Check the file length, content hash after reading

749

751

# the file.

752

754

nostore_sha = None

753

755

file_obj, stat_value = tree.get_file_with_stat(file_id, change[1][1])

754

756

try:

755

text = file_obj.read()

757

lines = file_obj.readlines()

756

758

finally:

757

759

file_obj.close()

758

760

try:

759

761

entry.text_sha1, entry.text_size = self._add_text_to_weave(

760

file_id, text, heads, nostore_sha)

762

file_id, lines, heads, nostore_sha)

761

763

yield file_id, change[1][1], (entry.text_sha1, stat_value)

762

764

except errors.ExistingContent:

763

765

# No content change against a carry_over parent

772

774

parent_entry.symlink_target == entry.symlink_target):

773

775

carried_over = True

774

776

else:

775

self._add_text_to_weave(change[0], '', heads, None)

777

self._add_text_to_weave(change[0], [], heads, None)

776

778

elif kind == 'directory':

777

779

if carry_over_possible:

778

780

carried_over = True

780

782

# Nothing to set on the entry.

781

783

# XXX: split into the Root and nonRoot versions.

782

784

if change[1][1] != '' or self.repository.supports_rich_root():

783

self._add_text_to_weave(change[0], '', heads, None)

785

self._add_text_to_weave(change[0], [], heads, None)

784

786

elif kind == 'tree-reference':

785

787

if not self.repository._format.supports_tree_reference:

786

788

# This isn't quite sane as an error, but we shouldn't

789

791

# references.

790

792

raise errors.UnsupportedOperation(tree.add_reference,

791

793

self.repository)

792

reference_revision = tree.get_reference_revision(change[0])

793

entry.reference_revision = reference_revision

794

entry.reference_revision = \

795

tree.get_reference_revision(change[0])

794

796

if (carry_over_possible and

795

797

parent_entry.reference_revision == reference_revision):

796

798

carried_over = True

797

799

else:

798

self._add_text_to_weave(change[0], '', heads, None)

800

self._add_text_to_weave(change[0], [], heads, None)

799

801

else:

800

802

raise AssertionError('unknown kind %r' % kind)

801

803

if not carried_over:

810

812

seen_root = True

811

813

self.new_inventory = None

812

814

if len(inv_delta):

813

# This should perhaps be guarded by a check that the basis we

814

# commit against is the basis for the commit and if not do a delta

815

# against the basis.

816

815

self._any_changes = True

817

816

if not seen_root:

818

817

# housekeeping root entry changes do not affect no-change commits.

819

818

self._require_root_change(tree)

820

819

self.basis_delta_revision = basis_revision_id

821

820

822

def _add_text_to_weave(self, file_id, new_text, parents, nostore_sha):

823

parent_keys = tuple([(file_id, parent) for parent in parents])

824

return self.repository.texts._add_text(

825

(file_id, self._new_revision_id), parent_keys, new_text,

826

nostore_sha=nostore_sha, random_id=self.random_revid)[0:2]

821

def _add_text_to_weave(self, file_id, new_lines, parents, nostore_sha):

822

# Note: as we read the content directly from the tree, we know it's not

823

# been turned into unicode or badly split - but a broken tree

824

# implementation could give us bad output from readlines() so this is

825

# not a guarantee of safety. What would be better is always checking

826

# the content during test suite execution. RBC 20070912

827

parent_keys = tuple((file_id, parent) for parent in parents)

828

return self.repository.texts.add_lines(

829

(file_id, self._new_revision_id), parent_keys, new_lines,

830

nostore_sha=nostore_sha, random_id=self.random_revid,

831

check_content=False)[0:2]

827

832

828

833

829

834

class RootCommitBuilder(CommitBuilder):

855

860

######################################################################

856

861

# Repositories

857

862

858

859

863

class Repository(object):

860

864

"""Repository holding history for one or more branches.

861

865

931

935

"""

932

936

if self._write_group is not self.get_transaction():

933

937

# has an unlock or relock occurred ?

934

if suppress_errors:

935

mutter(

936

'(suppressed) mismatched lock context and write group. %r, %r',

937

self._write_group, self.get_transaction())

938

return

939

938

raise errors.BzrError(

940

939

'mismatched lock context and write group. %r, %r' %

941

940

(self._write_group, self.get_transaction()))

970

969

"""

971

970

if not self._format.supports_external_lookups:

972

971

raise errors.UnstackableRepositoryFormat(self._format, self.base)

973

if self.is_locked():

974

# This repository will call fallback.unlock() when we transition to

975

# the unlocked state, so we make sure to increment the lock count

976

repository.lock_read()

977

972

self._check_fallback_repository(repository)

978

973

self._fallback_repositories.append(repository)

979

974

self.texts.add_fallback_versioned_files(repository.texts)

1028

1023

parents, basis_inv=None, propagate_caches=False):

1029

1024

"""Add a new inventory expressed as a delta against another revision.

1030

1025

1031

See the inventory developers documentation for the theory behind

1032

inventory deltas.

1033

1034

1026

:param basis_revision_id: The inventory id the delta was created

1035

1027

against. (This does not have to be a direct parent.)

1036

1028

:param delta: The inventory delta (see Inventory.apply_delta for

1075

1067

check_content=True):

1076

1068

"""Store lines in inv_vf and return the sha1 of the inventory."""

1077

1069

parents = [(parent,) for parent in parents]

1078

result = self.inventories.add_lines((revision_id,), parents, lines,

1070

return self.inventories.add_lines((revision_id,), parents, lines,

1079

1071

check_content=check_content)[0]

1080

self.inventories._access.flush()

1081

return result

1082

1072

1083

1073

def add_revision(self, revision_id, rev, inv=None, config=None):

1084

1074

"""Add rev to the revision store as revision_id.

1160

1150

# The old API returned a list, should this actually be a set?

1161

1151

return parent_map.keys()

1162

1152

1163

def _check_inventories(self, checker):

1164

"""Check the inventories found from the revision scan.

1165

1166

This is responsible for verifying the sha1 of inventories and

1167

creating a pending_keys set that covers data referenced by inventories.

1168

"""

1169

bar = ui.ui_factory.nested_progress_bar()

1170

try:

1171

self._do_check_inventories(checker, bar)

1172

finally:

1173

bar.finished()

1174

1175

def _do_check_inventories(self, checker, bar):

1176

"""Helper for _check_inventories."""

1177

revno = 0

1178

keys = {'chk_bytes':set(), 'inventories':set(), 'texts':set()}

1179

kinds = ['chk_bytes', 'texts']

1180

count = len(checker.pending_keys)

1181

bar.update("inventories", 0, 2)

1182

current_keys = checker.pending_keys

1183

checker.pending_keys = {}

1184

# Accumulate current checks.

1185

for key in current_keys:

1186

if key[0] != 'inventories' and key[0] not in kinds:

1187

checker._report_items.append('unknown key type %r' % (key,))

1188

keys[key[0]].add(key[1:])

1189

if keys['inventories']:

1190

# NB: output order *should* be roughly sorted - topo or

1191

# inverse topo depending on repository - either way decent

1192

# to just delta against. However, pre-CHK formats didn't

1193

# try to optimise inventory layout on disk. As such the

1194

# pre-CHK code path does not use inventory deltas.

1195

last_object = None

1196

for record in self.inventories.check(keys=keys['inventories']):

1197

if record.storage_kind == 'absent':

1198

checker._report_items.append(

1199

'Missing inventory {%s}' % (record.key,))

1200

else:

1201

last_object = self._check_record('inventories', record,

1202

checker, last_object,

1203

current_keys[('inventories',) + record.key])

1204

del keys['inventories']

1205

else:

1206

return

1207

bar.update("texts", 1)

1208

while (checker.pending_keys or keys['chk_bytes']

1209

or keys['texts']):

1210

# Something to check.

1211

current_keys = checker.pending_keys

1212

checker.pending_keys = {}

1213

# Accumulate current checks.

1214

for key in current_keys:

1215

if key[0] not in kinds:

1216

checker._report_items.append('unknown key type %r' % (key,))

1217

keys[key[0]].add(key[1:])

1218

# Check the outermost kind only - inventories || chk_bytes || texts

1219

for kind in kinds:

1220

if keys[kind]:

1221

last_object = None

1222

for record in getattr(self, kind).check(keys=keys[kind]):

1223

if record.storage_kind == 'absent':

1224

checker._report_items.append(

1225

'Missing %s {%s}' % (kind, record.key,))

1226

else:

1227

last_object = self._check_record(kind, record,

1228

checker, last_object, current_keys[(kind,) + record.key])

1229

keys[kind] = set()

1230

break

1231

1232

def _check_record(self, kind, record, checker, last_object, item_data):

1233

"""Check a single record of the given kind from this repository."""

1234

if kind == 'inventories':

1235

rev_id = record.key[0]

1236

inv = self.deserialise_inventory(rev_id,

1237

record.get_bytes_as('fulltext'))

1238

if last_object is not None:

1239

delta = inv._make_delta(last_object)

1240

for old_path, path, file_id, ie in delta:

1241

if ie is None:

1242

continue

1243

ie.check(checker, rev_id, inv)

1244

else:

1245

for path, ie in inv.iter_entries():

1246

ie.check(checker, rev_id, inv)

1247

if self._format.fast_deltas:

1248

return inv

1249

elif kind == 'chk_bytes':

1250

# No code written to check chk_bytes for this repo format.

1251

checker._report_items.append(

1252

'unsupported key type chk_bytes for %s' % (record.key,))

1253

elif kind == 'texts':

1254

self._check_text(record, checker, item_data)

1255

else:

1256

checker._report_items.append(

1257

'unknown key type %s for %s' % (kind, record.key))

1258

1259

def _check_text(self, record, checker, item_data):

1260

"""Check a single text."""

1261

# Check it is extractable.

1262

# TODO: check length.

1263

if record.storage_kind == 'chunked':

1264

chunks = record.get_bytes_as(record.storage_kind)

1265

sha1 = osutils.sha_strings(chunks)

1266

length = sum(map(len, chunks))

1267

else:

1268

content = record.get_bytes_as('fulltext')

1269

sha1 = osutils.sha_string(content)

1270

length = len(content)

1271

if item_data and sha1 != item_data[1]:

1272

checker._report_items.append(

1273

'sha1 mismatch: %s has sha1 %s expected %s referenced by %s' %

1274

(record.key, sha1, item_data[1], item_data[2]))

1275

1276

1153

@staticmethod

1277

1154

def create(a_bzrdir):

1278

1155

"""Construct the current default format repository in a_bzrdir."""

1311

1188

self._inventory_entry_cache = fifo_cache.FIFOCache(10*1024)

1312

1189

1313

1190

def __repr__(self):

1314

if self._fallback_repositories:

1315

return '%s(%r, fallback_repositories=%r)' % (

1316

self.__class__.__name__,

1317

self.base,

1318

self._fallback_repositories)

1319

else:

1320

return '%s(%r)' % (self.__class__.__name__,

1321

self.base)

1322

1323

def _has_same_fallbacks(self, other_repo):

1324

"""Returns true if the repositories have the same fallbacks."""

1325

my_fb = self._fallback_repositories

1326

other_fb = other_repo._fallback_repositories

1327

if len(my_fb) != len(other_fb):

1328

return False

1329

for f, g in zip(my_fb, other_fb):

1330

if not f.has_same_location(g):

1331

return False

1332

return True

1191

return '%s(%r)' % (self.__class__.__name__,

1192

self.base)

1333

1193

1334

1194

def has_same_location(self, other):

1335

1195

"""Returns a boolean indicating if this repository is at the same

1380

1240

"""

1381

1241

locked = self.is_locked()

1382

1242

result = self.control_files.lock_write(token=token)

1243

for repo in self._fallback_repositories:

1244

# Writes don't affect fallback repos

1245

repo.lock_read()

1383

1246

if not locked:

1384

for repo in self._fallback_repositories:

1385

# Writes don't affect fallback repos

1386

repo.lock_read()

1387

1247

self._refresh_data()

1388

1248

return result

1389

1249

1390

1250

def lock_read(self):

1391

1251

locked = self.is_locked()

1392

1252

self.control_files.lock_read()

1253

for repo in self._fallback_repositories:

1254

repo.lock_read()

1393

1255

if not locked:

1394

for repo in self._fallback_repositories:

1395

repo.lock_read()

1396

1256

self._refresh_data()

1397

1257

1398

1258

def get_physical_lock_status(self):

1543

1403

"""Commit the contents accrued within the current write group.

1544

1404

1545

1405

:seealso: start_write_group.

1546

1547

:return: it may return an opaque hint that can be passed to 'pack'.

1548

1406

"""

1549

1407

if self._write_group is not self.get_transaction():

1550

1408

# has an unlock or relock occurred?

1551

1409

raise errors.BzrError('mismatched lock context %r and '

1552

1410

'write group %r.' %

1553

1411

(self.get_transaction(), self._write_group))

1554

result = self._commit_write_group()

1412

self._commit_write_group()

1555

1413

self._write_group = None

1556

return result

1557

1414

1558

1415

def _commit_write_group(self):

1559

1416

"""Template method for per-repository write group cleanup.

1567

1424

def suspend_write_group(self):

1568

1425

raise errors.UnsuspendableWriteGroup(self)

1569

1426

1570

def get_missing_parent_inventories(self, check_for_missing_texts=True):

1427

def get_missing_parent_inventories(self):

1571

1428

"""Return the keys of missing inventory parents for revisions added in

1572

1429

this write group.

1573

1430

1582

1439

return set()

1583

1440

if not self.is_in_write_group():

1584

1441

raise AssertionError('not in a write group')

1585

1442

1586

1443

# XXX: We assume that every added revision already has its

1587

1444

# corresponding inventory, so we only check for parent inventories that

1588

1445

# might be missing, rather than all inventories.

1592

1449

present_inventories = unstacked_inventories.get_parent_map(

1593

1450

key[-1:] for key in parents)

1594

1451

parents.difference_update(present_inventories)

1595

if len(parents) == 0:

1596

# No missing parent inventories.

1597

return set()

1598

if not check_for_missing_texts:

1599

return set(('inventories', rev_id) for (rev_id,) in parents)

1600

# Ok, now we have a list of missing inventories. But these only matter

1601

# if the inventories that reference them are missing some texts they

1602

# appear to introduce.

1603

# XXX: Texts referenced by all added inventories need to be present,

1604

# but at the moment we're only checking for texts referenced by

1605

# inventories at the graph's edge.

1606

key_deps = self.revisions._index._key_dependencies

1607

key_deps.add_keys(present_inventories)

1608

referrers = frozenset(r[0] for r in key_deps.get_referrers())

1609

file_ids = self.fileids_altered_by_revision_ids(referrers)

1610

missing_texts = set()

1611

for file_id, version_ids in file_ids.iteritems():

1612

missing_texts.update(

1613

(file_id, version_id) for version_id in version_ids)

1614

present_texts = self.texts.get_parent_map(missing_texts)

1615

missing_texts.difference_update(present_texts)

1616

if not missing_texts:

1617

# No texts are missing, so all revisions and their deltas are

1618

# reconstructable.

1619

return set()

1620

# Alternatively the text versions could be returned as the missing

1621

# keys, but this is likely to be less data.

1622

1452

missing_keys = set(('inventories', rev_id) for (rev_id,) in parents)

1623

1453

return missing_keys

1624

1454

1676

1506

raise errors.InternalBzrError(

1677

1507

"May not fetch while in a write group.")

1678

1508

# fast path same-url fetch operations

1679

# TODO: lift out to somewhere common with RemoteRepository

1680

# <https://bugs.edge.launchpad.net/bzr/+bug/401646>

1681

if (self.has_same_location(source)

1682

and fetch_spec is None

1683

and self._has_same_fallbacks(source)):

1509

if self.has_same_location(source) and fetch_spec is None:

1684

1510

# check that last_revision is in 'from' and then return a

1685

1511

# no-operation.

1686

1512

if (revision_id is not None and

1711

1537

:param revprops: Optional dictionary of revision properties.

1712

1538

:param revision_id: Optional revision id.

1713

1539

"""

1714

if self._fallback_repositories:

1715

raise errors.BzrError("Cannot commit from a lightweight checkout "

1716

"to a stacked branch. See "

1717

"https://bugs.launchpad.net/bzr/+bug/375013 for details.")

1718

1540

result = self._commit_builder_class(self, parents, config,

1719

1541

timestamp, timezone, committer, revprops, revision_id)

1720

1542

self.start_write_group()

1731

1553

self.control_files.unlock()

1732

1554

if self.control_files._lock_count == 0:

1733

1555

self._inventory_entry_cache.clear()

1734

for repo in self._fallback_repositories:

1735

repo.unlock()

1556

for repo in self._fallback_repositories:

1557

repo.unlock()

1736

1558

1737

1559

@needs_read_lock

1738

1560

def clone(self, a_bzrdir, revision_id=None):

1847

1669

1848

1670

@needs_read_lock

1849

1671

def get_revisions(self, revision_ids):

1850

"""Get many revisions at once.

1851

1852

Repositories that need to check data on every revision read should

1853

subclass this method.

1854

"""

1672

"""Get many revisions at once."""

1855

1673

return self._get_revisions(revision_ids)

1856

1674

1857

1675

@needs_read_lock

1858

1676

def _get_revisions(self, revision_ids):

1859

1677

"""Core work logic to get many revisions without sanity checks."""

1678

for rev_id in revision_ids:

1679

if not rev_id or not isinstance(rev_id, basestring):

1680

raise errors.InvalidRevisionId(revision_id=rev_id, branch=self)

1681

keys = [(key,) for key in revision_ids]

1682

stream = self.revisions.get_record_stream(keys, 'unordered', True)

1860

1683

revs = {}

1861

for revid, rev in self._iter_revisions(revision_ids):

1862

if rev is None:

1863

raise errors.NoSuchRevision(self, revid)

1864

revs[revid] = rev

1684

for record in stream:

1685

if record.storage_kind == 'absent':

1686

raise errors.NoSuchRevision(self, record.key[0])

1687

text = record.get_bytes_as('fulltext')

1688

rev = self._serializer.read_revision_from_string(text)

1689

revs[record.key[0]] = rev

1865

1690

return [revs[revid] for revid in revision_ids]

1866

1691

1867

def _iter_revisions(self, revision_ids):

1868

"""Iterate over revision objects.

1869

1870

:param revision_ids: An iterable of revisions to examine. None may be

1871

passed to request all revisions known to the repository. Note that

1872

not all repositories can find unreferenced revisions; for those

1873

repositories only referenced ones will be returned.

1874

:return: An iterator of (revid, revision) tuples. Absent revisions (

1875

those asked for but not available) are returned as (revid, None).

1876

"""

1877

if revision_ids is None:

1878

revision_ids = self.all_revision_ids()

1879

else:

1880

for rev_id in revision_ids:

1881

if not rev_id or not isinstance(rev_id, basestring):

1882

raise errors.InvalidRevisionId(revision_id=rev_id, branch=self)

1883

keys = [(key,) for key in revision_ids]

1884

stream = self.revisions.get_record_stream(keys, 'unordered', True)

1885

for record in stream:

1886

revid = record.key[0]

1887

if record.storage_kind == 'absent':

1888

yield (revid, None)

1889

else:

1890

text = record.get_bytes_as('fulltext')

1891

rev = self._serializer.read_revision_from_string(text)

1892

yield (revid, rev)

1893

1894

1692

@needs_read_lock

1895

1693

def get_revision_xml(self, revision_id):

1896

1694

# TODO: jam 20070210 This shouldn't be necessary since get_revision

2090

1888

yield line, revid

2091

1889

2092

1890

def _find_file_ids_from_xml_inventory_lines(self, line_iterator,

2093

revision_keys):

1891

revision_ids):

2094

1892

"""Helper routine for fileids_altered_by_revision_ids.

2095

1893

2096

1894

This performs the translation of xml lines to revision ids.

2097

1895

2098

1896

:param line_iterator: An iterator of lines, origin_version_id

2099

:param revision_keys: The revision ids to filter for. This should be a

1897

:param revision_ids: The revision ids to filter for. This should be a

2100

1898

set or other type which supports efficient __contains__ lookups, as

2101

the revision key from each parsed line will be looked up in the

2102

revision_keys filter.

1899

the revision id from each parsed line will be looked up in the

1900

revision_ids filter.

2103

1901

:return: a dictionary mapping altered file-ids to an iterable of

2104

1902

revision_ids. Each altered file-ids has the exact revision_ids that

2105

1903

altered it listed explicitly.

2106

1904

"""

2107

1905

seen = set(self._find_text_key_references_from_xml_inventory_lines(

2108

1906

line_iterator).iterkeys())

2109

parent_keys = self._find_parent_keys_of_revisions(revision_keys)

1907

# Note that revision_ids are revision keys.

1908

parent_maps = self.revisions.get_parent_map(revision_ids)

1909

parents = set()

1910

map(parents.update, parent_maps.itervalues())

1911

parents.difference_update(revision_ids)

2110

1912

parent_seen = set(self._find_text_key_references_from_xml_inventory_lines(

2111

self._inventory_xml_lines_for_keys(parent_keys)))

1913

self._inventory_xml_lines_for_keys(parents)))

2112

1914

new_keys = seen - parent_seen

2113

1915

result = {}

2114

1916

setdefault = result.setdefault

2116

1918

setdefault(key[0], set()).add(key[-1])

2117

1919

return result

2118

1920

2119

def _find_parent_ids_of_revisions(self, revision_ids):

2120

"""Find all parent ids that are mentioned in the revision graph.

2121

2122

:return: set of revisions that are parents of revision_ids which are

2123

not part of revision_ids themselves

2124

"""

2125

parent_map = self.get_parent_map(revision_ids)

2126

parent_ids = set()

2127

map(parent_ids.update, parent_map.itervalues())

2128

parent_ids.difference_update(revision_ids)

2129

parent_ids.discard(_mod_revision.NULL_REVISION)

2130

return parent_ids

2131

2132

def _find_parent_keys_of_revisions(self, revision_keys):

2133

"""Similar to _find_parent_ids_of_revisions, but used with keys.

2134

2135

:param revision_keys: An iterable of revision_keys.

2136

:return: The parents of all revision_keys that are not already in

2137

revision_keys

2138

"""

2139

parent_map = self.revisions.get_parent_map(revision_keys)

2140

parent_keys = set()

2141

map(parent_keys.update, parent_map.itervalues())

2142

parent_keys.difference_update(revision_keys)

2143

parent_keys.discard(_mod_revision.NULL_REVISION)

2144

return parent_keys

2145

2146

1921

def fileids_altered_by_revision_ids(self, revision_ids, _inv_weave=None):

2147

1922

"""Find the file ids and versions affected by revisions.

2148

1923

2250

2025

batch_size]

2251

2026

if not to_query:

2252

2027

break

2253

for revision_id in to_query:

2028

for rev_tree in self.revision_trees(to_query):

2029

revision_id = rev_tree.get_revision_id()

2254

2030

parent_ids = ancestors[revision_id]

2255

2031

for text_key in revision_keys[revision_id]:

2256

2032

pb.update("Calculating text parents", processed_texts)

2329

2105

num_file_ids = len(file_ids)

2330

2106

for file_id, altered_versions in file_ids.iteritems():

2331

2107

if pb is not None:

2332

pb.update("Fetch texts", count, num_file_ids)

2108

pb.update("fetch texts", count, num_file_ids)

2333

2109

count += 1

2334

2110

yield ("file", file_id, altered_versions)

2335

2111

2356

2132

"""Get Inventory object by revision id."""

2357

2133

return self.iter_inventories([revision_id]).next()

2358

2134

2359

def iter_inventories(self, revision_ids, ordering=None):

2135

def iter_inventories(self, revision_ids):

2360

2136

"""Get many inventories by revision_ids.

2361

2137

2362

2138

This will buffer some or all of the texts used in constructing the

2364

2140

time.

2365

2141

2366

2142

:param revision_ids: The expected revision ids of the inventories.

2367

:param ordering: optional ordering, e.g. 'topological'. If not

2368

specified, the order of revision_ids will be preserved (by

2369

buffering if necessary).

2370

2143

:return: An iterator of inventories.

2371

2144

"""

2372

2145

if ((None in revision_ids)

2373

2146

or (_mod_revision.NULL_REVISION in revision_ids)):

2374

2147

raise ValueError('cannot get null revision inventory')

2375

return self._iter_inventories(revision_ids, ordering)

2148

return self._iter_inventories(revision_ids)

2376

2149

2377

def _iter_inventories(self, revision_ids, ordering):

2150

def _iter_inventories(self, revision_ids):

2378

2151

"""single-document based inventory iteration."""

2379

inv_xmls = self._iter_inventory_xmls(revision_ids, ordering)

2380

for text, revision_id in inv_xmls:

2152

for text, revision_id in self._iter_inventory_xmls(revision_ids):

2381

2153

yield self.deserialise_inventory(revision_id, text)

2382

2154

2383

def _iter_inventory_xmls(self, revision_ids, ordering):

2384

if ordering is None:

2385

order_as_requested = True

2386

ordering = 'unordered'

2387

else:

2388

order_as_requested = False

2155

def _iter_inventory_xmls(self, revision_ids):

2389

2156

keys = [(revision_id,) for revision_id in revision_ids]

2390

if not keys:

2391

return

2392

if order_as_requested:

2393

key_iter = iter(keys)

2394

next_key = key_iter.next()

2395

stream = self.inventories.get_record_stream(keys, ordering, True)

2157

stream = self.inventories.get_record_stream(keys, 'unordered', True)

2396

2158

text_chunks = {}

2397

2159

for record in stream:

2398

2160

if record.storage_kind != 'absent':

2399

chunks = record.get_bytes_as('chunked')

2400

if order_as_requested:

2401

text_chunks[record.key] = chunks

2402

else:

2403

yield ''.join(chunks), record.key[-1]

2161

text_chunks[record.key] = record.get_bytes_as('chunked')

2404

2162

else:

2405

2163

raise errors.NoSuchRevision(self, record.key)

2406

if order_as_requested:

2407

# Yield as many results as we can while preserving order.

2408

while next_key in text_chunks:

2409

chunks = text_chunks.pop(next_key)

2410

yield ''.join(chunks), next_key[-1]

2411

try:

2412

next_key = key_iter.next()

2413

except StopIteration:

2414

# We still want to fully consume the get_record_stream,

2415

# just in case it is not actually finished at this point

2416

next_key = None

2417

break

2164

for key in keys:

2165

chunks = text_chunks.pop(key)

2166

yield ''.join(chunks), key[-1]

2418

2167

2419

2168

def deserialise_inventory(self, revision_id, xml):

2420

2169

"""Transform the xml into an inventory object.

2441

2190

@needs_read_lock

2442

2191

def get_inventory_xml(self, revision_id):

2443

2192

"""Get inventory XML as a file object."""

2444

texts = self._iter_inventory_xmls([revision_id], 'unordered')

2193

texts = self._iter_inventory_xmls([revision_id])

2445

2194

try:

2446

2195

text, revision_id = texts.next()

2447

2196

except StopIteration:

2454

2203

"""

2455

2204

return self.get_revision(revision_id).inventory_sha1

2456

2205

2457

def get_rev_id_for_revno(self, revno, known_pair):

2458

"""Return the revision id of a revno, given a later (revno, revid)

2459

pair in the same history.

2460

2461

:return: if found (True, revid). If the available history ran out

2462

before reaching the revno, then this returns

2463

(False, (closest_revno, closest_revid)).

2464

"""

2465

known_revno, known_revid = known_pair

2466

partial_history = [known_revid]

2467

distance_from_known = known_revno - revno

2468

if distance_from_known < 0:

2469

raise ValueError(

2470

'requested revno (%d) is later than given known revno (%d)'

2471

% (revno, known_revno))

2472

try:

2473

_iter_for_revno(

2474

self, partial_history, stop_index=distance_from_known)

2475

except errors.RevisionNotPresent, err:

2476

if err.revision_id == known_revid:

2477

# The start revision (known_revid) wasn't found.

2478

raise

2479

# This is a stacked repository with no fallbacks, or there's a

2480

# left-hand ghost. Either way, even though the revision named in

2481

# the error isn't in this repo, we know it's the next step in this

2482

# left-hand history.

2483

partial_history.append(err.revision_id)

2484

if len(partial_history) <= distance_from_known:

2485

# Didn't find enough history to get a revid for the revno.

2486

earliest_revno = known_revno - len(partial_history) + 1

2487

return (False, (earliest_revno, partial_history[-1]))

2488

if len(partial_history) - 1 > distance_from_known:

2489

raise AssertionError('_iter_for_revno returned too much history')

2490

return (True, partial_history[-1])

2491

2492

2206

def iter_reverse_revision_history(self, revision_id):

2493

2207

"""Iterate backwards through revision ids in the lefthand history

2494

2208

2500

2214

while True:

2501

2215

if next_id in (None, _mod_revision.NULL_REVISION):

2502

2216

return

2503

try:

2504

parents = graph.get_parent_map([next_id])[next_id]

2505

except KeyError:

2506

raise errors.RevisionNotPresent(next_id, self)

2507

2217

yield next_id

2218

# Note: The following line may raise KeyError in the event of

2219

# truncated history. We decided not to have a try:except:raise

2220

# RevisionNotPresent here until we see a use for it, because of the

2221

# cost in an inner loop that is by its very nature O(history).

2222

# Robert Collins 20080326

2223

parents = graph.get_parent_map([next_id])[next_id]

2508

2224

if len(parents) == 0:

2509

2225

return

2510

2226

else:

2624

2340

keys = tsort.topo_sort(parent_map)

2625

2341

return [None] + list(keys)

2626

2342

2627

def pack(self, hint=None):

2343

def pack(self):

2628

2344

"""Compress the data within the repository.

2629

2345

2630

2346

This operation only makes sense for some repository types. For other

2633

2349

This stub method does not require a lock, but subclasses should use

2634

2350

@needs_write_lock as this is a long running call it's reasonable to

2635

2351

implicitly lock for the user.

2636

2637

:param hint: If not supplied, the whole repository is packed.

2638

If supplied, the repository may use the hint parameter as a

2639

hint for the parts of the repository to pack. A hint can be

2640

obtained from the result of commit_write_group(). Out of

2641

date hints are simply ignored, because concurrent operations

2642

can obsolete them rapidly.

2643

2352

"""

2644

2353

2645

2354

def get_transaction(self):

2646

2355

return self.control_files.get_transaction()

2647

2356

2648

2357

def get_parent_map(self, revision_ids):

2649

"""See graph.StackedParentsProvider.get_parent_map"""

2358

"""See graph._StackedParentsProvider.get_parent_map"""

2650

2359

# revisions index works in keys; this just works in revisions

2651

2360

# therefore wrap and unwrap

2652

2361

query_keys = []

2675

2384

parents_provider = self._make_parents_provider()

2676

2385

if (other_repository is not None and

2677

2386

not self.has_same_location(other_repository)):

2678

parents_provider = graph.StackedParentsProvider(

2387

parents_provider = graph._StackedParentsProvider(

2679

2388

[parents_provider, other_repository._make_parents_provider()])

2680

2389

return graph.Graph(parents_provider)

2681

2390

2682

def _get_versioned_file_checker(self, text_key_references=None,

2683

ancestors=None):

2391

def _get_versioned_file_checker(self, text_key_references=None):

2684

2392

"""Return an object suitable for checking versioned files.

2685

2393

2686

2394

:param text_key_references: if non-None, an already built

2688

2396

to whether they were referred to by the inventory of the

2689

2397

revision_id that they contain. If None, this will be

2690

2398

calculated.

2691

:param ancestors: Optional result from

2692

self.get_graph().get_parent_map(self.all_revision_ids()) if already

2693

available.

2694

2399

"""

2695

2400

return _VersionedFileChecker(self,

2696

text_key_references=text_key_references, ancestors=ancestors)

2401

text_key_references=text_key_references)

2697

2402

2698

2403

def revision_ids_to_search_result(self, result_set):

2699

2404

"""Convert a set of revision ids to a graph SearchResult."""

2749

2454

return record.get_bytes_as('fulltext')

2750

2455

2751

2456

@needs_read_lock

2752

def check(self, revision_ids=None, callback_refs=None, check_repo=True):

2457

def check(self, revision_ids=None):

2753

2458

"""Check consistency of all history of given revision_ids.

2754

2459

2755

2460

Different repository implementations should override _check().

2756

2461

2757

2462

:param revision_ids: A non-empty list of revision_ids whose ancestry

2758

2463

will be checked. Typically the last revision_id of a branch.

2759

:param callback_refs: A dict of check-refs to resolve and callback

2760

the check/_check method on the items listed as wanting the ref.

2761

see bzrlib.check.

2762

:param check_repo: If False do not check the repository contents, just

2763

calculate the data callback_refs requires and call them back.

2764

2464

"""

2765

return self._check(revision_ids, callback_refs=callback_refs,

2766

check_repo=check_repo)

2465

# TODO: Reinstate or confirm its obsolescence.

2466

# from Branch.check - a cross check that the parents index

2467

# (iter_reverse_revision_history uses that) and the revision objects

2468

# match up.

2469

#real_rev_history = list(self.repository.iter_reverse_revision_history(

2470

# last_revision_id))

2471

#real_rev_history.reverse()

2472

2473

#mainline_parent_id = None

2474

#for revision_id in real_rev_history:

2475

# try:

2476

# revision = self.repository.get_revision(revision_id)

2477

# except errors.NoSuchRevision, e:

2478

# result.errors.append(errors.BzrCheckError(

2479

# "mainline revision {%s} not in repository" % revision_id))

2480

# break

2481

# # In general the first entry on the revision history has no parents.

2482

# # But it's not illegal for it to have parents listed; this can happen

2483

# # in imports from Arch when the parents weren't reachable.

2484

# if mainline_parent_id is not None:

2485

# if mainline_parent_id not in revision.parent_ids:

2486

# raise errors.BzrCheckError("previous revision {%s} not listed among "

2487

# "parents of {%s}"

2488

# % (mainline_parent_id, revision_id))

2489

# mainline_parent_id = revision_id

2490

return self._check(revision_ids)

2767

2491

2768

def _check(self, revision_ids, callback_refs, check_repo):

2769

result = check.Check(self, check_repo=check_repo)

2770

result.check(callback_refs)

2492

def _check(self, revision_ids):

2493

result = check.Check(self)

2494

result.check()

2771

2495

return result

2772

2496

2773

2497

def _warn_if_deprecated(self):

3058

2782

# Does this format have < O(tree_size) delta generation? Used to hint what

3059

2783

# code path for commit, amongst other things.

3060

2784

fast_deltas = None

3061

# Does doing a pack operation compress data? Useful for the pack UI command

3062

# (so if there is one pack, the operation can still proceed because it may

3063

# help), and for fetching when data won't have come from the same

3064

# compressor.

3065

pack_compresses = False

3066

# Does the repository inventory storage understand references to trees?

3067

supports_tree_reference = None

3068

2785

3069

2786

def __str__(self):

3070

2787

return "<%s>" % self.__class__.__name__

3174

2891

raise NotImplementedError(self.network_name)

3175

2892

3176

2893

def check_conversion_target(self, target_format):

3177

if self.rich_root_data and not target_format.rich_root_data:

3178

raise errors.BadConversionTarget(

3179

'Does not support rich root data.', target_format,

3180

from_format=self)

3181

if (self.supports_tree_reference and

3182

not getattr(target_format, 'supports_tree_reference', False)):

3183

raise errors.BadConversionTarget(

3184

'Does not support nested trees', target_format,

3185

from_format=self)

2894

raise NotImplementedError(self.check_conversion_target)

3186

2895

3187

2896

def open(self, a_bzrdir, _found=False):

3188

2897

"""Return an instance of this format for the bzrdir a_bzrdir.

3347

3056

'RepositoryFormatCHK1',

3348

3057

)

3349

3058

3350

format_registry.register_lazy(

3351

'Bazaar development format - chk repository with bencode revision '

3352

'serialization (needs bzr.dev from 1.16)\n',

3353

'bzrlib.repofmt.groupcompress_repo',

3354

'RepositoryFormatCHK2',

3355

)

3356

format_registry.register_lazy(

3357

'Bazaar repository format 2a (needs bzr 1.16 or later)\n',

3358

'bzrlib.repofmt.groupcompress_repo',

3359

'RepositoryFormat2a',

3360

)

3361

3362

3059

3363

3060

class InterRepository(InterObject):

3364

3061

"""This class represents operations taking place between two repositories.

3585

3282

self.target.texts.insert_record_stream(

3586

3283

self.source.texts.get_record_stream(

3587

3284

self.source.texts.keys(), 'topological', False))

3588

pb.update('Copying inventory', 0, 1)

3285

pb.update('copying inventory', 0, 1)

3589

3286

self.target.inventories.insert_record_stream(

3590

3287

self.source.inventories.get_record_stream(

3591

3288

self.source.inventories.keys(), 'topological', False))

3705

3402

return self.source.revision_ids_to_search_result(result_set)

3706

3403

3707

3404

3405

class InterPackRepo(InterSameDataRepository):

3406

"""Optimised code paths between Pack based repositories."""

3407

3408

@classmethod

3409

def _get_repo_format_to_test(self):

3410

from bzrlib.repofmt import pack_repo

3411

return pack_repo.RepositoryFormatKnitPack6RichRoot()

3412

3413

@staticmethod

3414

def is_compatible(source, target):

3415

"""Be compatible with known Pack formats.

3416

3417

We don't test for the stores being of specific types because that

3418

could lead to confusing results, and there is no need to be

3419

overly general.

3420

3421

InterPackRepo does not support CHK based repositories.

3422

"""

3423

from bzrlib.repofmt.pack_repo import RepositoryFormatPack

3424

from bzrlib.repofmt.groupcompress_repo import RepositoryFormatCHK1

3425

try:

3426

are_packs = (isinstance(source._format, RepositoryFormatPack) and

3427

isinstance(target._format, RepositoryFormatPack))

3428

not_packs = (isinstance(source._format, RepositoryFormatCHK1) or

3429

isinstance(target._format, RepositoryFormatCHK1))

3430

except AttributeError:

3431

return False

3432

if not_packs or not are_packs:

3433

return False

3434

return InterRepository._same_model(source, target)

3435

3436

@needs_write_lock

3437

def fetch(self, revision_id=None, pb=None, find_ghosts=False,

3438

fetch_spec=None):

3439

"""See InterRepository.fetch()."""

3440

if (len(self.source._fallback_repositories) > 0 or

3441

len(self.target._fallback_repositories) > 0):

3442

# The pack layer is not aware of fallback repositories, so when

3443

# fetching from a stacked repository or into a stacked repository

3444

# we use the generic fetch logic which uses the VersionedFiles

3445

# attributes on repository.

3446

from bzrlib.fetch import RepoFetcher

3447

fetcher = RepoFetcher(self.target, self.source, revision_id,

3448

pb, find_ghosts, fetch_spec=fetch_spec)

3449

if fetch_spec is not None:

3450

if len(list(fetch_spec.heads)) != 1:

3451

raise AssertionError(

3452

"InterPackRepo.fetch doesn't support "

3453

"fetching multiple heads yet.")

3454

revision_id = list(fetch_spec.heads)[0]

3455

fetch_spec = None

3456

if revision_id is None:

3457

# TODO:

3458

# everything to do - use pack logic

3459

# to fetch from all packs to one without

3460

# inventory parsing etc, IFF nothing to be copied is in the target.

3461

# till then:

3462

source_revision_ids = frozenset(self.source.all_revision_ids())

3463

revision_ids = source_revision_ids - \

3464

frozenset(self.target.get_parent_map(source_revision_ids))

3465

revision_keys = [(revid,) for revid in revision_ids]

3466

index = self.target._pack_collection.revision_index.combined_index

3467

present_revision_ids = set(item[1][0] for item in

3468

index.iter_entries(revision_keys))

3469

revision_ids = set(revision_ids) - present_revision_ids

3470

# implementing the TODO will involve:

3471

# - detecting when all of a pack is selected

3472

# - avoiding as much as possible pre-selection, so the

3473

# more-core routines such as create_pack_from_packs can filter in

3474

# a just-in-time fashion. (though having a HEADS list on a

3475

# repository might make this a lot easier, because we could

3476

# sensibly detect 'new revisions' without doing a full index scan.

3477

elif _mod_revision.is_null(revision_id):

3478

# nothing to do:

3479

return (0, [])

3480

else:

3481

revision_ids = self.search_missing_revision_ids(revision_id,

3482

find_ghosts=find_ghosts).get_keys()

3483

if len(revision_ids) == 0:

3484

return (0, [])

3485

return self._pack(self.source, self.target, revision_ids)

3486

3487

def _pack(self, source, target, revision_ids):
    """Pack the requested revisions from source's packs into the target.

    Note that the ``target`` argument is not consulted; the pack is always
    created in ``self.target``'s pack collection.

    :param source: Repository whose packs are read.
    :param target: Unused (see above).
    :param revision_ids: The revision ids handed to the Packer.
    :return: A ``(copied_revision_count, [])`` tuple; the count is 0 when
        the Packer did not produce a pack.
    """
    from bzrlib.repofmt.pack_repo import Packer
    source_packs = source._pack_collection.all_packs()
    target_collection = self.target._pack_collection
    packer = Packer(target_collection, source_packs, '.fetch', revision_ids)
    new_pack = packer.pack()
    if new_pack is None:
        # Nothing was written, so there is nothing to save or repack.
        return (0, [])
    target_collection._save_pack_names()
    revision_count = new_pack.get_revision_count()
    # Trigger an autopack. This may duplicate effort as we've just done
    # a pack creation, but for now it is simpler to think about as
    # 'upload data, then repack if needed'.
    target_collection.autopack()
    return (revision_count, [])

3502

3503

@needs_read_lock
def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):
    """See InterRepository.missing_revision_ids().

    :param revision_id: When given, only the ancestry of this revision is
        searched; when None, every revision id in the source is a candidate.
    :param find_ghosts: Find ghosts throughout the ancestry of
        revision_id.
    :return: Whatever ``self.source.revision_ids_to_search_result`` builds
        for the missing ids, or the result of
        ``_walk_to_common_revisions`` when find_ghosts is false and a
        revision_id was supplied.
    :raises errors.NoSuchRevision: if revision_id itself turns out to be a
        ghost during the ghost-finding search.
    """
    if revision_id is None:
        # Everything in the source is the worst possible case we may need
        # to pull; filter it against what the target already holds.
        all_source_ids = self.source.all_revision_ids()
        all_target_ids = set(self.target.all_revision_ids())
        missing = set(all_source_ids).difference(all_target_ids)
        return self.source.revision_ids_to_search_result(missing)

    if not find_ghosts:
        return self._walk_to_common_revisions([revision_id])

    # Find ghosts: search for revisions pointing from one repository to
    # the other, and vice versa, anywhere in the history of revision_id.
    graph = self.target.get_graph(other_repository=self.source)
    searcher = graph._make_breadth_first_searcher([revision_id])
    seen_ids = set()
    while True:
        try:
            revs, ghosts = searcher.next_with_ghosts()
        except StopIteration:
            break
        if revision_id in ghosts:
            raise errors.NoSuchRevision(self.source, revision_id)
        seen_ids.update(revs)
        seen_ids.update(ghosts)
    seen_ids = frozenset(seen_ids)
    # Double query here: should be able to avoid this by changing the
    # graph api further.
    present_in_target = frozenset(self.target.get_parent_map(seen_ids))
    return self.source.revision_ids_to_search_result(
        seen_ids - present_in_target)

3541

3542

3708

3543

class InterDifferingSerializer(InterRepository):

3709

3544

3710

3545

@classmethod

3717

3552

# This is redundant with format.check_conversion_target(), however that

3718

3553

# raises an exception, and we just want to say "False" as in we won't

3719

3554

# support converting between these formats.

3720

if 'IDS_never' in debug.debug_flags:

3721

return False

3722

3555

if source.supports_rich_root() and not target.supports_rich_root():

3723

3556

return False

3724

3557

if (source._format.supports_tree_reference

3725

3558

and not target._format.supports_tree_reference):

3726

3559

return False

3727

if target._fallback_repositories and target._format.supports_chks:

3728

# IDS doesn't know how to copy CHKs for the parent inventories it

3729

# adds to stacked repos.

3730

return False

3731

if 'IDS_always' in debug.debug_flags:

3732

return True

3733

# Only use this code path for local source and target. IDS does far

3734

# too much IO (both bandwidth and roundtrips) over a network.

3735

if not source.bzrdir.transport.base.startswith('file:///'):

3736

return False

3737

if not target.bzrdir.transport.base.startswith('file:///'):

3738

return False

3739

3560

return True

3740

3561

3741

def _get_trees(self, revision_ids, cache):
    """Collect (revision_id, tree) pairs for the revisions that can be read.

    Trees already in ``cache`` are reused. Any other revision is looked up
    in ``self.source``; on success the tree is stored in ``cache`` before
    being returned. Revisions for which the source raises
    ``errors.NoSuchRevision`` are silently left out.

    :param revision_ids: Iterable of revision ids to look up.
    :param cache: Mapping of revision id to tree; updated in place.
    :return: A list of (revision_id, tree) tuples, in input order.
    """
    found = []
    for revision_id in revision_ids:
        if revision_id in cache:
            found.append((revision_id, cache[revision_id]))
            continue
        # Not cached, but inventory might be present anyway.
        try:
            tree = self.source.revision_tree(revision_id)
        except errors.NoSuchRevision:
            # Nope, parent is ghost.
            continue
        cache[revision_id] = tree
        found.append((revision_id, tree))
    return found

3757

3758

def _get_delta_for_revision(self, tree, parent_ids, possible_trees):

3562

def _get_delta_for_revision(self, tree, parent_ids, basis_id, cache):

3759

3563

"""Get the best delta and base for this revision.

3760

3564

3761

3565

:return: (basis_id, delta)

3762

3566

"""

3567

possible_trees = [(parent_id, cache[parent_id])

3568

for parent_id in parent_ids

3569

if parent_id in cache]

3570

if len(possible_trees) == 0:

3571

# There either aren't any parents, or the parents aren't in the

3572

# cache, so just use the last converted tree

3573

possible_trees.append((basis_id, cache[basis_id]))

3763

3574

deltas = []

3764

# Generate deltas against each tree, to find the shortest.

3765

texts_possibly_new_in_tree = set()

3766

3575

for basis_id, basis_tree in possible_trees:

3767

3576

delta = tree.inventory._make_delta(basis_tree.inventory)

3768

for old_path, new_path, file_id, new_entry in delta:

3769

if new_path is None:

3770

# This file_id isn't present in the new rev, so we don't

3771

# care about it.

3772

continue

3773

if not new_path:

3774

# Rich roots are handled elsewhere...

3775

continue

3776

kind = new_entry.kind

3777

if kind != 'directory' and kind != 'file':

3778

# No text record associated with this inventory entry.

3779

continue

3780

# This is a directory or file that has changed somehow.

3781

texts_possibly_new_in_tree.add((file_id, new_entry.revision))

3782

3577

deltas.append((len(delta), basis_id, delta))

3783

3578

deltas.sort()

3784

3579

return deltas[0][1:]

3785

3580

3786

def _fetch_parent_invs_for_stacking(self, parent_map, cache):

3787

"""Find all parent revisions that are absent, but for which the

3788

inventory is present, and copy those inventories.

3581

def _get_parent_keys(self, root_key, parent_map):
    """Get the parent keys for a given root id.

    :param root_key: A (root_id, revision_id) tuple.
    :param parent_map: Mapping of revision id to its parent revision ids;
        it must contain the revision id from root_key.
    :return: A tuple of (root_id, parent_id) keys, one for each direct
        parent whose root id equals root_id or whose root id could not be
        determined (ghost parents).
    """
    root_id, rev_id = root_key
    # Include direct parents of the revision, but only if they used
    # the same root_id.
    parent_keys = []
    for parent_id in parent_map[rev_id]:
        if parent_id == _mod_revision.NULL_REVISION:
            continue
        if parent_id not in self._revision_id_to_root_id:
            # We probably didn't read this revision, go spend the
            # extra effort to actually check
            try:
                tree = self.source.revision_tree(parent_id)
            except errors.NoSuchRevision:
                # Ghost: we don't really know its root id, so record None.
                parent_root_id = None
            else:
                parent_root_id = tree.get_root_id()
            # Remember what we found in case we encounter this parent
            # again. Caching the computed value (rather than always None)
            # keeps later lookups consistent with the first one: a cached
            # None is treated as "unknown" below and would accept the
            # parent even when its root id differs.
            self._revision_id_to_root_id[parent_id] = parent_root_id
        else:
            parent_root_id = self._revision_id_to_root_id[parent_id]
        if root_id == parent_root_id or parent_root_id is None:
            parent_keys.append((root_id, parent_id))
    return tuple(parent_keys)

3789

3608

3790

This is necessary to preserve correctness when the source is stacked

3791

without fallbacks configured. (Note that in cases like upgrade the

3792

source may not have _fallback_repositories even though it is

3793

stacked.)

3794

"""

3795

parent_revs = set()

3796

for parents in parent_map.values():

3797

parent_revs.update(parents)

3798

present_parents = self.source.get_parent_map(parent_revs)

3799

absent_parents = set(parent_revs).difference(present_parents)

3800

parent_invs_keys_for_stacking = self.source.inventories.get_parent_map(

3801

(rev_id,) for rev_id in absent_parents)

3802

parent_inv_ids = [key[-1] for key in parent_invs_keys_for_stacking]

3803

for parent_tree in self.source.revision_trees(parent_inv_ids):

3804

current_revision_id = parent_tree.get_revision_id()

3805

parents_parents_keys = parent_invs_keys_for_stacking[

3806

(current_revision_id,)]

3807

parents_parents = [key[-1] for key in parents_parents_keys]

3808

basis_id = _mod_revision.NULL_REVISION

3809

basis_tree = self.source.revision_tree(basis_id)

3810

delta = parent_tree.inventory._make_delta(basis_tree.inventory)

3811

self.target.add_inventory_by_delta(

3812

basis_id, delta, current_revision_id, parents_parents)

3813

cache[current_revision_id] = parent_tree

3609

def _new_root_data_stream(self, root_keys_to_create, parent_map):
    """Yield an empty-text record for every root key that must be created.

    :param root_keys_to_create: Iterable of root keys; each is passed to
        ``_get_parent_keys`` together with parent_map.
    :param parent_map: Mapping handed through to ``_get_parent_keys``.
    :return: A generator of ``versionedfile.FulltextContentFactory``
        records whose text is the empty string.
    """
    for key in root_keys_to_create:
        parents = self._get_parent_keys(key, parent_map)
        record = versionedfile.FulltextContentFactory(key, parents, None, '')
        yield record

3814

3614

3815

3615

def _fetch_batch(self, revision_ids, basis_id, cache):

3816

3616

"""Fetch across a few revisions.

3830

3630

pending_deltas = []

3831

3631

pending_revisions = []

3832

3632

parent_map = self.source.get_parent_map(revision_ids)

3833

self._fetch_parent_invs_for_stacking(parent_map, cache)

3834

3633

for tree in self.source.revision_trees(revision_ids):

3835

# Find an inventory delta for this revision.

3836

# Find text entries that need to be copied, too.

3837

3634

current_revision_id = tree.get_revision_id()

3838

3635

parent_ids = parent_map.get(current_revision_id, ())

3839

parent_trees = self._get_trees(parent_ids, cache)

3840

possible_trees = list(parent_trees)

3841

if len(possible_trees) == 0:

3842

# There either aren't any parents, or the parents are ghosts,

3843

# so just use the last converted tree.

3844

possible_trees.append((basis_id, cache[basis_id]))

3845

3636

basis_id, delta = self._get_delta_for_revision(tree, parent_ids,

3846

possible_trees)

3847

revision = self.source.get_revision(current_revision_id)

3848

pending_deltas.append((basis_id, delta,

3849

current_revision_id, revision.parent_ids))

3637

basis_id, cache)

3850

3638

if self._converting_to_rich_root:

3851

3639

self._revision_id_to_root_id[current_revision_id] = \

3852

3640

tree.get_root_id()

3853

# Determine which texts are present in this revision but not in

3854

# any of the available parents.

3855

texts_possibly_new_in_tree = set()

3641

# Find text entries that need to be copied

3856

3642

for old_path, new_path, file_id, entry in delta:

3857

if new_path is None:

3858

# This file_id isn't present in the new rev

3859

continue

3860

if not new_path:

3861

# This is the root

3862

if not self.target.supports_rich_root():

3863

# The target doesn't support rich root, so we don't

3864

# copy

3865

continue

3866

if self._converting_to_rich_root:

3867

# This can't be copied normally, we have to insert

3868

# it specially

3869

root_keys_to_create.add((file_id, entry.revision))

3870

continue

3871

kind = entry.kind

3872

texts_possibly_new_in_tree.add((file_id, entry.revision))

3873

for basis_id, basis_tree in possible_trees:

3874

basis_inv = basis_tree.inventory

3875

for file_key in list(texts_possibly_new_in_tree):

3876

file_id, file_revision = file_key

3877

try:

3878

entry = basis_inv[file_id]

3879

except errors.NoSuchId:

3880

continue

3881

if entry.revision == file_revision:

3882

texts_possibly_new_in_tree.remove(file_key)

3883

text_keys.update(texts_possibly_new_in_tree)

3643

if new_path is not None:

3644

if not new_path:

3645

# This is the root

3646

if not self.target.supports_rich_root():

3647

# The target doesn't support rich root, so we don't

3648

# copy

3649

continue

3650

if self._converting_to_rich_root:

3651

# This can't be copied normally, we have to insert

3652

# it specially

3653

root_keys_to_create.add((file_id, entry.revision))

3654

continue

3655

text_keys.add((file_id, entry.revision))

3656

revision = self.source.get_revision(current_revision_id)

3657

pending_deltas.append((basis_id, delta,

3658

current_revision_id, revision.parent_ids))

3884

3659

pending_revisions.append(revision)

3885

3660

cache[current_revision_id] = tree

3886

3661

basis_id = current_revision_id

3888

3663

from_texts = self.source.texts

3889

3664

to_texts = self.target.texts

3890

3665

if root_keys_to_create:

3891

from bzrlib.fetch import _new_root_data_stream

3892

root_stream = _new_root_data_stream(

3893

root_keys_to_create, self._revision_id_to_root_id, parent_map,

3894

self.source)

3666

root_stream = self._new_root_data_stream(root_keys_to_create,

3667

parent_map)

3895

3668

to_texts.insert_record_stream(root_stream)

3896

3669

to_texts.insert_record_stream(from_texts.get_record_stream(

3897

3670

text_keys, self.target._format._fetch_order,

3904

3677

# for the new revisions that we are about to insert. We do this

3905

3678

# before adding the revisions so that no revision is added until

3906

3679

# all the inventories it may depend on are added.

3907

# Note that this is overzealous, as we may have fetched these in an

3908

# earlier batch.

3909

3680

parent_ids = set()

3910

3681

revision_ids = set()

3911

3682

for revision in pending_revisions:

3914

3685

parent_ids.difference_update(revision_ids)

3915

3686

parent_ids.discard(_mod_revision.NULL_REVISION)

3916

3687

parent_map = self.source.get_parent_map(parent_ids)

3917

# we iterate over parent_map and not parent_ids because we don't

3918

# want to try copying any revision which is a ghost

3919

for parent_tree in self.source.revision_trees(parent_map):

3688

for parent_tree in self.source.revision_trees(parent_ids):

3689

basis_id, delta = self._get_delta_for_revision(tree, parent_ids, basis_id, cache)

3920

3690

current_revision_id = parent_tree.get_revision_id()

3921

3691

parents_parents = parent_map[current_revision_id]

3922

possible_trees = self._get_trees(parents_parents, cache)

3923

if len(possible_trees) == 0:

3924

# There either aren't any parents, or the parents are

3925

# ghosts, so just use the last converted tree.

3926

possible_trees.append((basis_id, cache[basis_id]))

3927

basis_id, delta = self._get_delta_for_revision(parent_tree,

3928

parents_parents, possible_trees)

3929

3692

self.target.add_inventory_by_delta(

3930

3693

basis_id, delta, current_revision_id, parents_parents)

3931

3694

# insert signatures and revisions

3945

3708

3946

3709

:param revision_ids: The list of revisions to fetch. Must be in

3947

3710

topological order.

3948

:param pb: A ProgressTask

3711

:param pb: A ProgressBar

3949

3712

:return: None

3950

3713

"""

3951

3714

basis_id, basis_tree = self._get_basis(revision_ids[0])

3953

3716

cache = lru_cache.LRUCache(100)

3954

3717

cache[basis_id] = basis_tree

3955

3718

del basis_tree # We don't want to hang on to it here

3956

hints = []

3957

3719

for offset in range(0, len(revision_ids), batch_size):

3958

3720

self.target.start_write_group()

3959

3721

try:

3965

3727

self.target.abort_write_group()

3966

3728

raise

3967

3729

else:

3968

hint = self.target.commit_write_group()

3969

if hint:

3970

hints.extend(hint)

3971

if hints and self.target._format.pack_compresses:

3972

self.target.pack(hint=hints)

3730

self.target.commit_write_group()

3973

3731

pb.update('Transferring revisions', len(revision_ids),

3974

3732

len(revision_ids))

3975

3733

3996

3754

# Walk through all revisions; get inventory deltas, copy referenced

3997

3755

# texts that delta references, insert the delta, revision and

3998

3756

# signature.

3757

first_rev = self.source.get_revision(revision_ids[0])

3999

3758

if pb is None:

4000

3759

my_pb = ui.ui_factory.nested_progress_bar()

4001

3760

pb = my_pb

4038

3797

InterRepository.register_optimiser(InterSameDataRepository)

4039

3798

InterRepository.register_optimiser(InterWeaveRepo)

4040

3799

InterRepository.register_optimiser(InterKnitRepo)

3800

InterRepository.register_optimiser(InterPackRepo)

4041

3801

4042

3802

4043

3803

class CopyConverter(object):

4078

3838

self.source_repo.is_shared())

4079

3839

converted.lock_write()

4080

3840

try:

4081

self.step('Copying content')

3841

self.step('Copying content into repository.')

4082

3842

self.source_repo.copy_content_into(converted)

4083

3843

finally:

4084

3844

converted.unlock()

4085

self.step('Deleting old repository content')

3845

self.step('Deleting old repository content.')

4086

3846

self.repo_dir.transport.delete_tree('repository.backup')

4087

3847

self.pb.note('repository converted')

4088

3848

4124

3884

4125

3885

class _VersionedFileChecker(object):

4126

3886

4127

def __init__(self, repository, text_key_references=None, ancestors=None):

3887

def __init__(self, repository, text_key_references=None):

4128

3888

self.repository = repository

4129

3889

self.text_index = self.repository._generate_text_key_index(

4130

text_key_references=text_key_references, ancestors=ancestors)

3890

text_key_references=text_key_references)

4131

3891

4132

3892

def calculate_file_version_parents(self, text_key):

4133

3893

"""Calculate the correct parents for a file version according to

4151

3911

revision_id) tuples for versions that are present in this versioned

4152

3912

file, but not used by the corresponding inventory.

4153

3913

"""

4154

local_progress = None

4155

if progress_bar is None:

4156

local_progress = ui.ui_factory.nested_progress_bar()

4157

progress_bar = local_progress

4158

try:

4159

return self._check_file_version_parents(texts, progress_bar)

4160

finally:

4161

if local_progress:

4162

local_progress.finished()

4163

4164

def _check_file_version_parents(self, texts, progress_bar):

4165

"""See check_file_version_parents."""

4166

3914

wrong_parents = {}

4167

3915

self.file_ids = set([file_id for file_id, _ in

4168

3916

self.text_index.iterkeys()])

4169

3917

# text keys is now grouped by file_id

3918

n_weaves = len(self.file_ids)

3919

files_in_revisions = {}

3920

revisions_of_files = {}

4170

3921

n_versions = len(self.text_index)

4171

3922

progress_bar.update('loading text store', 0, n_versions)

4172

3923

parent_map = self.repository.texts.get_parent_map(self.text_index)

4174

3925

text_keys = self.repository.texts.keys()

4175

3926

unused_keys = frozenset(text_keys) - set(self.text_index)

4176

3927

for num, key in enumerate(self.text_index.iterkeys()):

4177

progress_bar.update('checking text graph', num, n_versions)

3928

if progress_bar is not None:

3929

progress_bar.update('checking text graph', num, n_versions)

4178

3930

correct_parents = self.calculate_file_version_parents(key)

4179

3931

try:

4180

3932

knit_parents = parent_map[key]

4229

3981

try:

4230

3982

if resume_tokens:

4231

3983

self.target_repo.resume_write_group(resume_tokens)

4232

is_resume = True

4233

3984

else:

4234

3985

self.target_repo.start_write_group()

4235

is_resume = False

4236

3986

try:

4237

3987

# locked_insert_stream performs a commit|suspend.

4238

return self._locked_insert_stream(stream, src_format, is_resume)

3988

return self._locked_insert_stream(stream, src_format)

4239

3989

except:

4240

3990

self.target_repo.abort_write_group(suppress_errors=True)

4241

3991

raise

4242

3992

finally:

4243

3993

self.target_repo.unlock()

4244

3994

4245

def _locked_insert_stream(self, stream, src_format, is_resume):

3995

def _locked_insert_stream(self, stream, src_format):

4246

3996

to_serializer = self.target_repo._format._serializer

4247

3997

src_serializer = src_format._serializer

4248

new_pack = None

4249

3998

if to_serializer == src_serializer:

4250

3999

# If serializers match and the target is a pack repository, set the

4251

4000

# write cache size on the new pack. This avoids poor performance

4265

4014

else:

4266

4015

new_pack.set_write_cache_size(1024*1024)

4267

4016

for substream_type, substream in stream:

4268

if 'stream' in debug.debug_flags:

4269

mutter('inserting substream: %s', substream_type)

4270

4017

if substream_type == 'texts':

4271

4018

self.target_repo.texts.insert_record_stream(substream)

4272

4019

elif substream_type == 'inventories':

4276

4023

else:

4277

4024

self._extract_and_insert_inventories(

4278

4025

substream, src_serializer)

4279

elif substream_type == 'inventory-deltas':

4280

self._extract_and_insert_inventory_deltas(

4281

substream, src_serializer)

4282

4026

elif substream_type == 'chk_bytes':

4283

4027

# XXX: This doesn't support conversions, as it assumes the

4284

4028

# conversion was done in the fetch code.

4297

4041

self.target_repo.signatures.insert_record_stream(substream)

4298

4042

else:

4299

4043

raise AssertionError('kaboom! %s' % (substream_type,))

4300

# Done inserting data, and the missing_keys calculations will try to

4301

# read back from the inserted data, so flush the writes to the new pack

4302

# (if this is pack format).

4303

if new_pack is not None:

4304

new_pack._write_data('', flush=True)

4305

4044

# Find all the new revisions (including ones from resume_tokens)

4306

missing_keys = self.target_repo.get_missing_parent_inventories(

4307

check_for_missing_texts=is_resume)

4045

missing_keys = self.target_repo.get_missing_parent_inventories()

4308

4046

try:

4309

4047

for prefix, versioned_file in (

4310

4048

('texts', self.target_repo.texts),

4311

4049

('inventories', self.target_repo.inventories),

4312

4050

('revisions', self.target_repo.revisions),

4313

4051

('signatures', self.target_repo.signatures),

4314

('chk_bytes', self.target_repo.chk_bytes),

4315

4052

4316

if versioned_file is None:

4317

continue

4318

4053

missing_keys.update((prefix,) + key for key in

4319

4054

versioned_file.get_missing_compression_parent_keys())

4320

4055

except NotImplementedError:

4329

4064

# missing keys can handle suspending a write group).

4330

4065

write_group_tokens = self.target_repo.suspend_write_group()

4331

4066

return write_group_tokens, missing_keys

4332

hint = self.target_repo.commit_write_group()

4333

if (to_serializer != src_serializer and

4334

self.target_repo._format.pack_compresses):

4335

self.target_repo.pack(hint=hint)

4067

self.target_repo.commit_write_group()

4336

4068

return [], set()

4337

4069

4338

def _extract_and_insert_inventory_deltas(self, substream, serializer):

4339

target_rich_root = self.target_repo._format.rich_root_data

4340

target_tree_refs = self.target_repo._format.supports_tree_reference

4341

for record in substream:

4342

# Insert the delta directly

4343

inventory_delta_bytes = record.get_bytes_as('fulltext')

4344

deserialiser = inventory_delta.InventoryDeltaDeserializer()

4345

try:

4346

parse_result = deserialiser.parse_text_bytes(

4347

inventory_delta_bytes)

4348

except inventory_delta.IncompatibleInventoryDelta, err:

4349

trace.mutter("Incompatible delta: %s", err.msg)

4350

raise errors.IncompatibleRevision(self.target_repo._format)

4351

basis_id, new_id, rich_root, tree_refs, inv_delta = parse_result

4352

revision_id = new_id

4353

parents = [key[0] for key in record.parents]

4354

self.target_repo.add_inventory_by_delta(

4355

basis_id, inv_delta, revision_id, parents)

4356

4357

def _extract_and_insert_inventories(self, substream, serializer,

4358

parse_delta=None):

4070

def _extract_and_insert_inventories(self, substream, serializer):

4359

4071

"""Generate a new inventory versionedfile in target, converting data.

4360

4072

4361

4073

The inventory is retrieved from the source, (deserializing it), and

4362

4074

stored in the target (reserializing it in a different format).

4363

4075

"""

4364

target_rich_root = self.target_repo._format.rich_root_data

4365

target_tree_refs = self.target_repo._format.supports_tree_reference

4366

4076

for record in substream:

4367

# It's not a delta, so it must be a fulltext in the source

4368

# serializer's format.

4369

4077

bytes = record.get_bytes_as('fulltext')

4370

4078

revision_id = record.key[0]

4371

4079

inv = serializer.read_inventory_from_string(bytes, revision_id)

4372

4080

parents = [key[0] for key in record.parents]

4373

4081

self.target_repo.add_inventory(revision_id, inv, parents)

4374

# No need to keep holding this full inv in memory when the rest of

4375

# the substream is likely to be all deltas.

4376

del inv

4377

4082

4378

4083

def _extract_and_insert_revisions(self, substream, serializer):

4379

4084

for record in substream:

4428

4133

return [('signatures', signatures), ('revisions', revisions)]

4429

4134

4430

4135

def _generate_root_texts(self, revs):

4431

"""This will be called by get_stream between fetching weave texts and

4136

"""This will be called by __fetch between fetching weave texts and

4432

4137

fetching the inventory weave.

4138

4139

Subclasses should override this if they need to generate root texts

4140

after fetching weave texts.

4433

4141

"""

4434

4142

if self._rich_root_upgrade():

4435

4143

import bzrlib.fetch

4442

4150

phase = 'file'

4443

4151

revs = search.get_keys()

4444

4152

graph = self.from_repository.get_graph()

4445

revs = tsort.topo_sort(graph.get_parent_map(revs))

4153

revs = list(graph.iter_topo_order(revs))

4446

4154

data_to_fetch = self.from_repository.item_keys_introduced_by(revs)

4447

4155

text_keys = []

4448

4156

for knit_kind, file_id, revisions in data_to_fetch:

4467

4175

# will be valid.

4468

4176

for _ in self._generate_root_texts(revs):

4469

4177

yield _

4178

# NB: This currently reopens the inventory weave in source;

4179

# using a single stream interface instead would avoid this.

4180

from_weave = self.from_repository.inventories

4470

4181

# we fetch only the referenced inventories because we do not

4471

4182

# know for unselected inventories whether all their required

4472

4183

# texts are present in the other repository - it could be

4491

4202

keys['texts'] = set()

4492

4203

keys['revisions'] = set()

4493

4204

keys['inventories'] = set()

4494

keys['chk_bytes'] = set()

4495

4205

keys['signatures'] = set()

4496

4206

for key in missing_keys:

4497

4207

keys[key[0]].add(key[1:])

4504

4214

keys['revisions'],))

4505

4215

for substream_kind, keys in keys.iteritems():

4506

4216

vf = getattr(self.from_repository, substream_kind)

4507

if vf is None and keys:

4508

raise AssertionError(

4509

"cannot fill in keys for a versioned file we don't"

4510

" have: %s needs %s" % (substream_kind, keys))

4511

if not keys:

4512

# No need to stream something we don't have

4513

continue

4514

if substream_kind == 'inventories':

4515

# Some missing keys are genuinely ghosts, filter those out.

4516

present = self.from_repository.inventories.get_parent_map(keys)

4517

revs = [key[0] for key in present]

4518

# Get the inventory stream more-or-less as we do for the

4519

# original stream; there's no reason to assume that records

4520

# direct from the source will be suitable for the sink. (Think

4521

# e.g. 2a -> 1.9-rich-root).

4522

for info in self._get_inventory_stream(revs, missing=True):

4523

yield info

4524

continue

4525

4526

4217

# Ask for full texts always so that we don't need more round trips

4527

4218

# after this stream.

4528

# Some of the missing keys are genuinely ghosts, so filter absent

4529

# records. The Sink is responsible for doing another check to

4530

# ensure that ghosts don't introduce missing data for future

4531

# fetches.

4532

stream = versionedfile.filter_absent(vf.get_record_stream(keys,

4533

self.to_format._fetch_order, True))

4219

stream = vf.get_record_stream(keys,

4220

self.to_format._fetch_order, True)

4534

4221

yield substream_kind, stream

4535

4222

4536

4223

def inventory_fetch_order(self):

4543

4230

return (not self.from_repository._format.rich_root_data and

4544

4231

self.to_format.rich_root_data)

4545

4232

4546

def _get_inventory_stream(self, revision_ids, missing=False):

4233

def _get_inventory_stream(self, revision_ids):

4547

4234

from_format = self.from_repository._format

4548

if (from_format.supports_chks and self.to_format.supports_chks and

4549

from_format.network_name() == self.to_format.network_name()):

4550

raise AssertionError(

4551

"this case should be handled by GroupCHKStreamSource")

4552

elif 'forceinvdeltas' in debug.debug_flags:

4553

return self._get_convertable_inventory_stream(revision_ids,

4554

delta_versus_null=missing)

4555

elif from_format.network_name() == self.to_format.network_name():

4556

# Same format.

4557

return self._get_simple_inventory_stream(revision_ids,

4558

missing=missing)

4559

elif (not from_format.supports_chks and not self.to_format.supports_chks

4560

and from_format._serializer == self.to_format._serializer):

4561

# Essentially the same format.

4562

return self._get_simple_inventory_stream(revision_ids,

4563

missing=missing)

4235

if (from_format.supports_chks and self.to_format.supports_chks

4236

and (from_format._serializer == self.to_format._serializer)):

4237

# Both sides support chks, and they use the same serializer, so it

4238

# is safe to transmit the chk pages and inventory pages across

4239

# as-is.

4240

return self._get_chk_inventory_stream(revision_ids)

4241

elif (not from_format.supports_chks):

4242

# Source repository doesn't support chks. So we can transmit the

4243

# inventories 'as-is' and either they are just accepted on the

4244

# target, or the Sink will properly convert it.

4245

return self._get_simple_inventory_stream(revision_ids)

4564

4246

else:

4565

# Any time we switch serializations, we want to use an

4566

# inventory-delta based approach.

4567

return self._get_convertable_inventory_stream(revision_ids,

4568

delta_versus_null=missing)

4247

# XXX: Hack to make not-chk->chk fetch: copy the inventories as

4248

# inventories. Note that this should probably be done somehow

4249

# as part of bzrlib.repository.StreamSink. Except JAM couldn't

4250

# figure out how a non-chk repository could possibly handle

4251

# deserializing an inventory stream from a chk repo, as it

4252

# doesn't have a way to understand individual pages.

4253

return self._get_convertable_inventory_stream(revision_ids)

4569

4254

4570

def _get_simple_inventory_stream(self, revision_ids, missing=False):

4571

# NB: This currently reopens the inventory weave in source;

4572

# using a single stream interface instead would avoid this.

4255

def _get_simple_inventory_stream(self, revision_ids):

4573

4256

from_weave = self.from_repository.inventories

4574

if missing:

4575

delta_closure = True

4576

else:

4577

delta_closure = not self.delta_on_metadata()

4578

4257

yield ('inventories', from_weave.get_record_stream(

4579

4258

[(rev_id,) for rev_id in revision_ids],

4580

self.inventory_fetch_order(), delta_closure))

4581

4582

def _get_convertable_inventory_stream(self, revision_ids,
                                      delta_versus_null=False):
    """Yield a single 'inventory-deltas' substream for revision_ids.

    The source is using CHKs, but the target either doesn't or it has a
    different serializer. The StreamSink code expects to be able to
    convert on the target, so we need to put bytes-on-the-wire that can
    be converted. That means inventory deltas (if the remote is <1.19,
    RemoteStreamSink will fallback to VFS to insert the deltas).

    :param revision_ids: Revision ids whose inventories are streamed.
    :param delta_versus_null: Passed through unchanged to
        ``_stream_invs_as_deltas``.
    """
    delta_stream = self._stream_invs_as_deltas(
        revision_ids, delta_versus_null=delta_versus_null)
    yield ('inventory-deltas', delta_stream)

4592

4593

def _stream_invs_as_deltas(self, revision_ids, delta_versus_null=False):

4594

"""Return a stream of inventory-deltas for the given rev ids.

4595

4596

:param revision_ids: The list of inventories to transmit

4597

:param delta_versus_null: Don't try to find a minimal delta for this

4598

entry, instead compute the delta versus the NULL_REVISION. This

4599

effectively streams a complete inventory. Used for stuff like

4600

filling in missing parents, etc.

4601

"""

4259

self.inventory_fetch_order(),

4260

not self.delta_on_metadata()))

4261

4262

def _get_chk_inventory_stream(self, revision_ids):

4263

"""Fetch the inventory texts, along with the associated chk maps."""

4264

# We want an inventory outside of the search set, so that we can filter

4265

# out uninteresting chk pages. For now we use

4266

# _find_revision_outside_set, but if we had a Search with cut_revs, we

4267

# could use that instead.

4268

start_rev_id = self.from_repository._find_revision_outside_set(

4269

revision_ids)

4270

start_rev_key = (start_rev_id,)

4271

inv_keys_to_fetch = [(rev_id,) for rev_id in revision_ids]

4272

if start_rev_id != _mod_revision.NULL_REVISION:

4273

inv_keys_to_fetch.append((start_rev_id,))

4274

# Any repo that supports chk_bytes must also support out-of-order

4275

# insertion. At least, that is how we expect it to work

4276

# We use get_record_stream instead of iter_inventories because we want

4277

# to be able to insert the stream as well. We could instead fetch

4278

# allowing deltas, and then iter_inventories, but we don't know whether

4279

# source or target is more 'local' anway.

4280

inv_stream = self.from_repository.inventories.get_record_stream(

4281

inv_keys_to_fetch, 'unordered',

4282

True) # We need them as full-texts so we can find their references

4283

uninteresting_chk_roots = set()

4284

interesting_chk_roots = set()

4285

def filter_inv_stream(inv_stream):

4286

for idx, record in enumerate(inv_stream):

4287

### child_pb.update('fetch inv', idx, len(inv_keys_to_fetch))

4288

bytes = record.get_bytes_as('fulltext')

4289

chk_inv = inventory.CHKInventory.deserialise(

4290

self.from_repository.chk_bytes, bytes, record.key)

4291

if record.key == start_rev_key:

4292

uninteresting_chk_roots.add(chk_inv.id_to_entry.key())

4293

p_id_map = chk_inv.parent_id_basename_to_file_id

4294

if p_id_map is not None:

4295

uninteresting_chk_roots.add(p_id_map.key())

4296

else:

4297

yield record

4298

interesting_chk_roots.add(chk_inv.id_to_entry.key())

4299

p_id_map = chk_inv.parent_id_basename_to_file_id

4300

if p_id_map is not None:

4301

interesting_chk_roots.add(p_id_map.key())

4302

### pb.update('fetch inventory', 0, 2)

4303

yield ('inventories', filter_inv_stream(inv_stream))

4304

# Now that we have worked out all of the interesting root nodes, grab

4305

# all of the interesting pages and insert them

4306

### pb.update('fetch inventory', 1, 2)

4307

interesting = chk_map.iter_interesting_nodes(

4308

self.from_repository.chk_bytes, interesting_chk_roots,

4309

uninteresting_chk_roots)

4310

def to_stream_adapter():

4311

"""Adapt the iter_interesting_nodes result to a single stream.

4312

4313

iter_interesting_nodes returns records as it processes them, along

4314

with keys. However, we only want to return the records themselves.

4315

"""

4316

for record, items in interesting:

4317

if record is not None:

4318

yield record

4319

# XXX: We could instead call get_record_stream(records.keys())

4320

# ATM, this will always insert the records as fulltexts, and

4321

# requires that you can hang on to records once you have gone

4322

# on to the next one. Further, it causes the target to

4323

# recompress the data. Testing shows it to be faster than

4324

# requesting the records again, though.

4325

yield ('chk_bytes', to_stream_adapter())

4326

### pb.update('fetch inventory', 2, 2)

4327

4328

def _get_convertable_inventory_stream(self, revision_ids):

4329

# XXX: One of source or target is using chks, and they don't have

4330

# compatible serializations. The StreamSink code expects to be

4331

# able to convert on the target, so we need to put

4332

# bytes-on-the-wire that can be converted

4333

yield ('inventories', self._stream_invs_as_fulltexts(revision_ids))

4334

4335

def _stream_invs_as_fulltexts(self, revision_ids):

4602

4336

from_repo = self.from_repository

4337

from_serializer = from_repo._format._serializer

4603

4338

revision_keys = [(rev_id,) for rev_id in revision_ids]

4604

4339

parent_map = from_repo.inventories.get_parent_map(revision_keys)

4605

# XXX: possibly repos could implement a more efficient iter_inv_deltas

4606

# method...

4607

inventories = self.from_repository.iter_inventories(

4608

revision_ids, 'topological')

4609

format = from_repo._format

4610

invs_sent_so_far = set([_mod_revision.NULL_REVISION])

4611

inventory_cache = lru_cache.LRUCache(50)

4612

null_inventory = from_repo.revision_tree(

4613

_mod_revision.NULL_REVISION).inventory

4614

# XXX: ideally the rich-root/tree-refs flags would be per-revision, not

4615

# per-repo (e.g. streaming a non-rich-root revision out of a rich-root

4616

# repo back into a non-rich-root repo ought to be allowed)

4617

serializer = inventory_delta.InventoryDeltaSerializer(

4618

versioned_root=format.rich_root_data,

4619

tree_references=format.supports_tree_reference)

4620

for inv in inventories:

4340

for inv in self.from_repository.iter_inventories(revision_ids):

4341

# XXX: This is a bit hackish, but it works. Basically,

4342

# CHKSerializer 'accidentally' supports

4343

# read/write_inventory_to_string, even though that is never

4344

# the format that is stored on disk. It *does* give us a

4345

# single string representation for an inventory, so live with

4346

# it for now.

4347

# This would be far better if we had a 'serialized inventory

4348

# delta' form. Then we could use 'inventory._make_delta', and

4349

# transmit that. This would both be faster to generate, and

4350

# result in fewer bytes-on-the-wire.

4351

as_bytes = from_serializer.write_inventory_to_string(inv)

4621

4352

key = (inv.revision_id,)

4622

4353

parent_keys = parent_map.get(key, ())

4623

delta = None

4624

if not delta_versus_null and parent_keys:

4625

# The caller did not ask for complete inventories and we have

4626

# some parents that we can delta against. Make a delta against

4627

# each parent so that we can find the smallest.

4628

parent_ids = [parent_key[0] for parent_key in parent_keys]

4629

for parent_id in parent_ids:

4630

if parent_id not in invs_sent_so_far:

4631

# We don't know that the remote side has this basis, so

4632

# we can't use it.

4633

continue

4634

if parent_id == _mod_revision.NULL_REVISION:

4635

parent_inv = null_inventory

4636

else:

4637

parent_inv = inventory_cache.get(parent_id, None)

4638

if parent_inv is None:

4639

parent_inv = from_repo.get_inventory(parent_id)

4640

candidate_delta = inv._make_delta(parent_inv)

4641

if (delta is None or

4642

len(delta) > len(candidate_delta)):

4643

delta = candidate_delta

4644

basis_id = parent_id

4645

if delta is None:

4646

# Either none of the parents ended up being suitable, or we

4647

# were asked to delta against NULL

4648

basis_id = _mod_revision.NULL_REVISION

4649

delta = inv._make_delta(null_inventory)

4650

invs_sent_so_far.add(inv.revision_id)

4651

inventory_cache[inv.revision_id] = inv

4652

delta_serialized = ''.join(

4653

serializer.delta_to_lines(basis_id, key[-1], delta))

4654

4354

yield versionedfile.FulltextContentFactory(

4655

key, parent_keys, None, delta_serialized)

4656

4657

4658

def _iter_for_revno(repo, partial_history_cache, stop_index=None,

4659

stop_revision=None):

4660

"""Extend the partial history to include a given index

4661

4662

If a stop_index is supplied, stop when that index has been reached.

4663

If a stop_revision is supplied, stop when that revision is

4664

encountered. Otherwise, stop when the beginning of history is

4665

reached.

4666

4667

:param stop_index: The index which should be present. When it is

4668

present, history extension will stop.

4669

:param stop_revision: The revision id which should be present. When

4670

it is encountered, history extension will stop.

4671

"""

4672

start_revision = partial_history_cache[-1]

4673

iterator = repo.iter_reverse_revision_history(start_revision)

4674

try:

4675

#skip the last revision in the list

4676

iterator.next()

4677

while True:

4678

if (stop_index is not None and

4679

len(partial_history_cache) > stop_index):

4680

break

4681

if partial_history_cache[-1] == stop_revision:

4682

break

4683

revision_id = iterator.next()

4684

partial_history_cache.append(revision_id)

4685

except StopIteration:

4686

# No more history

4687

return

4355

key, parent_keys, None, as_bytes)

4688

4356

Older »