~bzr-pqm/bzr/bzr.dev

Committer: Joe Julian
Date: 2010-01-10 02:25:31 UTC
mto: (4634.119.7 2.0)
mto: This revision was merged to the branch mainline in revision 4959.
Revision ID: joe@julianfamily.org-20100110022531-wqk61rsagz8xsiga

Added MANIFEST.in to allow bdist_rpm to have all the required include files and tools. bdist_rpm will still fail to build correctly on some distributions due to a distutils bug: http://bugs.python.org/issue644744

files added:
MANIFEST.in

README_BDIST_RPM

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/benchmarks/bench_tags.py

bzrlib/bencode.py

bzrlib/crash.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/send.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/features.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_patches_data/binary-after-normal.patch

bzrlib/tests/test_patches_data/binary.patch

bzrlib/util/bencode.py

doc/Bazaar-Logo-For-Manuals.png

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/apport.txt

doc/developers/bug-handling.txt

doc/developers/check.txt

doc/developers/conf.py

doc/developers/content-filtering.txt

doc/developers/implementation-notes.txt

doc/developers/index-plain.txt

doc/developers/miscellaneous-notes.txt

doc/developers/plans.txt

doc/developers/process.txt

doc/developers/specifications.txt

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/quick-reference/index.txt

doc/en/tutorials/index.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/quick-reference/index.txt

doc/es/user-guide/index-plain.txt

doc/index.es.txt

doc/index.ja.txt

doc/index.ru.txt

doc/ja

doc/ja/_static

doc/ja/_static/bzr icon 16.png

doc/ja/_static/bzr.ico

doc/ja/_templates

doc/ja/conf.py

doc/ja/index.txt

doc/ja/mini-tutorial

doc/ja/mini-tutorial/index.txt

doc/ja/tutorials

doc/ja/tutorials/centralized_workflow.txt

doc/ja/tutorials/index.txt

doc/ja/tutorials/tutorial.txt

doc/ja/tutorials/using_bazaar_with_launchpad.txt

doc/ja/upgrade-guide

doc/ja/upgrade-guide/data_migration.txt

doc/ja/upgrade-guide/index.txt

doc/ja/upgrade-guide/overview.txt

doc/ja/upgrade-guide/tips_and_tricks.txt

doc/ja/user-guide

doc/ja/user-guide/adv_merging.txt

doc/ja/user-guide/annotating_changes.txt

doc/ja/user-guide/bazaar_workflows.txt

doc/ja/user-guide/branching_a_project.txt

doc/ja/user-guide/browsing_history.txt

doc/ja/user-guide/bug_trackers.txt

doc/ja/user-guide/bzrtools_plugin.txt

doc/ja/user-guide/central_intro.txt

doc/ja/user-guide/configuring_bazaar.txt

doc/ja/user-guide/controlling_registration.txt

doc/ja/user-guide/core_concepts.txt

doc/ja/user-guide/distributed_intro.txt

doc/ja/user-guide/entering_commands.txt

doc/ja/user-guide/filtered_views.txt

doc/ja/user-guide/getting_help.txt

doc/ja/user-guide/hooks.txt

doc/ja/user-guide/http_smart_server.txt

doc/ja/user-guide/images

doc/ja/user-guide/images/workflows_centralized.png

doc/ja/user-guide/images/workflows_centralized.svg

doc/ja/user-guide/images/workflows_gatekeeper.png

doc/ja/user-guide/images/workflows_gatekeeper.svg

doc/ja/user-guide/images/workflows_localcommit.png

doc/ja/user-guide/images/workflows_localcommit.svg

doc/ja/user-guide/images/workflows_peer.png

doc/ja/user-guide/images/workflows_peer.svg

doc/ja/user-guide/images/workflows_pqm.png

doc/ja/user-guide/images/workflows_pqm.svg

doc/ja/user-guide/images/workflows_shared.png

doc/ja/user-guide/images/workflows_shared.svg

doc/ja/user-guide/images/workflows_single.png

doc/ja/user-guide/images/workflows_single.svg

doc/ja/user-guide/index.txt

doc/ja/user-guide/installing_bazaar.txt

doc/ja/user-guide/introducing_bazaar.txt

doc/ja/user-guide/merging_changes.txt

doc/ja/user-guide/organizing_branches.txt

doc/ja/user-guide/organizing_your_workspace.txt

doc/ja/user-guide/part2_intro.txt

doc/ja/user-guide/partner_intro.txt

doc/ja/user-guide/plugins.txt

doc/ja/user-guide/publishing_a_branch.txt

doc/ja/user-guide/recording_changes.txt

doc/ja/user-guide/releasing_a_project.txt

doc/ja/user-guide/resolving_conflicts.txt

doc/ja/user-guide/reusing_a_checkout.txt

doc/ja/user-guide/reviewing_changes.txt

doc/ja/user-guide/sending_changes.txt

doc/ja/user-guide/server.txt

doc/ja/user-guide/setting_up_email.txt

doc/ja/user-guide/shared_repository_layouts.txt

doc/ja/user-guide/shelving_changes.txt

doc/ja/user-guide/solo_intro.txt

doc/ja/user-guide/specifying_revisions.txt

doc/ja/user-guide/stacked.txt

doc/ja/user-guide/starting_a_project.txt

doc/ja/user-guide/svn_plugin.txt

doc/ja/user-guide/undoing_mistakes.txt

doc/ja/user-guide/using_aliases.txt

doc/ja/user-guide/using_checkouts.txt

doc/ja/user-guide/using_gatekeepers.txt

doc/ja/user-guide/version_info.txt

doc/ja/user-guide/web_browsing.txt

doc/ja/user-guide/working_offline_central.txt

doc/ja/user-guide/writing_a_plugin.txt

doc/ja/user-guide/zen.txt

doc/ja/user-reference

doc/ja/user-reference/index.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

tools/generate_release_notes.py

tools/package_docs.py

tools/time_graph.py

tools/win32/bootstrap.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

files removed:
bzrlib/tests/test_http_implementations.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/tests/test_bencode.py

doc/bazaar-vcs.org.kid

doc/developers/performance-contributing.txt

doc/en/developer-guide

doc/en/user-guide/index.txt

doc/es/guia-desarrollador

doc/es/notas-version

doc/es/referencia

files renamed:
bzrlib/_btree_serializer_c.pyx => bzrlib/_btree_serializer_pyx.pyx

bzrlib/_dirstate_helpers_c.h => bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_c.pyx => bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_knit_load_data_c.pyx => bzrlib/_knit_load_data_pyx.pyx

tools/doc_generate/ => bzrlib/doc_generate/

bzrlib/tests/branch_implementations/ => bzrlib/tests/per_branch/

bzrlib/tests/bzrdir_implementations/ => bzrlib/tests/per_bzrdir/

bzrlib/tests/interrepository_implementations/ => bzrlib/tests/per_interrepository/

bzrlib/tests/intertree_implementations/ => bzrlib/tests/per_intertree/

bzrlib/tests/inventory_implementations/ => bzrlib/tests/per_inventory/

bzrlib/tests/test_pack_repository.py => bzrlib/tests/per_pack_repository.py

bzrlib/tests/test_transport_implementations.py => bzrlib/tests/per_transport.py

bzrlib/tests/tree_implementations/ => bzrlib/tests/per_tree/

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py => bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/test_versionedfile.py => bzrlib/tests/per_versionedfile.py

bzrlib/tests/workingtree_implementations/ => bzrlib/tests/per_workingtree/

bzrlib/util/bencode.py => bzrlib/util/_bencode_py.py

doc/en/quick-reference/Makefile => doc/en/_static/en/Makefile

doc/en/quick-reference/quick-start-summary.pdf => doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/quick-reference/quick-start-summary.png => doc/en/_static/en/bzr-en-quick-reference.png

doc/en/quick-reference/quick-start-summary.svg => doc/en/_static/en/bzr-en-quick-reference.svg

doc/es/referencia-rapida/Makefile => doc/es/_static/es/Makefile

doc/es/referencia-rapida/referencia-rapida.svg => doc/es/_static/es/bzr-es-quick-reference.svg

doc/index.es.txt => doc/es/index.txt

doc/es/referencia-rapida/ => doc/es/quick-reference/

doc/es/guia-usuario/ => doc/es/user-guide/

generate_docs.py => tools/generate_docs.py

files modified:
.bzrignore

Makefile

NEWS

README

bzrlib/__init__.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/annotate.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_knit.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/counted_lock.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/errors.py

bzrlib/export/dir_exporter.py

bzrlib/fetch.py

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/merge.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/remote.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_index.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_xml.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/version.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/developers/HACKING.txt

doc/developers/cycle.txt

doc/developers/dirstate.txt

doc/developers/index.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/overview.txt

doc/developers/performance-roadmap.txt

doc/developers/planned-change-integration.txt

doc/developers/plugin-api.txt

doc/developers/releasing.txt

doc/developers/testing.txt

doc/en/mini-tutorial/index.txt

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/es/mini-tutorial/index.txt

doc/es/user-guide/index.txt

doc/index.txt

setup.py

tools/win32/build_release.py

tools/win32/bzr.iss.cog

tools/win32/ostools.py

Show diffs side-by-side

added added

removed removed

bzrlib/repository.py

gpg,

graph,

inventory,

inventory_delta,

lazy_regex,

lockable_files,

lockdir,

entry_factory,

)

from bzrlib import registry

from bzrlib.symbol_versioning import (

deprecated_method,

)

from bzrlib.trace import (

log_exception_quietly, note, mutter, mutter_callsite, warning)

467

465

if content_summary[2] is None:

468

466

raise ValueError("Files must not have executable = None")

469

467

if not store:

470

if (# if the file length changed we have to store:

471

parent_entry.text_size != content_summary[1] or

472

# if the exec bit has changed we have to store:

468

# We can't trust a check of the file length because of content

469

# filtering...

470

if (# if the exec bit has changed we have to store:

473

471

parent_entry.executable != content_summary[2]):

474

472

store = True

475

473

elif parent_entry.text_sha1 == content_summary[3]:

494

492

ie.executable = content_summary[2]

495

493

file_obj, stat_value = tree.get_file_with_stat(ie.file_id, path)

496

494

try:

497

lines = file_obj.readlines()

495

text = file_obj.read()

498

496

finally:

499

497

file_obj.close()

500

498

try:

501

499

ie.text_sha1, ie.text_size = self._add_text_to_weave(

502

ie.file_id, lines, heads, nostore_sha)

500

ie.file_id, text, heads, nostore_sha)

503

501

# Let the caller know we generated a stat fingerprint.

504

502

fingerprint = (ie.text_sha1, stat_value)

505

503

except errors.ExistingContent:

517

515

# carry over:

518

516

ie.revision = parent_entry.revision

519

517

return self._get_delta(ie, basis_inv, path), False, None

520

lines = []

521

self._add_text_to_weave(ie.file_id, lines, heads, None)

518

self._add_text_to_weave(ie.file_id, '', heads, None)

522

519

elif kind == 'symlink':

523

520

current_link_target = content_summary[3]

524

521

if not store:

532

529

ie.symlink_target = parent_entry.symlink_target

533

530

return self._get_delta(ie, basis_inv, path), False, None

534

531

ie.symlink_target = current_link_target

535

lines = []

536

self._add_text_to_weave(ie.file_id, lines, heads, None)

532

self._add_text_to_weave(ie.file_id, '', heads, None)

537

533

elif kind == 'tree-reference':

538

534

if not store:

539

535

if content_summary[3] != parent_entry.reference_revision:

544

540

ie.revision = parent_entry.revision

545

541

return self._get_delta(ie, basis_inv, path), False, None

546

542

ie.reference_revision = content_summary[3]

547

lines = []

548

self._add_text_to_weave(ie.file_id, lines, heads, None)

543

if ie.reference_revision is None:

544

raise AssertionError("invalid content_summary for nested tree: %r"

545

% (content_summary,))

546

self._add_text_to_weave(ie.file_id, '', heads, None)

549

547

else:

550

548

raise NotImplementedError('unknown kind')

551

549

ie.revision = self._new_revision_id

745

743

entry.executable = True

746

744

else:

747

745

entry.executable = False

748

if (carry_over_possible and

746

if (carry_over_possible and

749

747

parent_entry.executable == entry.executable):

750

748

# Check the file length, content hash after reading

751

749

# the file.

754

752

nostore_sha = None

755

753

file_obj, stat_value = tree.get_file_with_stat(file_id, change[1][1])

756

754

try:

757

lines = file_obj.readlines()

755

text = file_obj.read()

758

756

finally:

759

757

file_obj.close()

760

758

try:

761

759

entry.text_sha1, entry.text_size = self._add_text_to_weave(

762

file_id, lines, heads, nostore_sha)

760

file_id, text, heads, nostore_sha)

763

761

yield file_id, change[1][1], (entry.text_sha1, stat_value)

764

762

except errors.ExistingContent:

765

763

# No content change against a carry_over parent

774

772

parent_entry.symlink_target == entry.symlink_target):

775

773

carried_over = True

776

774

else:

777

self._add_text_to_weave(change[0], [], heads, None)

775

self._add_text_to_weave(change[0], '', heads, None)

778

776

elif kind == 'directory':

779

777

if carry_over_possible:

780

778

carried_over = True

782

780

# Nothing to set on the entry.

783

781

# XXX: split into the Root and nonRoot versions.

784

782

if change[1][1] != '' or self.repository.supports_rich_root():

785

self._add_text_to_weave(change[0], [], heads, None)

783

self._add_text_to_weave(change[0], '', heads, None)

786

784

elif kind == 'tree-reference':

787

785

if not self.repository._format.supports_tree_reference:

788

786

# This isn't quite sane as an error, but we shouldn't

791

789

# references.

792

790

raise errors.UnsupportedOperation(tree.add_reference,

793

791

self.repository)

794

entry.reference_revision = \

795

tree.get_reference_revision(change[0])

792

reference_revision = tree.get_reference_revision(change[0])

793

entry.reference_revision = reference_revision

796

794

if (carry_over_possible and

797

795

parent_entry.reference_revision == reference_revision):

798

796

carried_over = True

799

797

else:

800

self._add_text_to_weave(change[0], [], heads, None)

798

self._add_text_to_weave(change[0], '', heads, None)

801

799

else:

802

800

raise AssertionError('unknown kind %r' % kind)

803

801

if not carried_over:

812

810

seen_root = True

813

811

self.new_inventory = None

814

812

if len(inv_delta):

813

# This should perhaps be guarded by a check that the basis we

814

# commit against is the basis for the commit and if not do a delta

815

# against the basis.

815

816

self._any_changes = True

816

817

if not seen_root:

817

818

# housekeeping root entry changes do not affect no-change commits.

818

819

self._require_root_change(tree)

819

820

self.basis_delta_revision = basis_revision_id

820

821

def _add_text_to_weave(self, file_id, new_lines, parents, nostore_sha):

822

# Note: as we read the content directly from the tree, we know its not

823

# been turned into unicode or badly split - but a broken tree

824

# implementation could give us bad output from readlines() so this is

825

# not a guarantee of safety. What would be better is always checking

826

# the content during test suite execution. RBC 20070912

827

parent_keys = tuple((file_id, parent) for parent in parents)

828

return self.repository.texts.add_lines(

829

(file_id, self._new_revision_id), parent_keys, new_lines,

830

nostore_sha=nostore_sha, random_id=self.random_revid,

831

check_content=False)[0:2]

822

def _add_text_to_weave(self, file_id, new_text, parents, nostore_sha):

823

parent_keys = tuple([(file_id, parent) for parent in parents])

824

return self.repository.texts._add_text(

825

(file_id, self._new_revision_id), parent_keys, new_text,

826

nostore_sha=nostore_sha, random_id=self.random_revid)[0:2]

832

827

833

828

834

829

class RootCommitBuilder(CommitBuilder):

860

855

######################################################################

861

856

# Repositories

862

857

858

863

859

class Repository(object):

864

860

"""Repository holding history for one or more branches.

865

861

935

931

"""

936

932

if self._write_group is not self.get_transaction():

937

933

# has an unlock or relock occurred ?

934

if suppress_errors:

935

mutter(

936

'(suppressed) mismatched lock context and write group. %r, %r',

937

self._write_group, self.get_transaction())

938

return

938

939

raise errors.BzrError(

939

940

'mismatched lock context and write group. %r, %r' %

940

941

(self._write_group, self.get_transaction()))

969

970

"""

970

971

if not self._format.supports_external_lookups:

971

972

raise errors.UnstackableRepositoryFormat(self._format, self.base)

973

if self.is_locked():

974

# This repository will call fallback.unlock() when we transition to

975

# the unlocked state, so we make sure to increment the lock count

976

repository.lock_read()

972

977

self._check_fallback_repository(repository)

973

978

self._fallback_repositories.append(repository)

974

979

self.texts.add_fallback_versioned_files(repository.texts)

1023

1028

parents, basis_inv=None, propagate_caches=False):

1024

1029

"""Add a new inventory expressed as a delta against another revision.

1025

1030

1031

See the inventory developers documentation for the theory behind

1032

inventory deltas.

1033

1026

1034

:param basis_revision_id: The inventory id the delta was created

1027

1035

against. (This does not have to be a direct parent.)

1028

1036

:param delta: The inventory delta (see Inventory.apply_delta for

1067

1075

check_content=True):

1068

1076

"""Store lines in inv_vf and return the sha1 of the inventory."""

1069

1077

parents = [(parent,) for parent in parents]

1070

return self.inventories.add_lines((revision_id,), parents, lines,

1078

result = self.inventories.add_lines((revision_id,), parents, lines,

1071

1079

check_content=check_content)[0]

1080

self.inventories._access.flush()

1081

return result

1072

1082

1073

1083

def add_revision(self, revision_id, rev, inv=None, config=None):

1074

1084

"""Add rev to the revision store as revision_id.

1150

1160

# The old API returned a list, should this actually be a set?

1151

1161

return parent_map.keys()

1152

1162

1163

def _check_inventories(self, checker):
    """Check the inventories found from the revision scan.

    Runs the inventory checks under a nested progress bar, which is always
    finished again, even when a check raises.

    :param checker: The check object that is handed on to
        _do_check_inventories.
    """
    progress = ui.ui_factory.nested_progress_bar()
    try:
        self._do_check_inventories(checker, progress)
    finally:
        # Always release the progress bar, whatever the checks did.
        progress.finished()

1174

1175

def _do_check_inventories(self, checker, bar):

1176

"""Helper for _check_inventories."""

1177

revno = 0

1178

keys = {'chk_bytes':set(), 'inventories':set(), 'texts':set()}

1179

kinds = ['chk_bytes', 'texts']

1180

count = len(checker.pending_keys)

1181

bar.update("inventories", 0, 2)

1182

current_keys = checker.pending_keys

1183

checker.pending_keys = {}

1184

# Accumulate current checks.

1185

for key in current_keys:

1186

if key[0] != 'inventories' and key[0] not in kinds:

1187

checker._report_items.append('unknown key type %r' % (key,))

1188

keys[key[0]].add(key[1:])

1189

if keys['inventories']:

1190

# NB: output order *should* be roughly sorted - topo or

1191

# inverse topo depending on repository - either way decent

1192

# to just delta against. However, pre-CHK formats didn't

1193

# try to optimise inventory layout on disk. As such the

1194

# pre-CHK code path does not use inventory deltas.

1195

last_object = None

1196

for record in self.inventories.check(keys=keys['inventories']):

1197

if record.storage_kind == 'absent':

1198

checker._report_items.append(

1199

'Missing inventory {%s}' % (record.key,))

1200

else:

1201

last_object = self._check_record('inventories', record,

1202

checker, last_object,

1203

current_keys[('inventories',) + record.key])

1204

del keys['inventories']

1205

else:

1206

return

1207

bar.update("texts", 1)

1208

while (checker.pending_keys or keys['chk_bytes']

1209

or keys['texts']):

1210

# Something to check.

1211

current_keys = checker.pending_keys

1212

checker.pending_keys = {}

1213

# Accumulate current checks.

1214

for key in current_keys:

1215

if key[0] not in kinds:

1216

checker._report_items.append('unknown key type %r' % (key,))

1217

keys[key[0]].add(key[1:])

1218

# Check the outermost kind only - inventories || chk_bytes || texts

1219

for kind in kinds:

1220

if keys[kind]:

1221

last_object = None

1222

for record in getattr(self, kind).check(keys=keys[kind]):

1223

if record.storage_kind == 'absent':

1224

checker._report_items.append(

1225

'Missing %s {%s}' % (kind, record.key,))

1226

else:

1227

last_object = self._check_record(kind, record,

1228

checker, last_object, current_keys[(kind,) + record.key])

1229

keys[kind] = set()

1230

break

1231

1232

def _check_record(self, kind, record, checker, last_object, item_data):

1233

"""Check a single text from this repository."""

1234

if kind == 'inventories':

1235

rev_id = record.key[0]

1236

inv = self.deserialise_inventory(rev_id,

1237

record.get_bytes_as('fulltext'))

1238

if last_object is not None:

1239

delta = inv._make_delta(last_object)

1240

for old_path, path, file_id, ie in delta:

1241

if ie is None:

1242

continue

1243

ie.check(checker, rev_id, inv)

1244

else:

1245

for path, ie in inv.iter_entries():

1246

ie.check(checker, rev_id, inv)

1247

if self._format.fast_deltas:

1248

return inv

1249

elif kind == 'chk_bytes':

1250

# No code written to check chk_bytes for this repo format.

1251

checker._report_items.append(

1252

'unsupported key type chk_bytes for %s' % (record.key,))

1253

elif kind == 'texts':

1254

self._check_text(record, checker, item_data)

1255

else:

1256

checker._report_items.append(

1257

'unknown key type %s for %s' % (kind, record.key))

1258

1259

def _check_text(self, record, checker, item_data):
    """Check that a single text is extractable and has the expected sha1.

    :param record: The text record; its content is read either as chunks
        (when its storage kind is 'chunked') or as a fulltext.
    :param checker: The check object; a sha1 mismatch is appended to its
        _report_items list.
    :param item_data: If true, a sequence whose item 1 is the expected sha1
        and whose item 2 names what referenced the text (as used in the
        mismatch message). If false, no comparison is made.
    """
    # Check it is extractable.
    # TODO: check length.
    if record.storage_kind != 'chunked':
        fulltext = record.get_bytes_as('fulltext')
        sha1 = osutils.sha_string(fulltext)
        length = len(fulltext)
    else:
        chunks = record.get_bytes_as(record.storage_kind)
        sha1 = osutils.sha_strings(chunks)
        length = sum(len(chunk) for chunk in chunks)
    if not item_data or sha1 == item_data[1]:
        return
    checker._report_items.append(
        'sha1 mismatch: %s has sha1 %s expected %s referenced by %s' %
        (record.key, sha1, item_data[1], item_data[2]))

1275

1153

1276

@staticmethod

1154

1277

def create(a_bzrdir):

1155

1278

"""Construct the current default format repository in a_bzrdir."""

1188

1311

self._inventory_entry_cache = fifo_cache.FIFOCache(10*1024)

1189

1312

1190

1313

def __repr__(self):

1191

return '%s(%r)' % (self.__class__.__name__,

1192

self.base)

1314

if self._fallback_repositories:

1315

return '%s(%r, fallback_repositories=%r)' % (

1316

self.__class__.__name__,

1317

self.base,

1318

self._fallback_repositories)

1319

else:

1320

return '%s(%r)' % (self.__class__.__name__,

1321

self.base)

1322

1323

def _has_same_fallbacks(self, other_repo):

1324

"""Returns true if the repositories have the same fallbacks."""

1325

my_fb = self._fallback_repositories

1326

other_fb = other_repo._fallback_repositories

1327

if len(my_fb) != len(other_fb):

1328

return False

1329

for f, g in zip(my_fb, other_fb):

1330

if not f.has_same_location(g):

1331

return False

1332

return True

1193

1333

1194

1334

def has_same_location(self, other):

1195

1335

"""Returns a boolean indicating if this repository is at the same

1240

1380

"""

1241

1381

locked = self.is_locked()

1242

1382

result = self.control_files.lock_write(token=token)

1243

for repo in self._fallback_repositories:

1244

# Writes don't affect fallback repos

1245

repo.lock_read()

1246

1383

if not locked:

1384

for repo in self._fallback_repositories:

1385

# Writes don't affect fallback repos

1386

repo.lock_read()

1247

1387

self._refresh_data()

1248

1388

return result

1249

1389

1250

1390

def lock_read(self):

1251

1391

locked = self.is_locked()

1252

1392

self.control_files.lock_read()

1253

for repo in self._fallback_repositories:

1254

repo.lock_read()

1255

1393

if not locked:

1394

for repo in self._fallback_repositories:

1395

repo.lock_read()

1256

1396

self._refresh_data()

1257

1397

1258

1398

def get_physical_lock_status(self):

1403

1543

"""Commit the contents accrued within the current write group.

1404

1544

1405

1545

:seealso: start_write_group.

1546

1547

:return: it may return an opaque hint that can be passed to 'pack'.

1406

1548

"""

1407

1549

if self._write_group is not self.get_transaction():

1408

1550

# has an unlock or relock occurred ?

1409

1551

raise errors.BzrError('mismatched lock context %r and '

1410

1552

'write group %r.' %

1411

1553

(self.get_transaction(), self._write_group))

1412

self._commit_write_group()

1554

result = self._commit_write_group()

1413

1555

self._write_group = None

1556

return result

1414

1557

1415

1558

def _commit_write_group(self):

1416

1559

"""Template method for per-repository write group cleanup.

1424

1567

def suspend_write_group(self):

1425

1568

raise errors.UnsuspendableWriteGroup(self)

1426

1569

1570

def get_missing_parent_inventories(self, check_for_missing_texts=True):
    """Return the keys of missing inventory parents for revisions added in
    this write group.

    A revision is not complete if the inventory delta for that revision
    cannot be calculated.  Therefore if the parent inventories of a
    revision are not present, the revision is incomplete, and e.g. cannot
    be streamed by a smart server.  This method finds missing inventory
    parents for revisions added in this write group.

    :param check_for_missing_texts: If True (the default), missing parent
        inventories are only reported when some text referenced by the
        revisions that refer to them is missing as well.
    :return: A set of ('inventories', revision_id) keys; empty when the
        format does not support external lookups or nothing is missing.
    :raises AssertionError: If the repository is not in a write group.
    """
    if not self._format.supports_external_lookups:
        # This is only an issue for stacked repositories
        return set()
    if not self.is_in_write_group():
        raise AssertionError('not in a write group')

    # XXX: We assume that every added revision already has its
    # corresponding inventory, so we only check for parent inventories that
    # might be missing, rather than all inventories.
    missing_parents = set(self.revisions._index.get_missing_parents())
    missing_parents.discard(_mod_revision.NULL_REVISION)
    inventory_index = self.inventories._index
    present_inventories = inventory_index.get_parent_map(
        key[-1:] for key in missing_parents)
    missing_parents.difference_update(present_inventories)
    if not missing_parents:
        # No missing parent inventories.
        return set()
    if check_for_missing_texts:
        # Ok, now we have a list of missing inventories.  But these only
        # matter if the inventories that reference them are missing some
        # texts they appear to introduce.
        # XXX: Texts referenced by all added inventories need to be
        # present, but at the moment we're only checking for texts
        # referenced by inventories at the graph's edge.
        key_deps = self.revisions._index._key_dependencies
        key_deps.satisfy_refs_for_keys(present_inventories)
        referrers = frozenset(r[0] for r in key_deps.get_referrers())
        file_ids = self.fileids_altered_by_revision_ids(referrers)
        candidate_texts = set()
        for file_id, version_ids in file_ids.iteritems():
            for version_id in version_ids:
                candidate_texts.add((file_id, version_id))
        present_texts = self.texts.get_parent_map(candidate_texts)
        candidate_texts.difference_update(present_texts)
        if not candidate_texts:
            # No texts are missing, so all revisions and their deltas are
            # reconstructable.
            return set()
    # Alternatively the text versions could be returned as the missing
    # keys, but this is likely to be less data.
    return set(('inventories', rev_id) for (rev_id,) in missing_parents)

1624

1427

1625

def refresh_data(self):

1428

1626

"""Re-read any data needed to synchronise with disk.

1429

1627

1478

1676

raise errors.InternalBzrError(

1479

1677

"May not fetch while in a write group.")

1480

1678

# fast path same-url fetch operations

1481

if self.has_same_location(source) and fetch_spec is None:

1679

# TODO: lift out to somewhere common with RemoteRepository

1680

# <https://bugs.edge.launchpad.net/bzr/+bug/401646>

1681

if (self.has_same_location(source)

1682

and fetch_spec is None

1683

and self._has_same_fallbacks(source)):

1482

1684

# check that last_revision is in 'from' and then return a

1483

1685

# no-operation.

1484

1686

if (revision_id is not None and

1509

1711

:param revprops: Optional dictionary of revision properties.

1510

1712

:param revision_id: Optional revision id.

1511

1713

"""

1714

if self._fallback_repositories:

1715

raise errors.BzrError("Cannot commit from a lightweight checkout "

1716

"to a stacked branch. See "

1717

"https://bugs.launchpad.net/bzr/+bug/375013 for details.")

1512

1718

result = self._commit_builder_class(self, parents, config,

1513

1719

timestamp, timezone, committer, revprops, revision_id)

1514

1720

self.start_write_group()

1525

1731

self.control_files.unlock()

1526

1732

if self.control_files._lock_count == 0:

1527

1733

self._inventory_entry_cache.clear()

1528

for repo in self._fallback_repositories:

1529

repo.unlock()

1734

for repo in self._fallback_repositories:

1735

repo.unlock()

1530

1736

1531

1737

@needs_read_lock

1532

1738

def clone(self, a_bzrdir, revision_id=None):

1641

1847

1642

1848

@needs_read_lock

1643

1849

def get_revisions(self, revision_ids):

1644

"""Get many revisions at once."""

1850

"""Get many revisions at once.

1851

1852

Repositories that need to check data on every revision read should

1853

subclass this method.

1854

"""

1645

1855

return self._get_revisions(revision_ids)

1646

1856

1647

1857

@needs_read_lock

1648

1858

def _get_revisions(self, revision_ids):

1649

1859

"""Core work logic to get many revisions without sanity checks."""

1650

for rev_id in revision_ids:

1651

if not rev_id or not isinstance(rev_id, basestring):

1652

raise errors.InvalidRevisionId(revision_id=rev_id, branch=self)

1860

revs = {}

1861

for revid, rev in self._iter_revisions(revision_ids):

1862

if rev is None:

1863

raise errors.NoSuchRevision(self, revid)

1864

revs[revid] = rev

1865

return [revs[revid] for revid in revision_ids]

1866

1867

def _iter_revisions(self, revision_ids):

1868

"""Iterate over revision objects.

1869

1870

:param revision_ids: An iterable of revisions to examine. None may be

1871

passed to request all revisions known to the repository. Note that

1872

not all repositories can find unreferenced revisions; for those

1873

repositories only referenced ones will be returned.

1874

:return: An iterator of (revid, revision) tuples. Absent revisions (

1875

those asked for but not available) are returned as (revid, None).

1876

"""

1877

if revision_ids is None:

1878

revision_ids = self.all_revision_ids()

1879

else:

1880

for rev_id in revision_ids:

1881

if not rev_id or not isinstance(rev_id, basestring):

1882

raise errors.InvalidRevisionId(revision_id=rev_id, branch=self)

1653

1883

keys = [(key,) for key in revision_ids]

1654

1884

stream = self.revisions.get_record_stream(keys, 'unordered', True)

1655

revs = {}

1656

1885

for record in stream:

1886

revid = record.key[0]

1657

1887

if record.storage_kind == 'absent':

1658

raise errors.NoSuchRevision(self, record.key[0])

1659

text = record.get_bytes_as('fulltext')

1660

rev = self._serializer.read_revision_from_string(text)

1661

revs[record.key[0]] = rev

1662

return [revs[revid] for revid in revision_ids]

1888

yield (revid, None)

1889

else:

1890

text = record.get_bytes_as('fulltext')

1891

rev = self._serializer.read_revision_from_string(text)

1892

yield (revid, rev)

1663

1893

1664

1894

@needs_read_lock

1665

1895

def get_revision_xml(self, revision_id):

1860

2090

yield line, revid

1861

2091

1862

2092

def _find_file_ids_from_xml_inventory_lines(self, line_iterator,

1863

revision_ids):

2093

revision_keys):

1864

2094

"""Helper routine for fileids_altered_by_revision_ids.

1865

2095

1866

2096

This performs the translation of xml lines to revision ids.

1867

2097

1868

2098

:param line_iterator: An iterator of lines, origin_version_id

1869

:param revision_ids: The revision ids to filter for. This should be a

2099

:param revision_keys: The revision ids to filter for. This should be a

1870

2100

set or other type which supports efficient __contains__ lookups, as

1871

the revision id from each parsed line will be looked up in the

1872

revision_ids filter.

2101

the revision key from each parsed line will be looked up in the

2102

revision_keys filter.

1873

2103

:return: a dictionary mapping altered file-ids to an iterable of

1874

2104

revision_ids. Each altered file-ids has the exact revision_ids that

1875

2105

altered it listed explicitly.

1876

2106

"""

1877

2107

seen = set(self._find_text_key_references_from_xml_inventory_lines(

1878

2108

line_iterator).iterkeys())

1879

# Note that revision_ids are revision keys.

1880

parent_maps = self.revisions.get_parent_map(revision_ids)

1881

parents = set()

1882

map(parents.update, parent_maps.itervalues())

1883

parents.difference_update(revision_ids)

2109

parent_keys = self._find_parent_keys_of_revisions(revision_keys)

1884

2110

parent_seen = set(self._find_text_key_references_from_xml_inventory_lines(

1885

self._inventory_xml_lines_for_keys(parents)))

2111

self._inventory_xml_lines_for_keys(parent_keys)))

1886

2112

new_keys = seen - parent_seen

1887

2113

result = {}

1888

2114

setdefault = result.setdefault

1890

2116

setdefault(key[0], set()).add(key[-1])

1891

2117

return result

1892

2118

2119

def _find_parent_ids_of_revisions(self, revision_ids):
    """Find all parent ids that are mentioned in the revision graph.

    :param revision_ids: The revision ids whose parents are wanted.
    :return: set of revisions that are parents of revision_ids which are
        not part of revision_ids themselves; NULL_REVISION is left out.
    """
    found = set()
    for parents in self.get_parent_map(revision_ids).itervalues():
        found.update(parents)
    # Only report parents that lie outside the requested revisions.
    found.difference_update(revision_ids)
    found.discard(_mod_revision.NULL_REVISION)
    return found

2131

2132

def _find_parent_keys_of_revisions(self, revision_keys):
    """Similar to _find_parent_ids_of_revisions, but used with keys.

    The parents are looked up through self.revisions rather than through
    the repository's own get_parent_map.

    :param revision_keys: An iterable of revision_keys.
    :return: The parents of all revision_keys that are not already in
        revision_keys
    """
    found = set()
    for parents in self.revisions.get_parent_map(revision_keys).itervalues():
        found.update(parents)
    # Only report parents that lie outside the requested keys.
    found.difference_update(revision_keys)
    found.discard(_mod_revision.NULL_REVISION)
    return found

2145

1893

2146

def fileids_altered_by_revision_ids(self, revision_ids, _inv_weave=None):

1894

2147

"""Find the file ids and versions affected by revisions.

1895

2148

1997

2250

batch_size]

1998

2251

if not to_query:

1999

2252

break

2000

for rev_tree in self.revision_trees(to_query):

2001

revision_id = rev_tree.get_revision_id()

2253

for revision_id in to_query:

2002

2254

parent_ids = ancestors[revision_id]

2003

2255

for text_key in revision_keys[revision_id]:

2004

2256

pb.update("Calculating text parents", processed_texts)

2104

2356

"""Get Inventory object by revision id."""

2105

2357

return self.iter_inventories([revision_id]).next()

2106

2358

2107

def iter_inventories(self, revision_ids):

2359

def iter_inventories(self, revision_ids, ordering=None):

2108

2360

"""Get many inventories by revision_ids.

2109

2361

2110

2362

This will buffer some or all of the texts used in constructing the

2112

2364

time.

2113

2365

2114

2366

:param revision_ids: The expected revision ids of the inventories.

2367

:param ordering: optional ordering, e.g. 'topological'. If not

2368

specified, the order of revision_ids will be preserved (by

2369

buffering if necessary).

2115

2370

:return: An iterator of inventories.

2116

2371

"""

2117

2372

if ((None in revision_ids)

2118

2373

or (_mod_revision.NULL_REVISION in revision_ids)):

2119

2374

raise ValueError('cannot get null revision inventory')

2120

return self._iter_inventories(revision_ids)

2375

return self._iter_inventories(revision_ids, ordering)

2121

2376

2122

def _iter_inventories(self, revision_ids):

2377

def _iter_inventories(self, revision_ids, ordering):

2123

2378

"""single-document based inventory iteration."""

2124

for text, revision_id in self._iter_inventory_xmls(revision_ids):

2379

inv_xmls = self._iter_inventory_xmls(revision_ids, ordering)

2380

for text, revision_id in inv_xmls:

2125

2381

yield self.deserialise_inventory(revision_id, text)

2126

2382

2127

def _iter_inventory_xmls(self, revision_ids):

2383

def _iter_inventory_xmls(self, revision_ids, ordering):

2384

if ordering is None:

2385

order_as_requested = True

2386

ordering = 'unordered'

2387

else:

2388

order_as_requested = False

2128

2389

keys = [(revision_id,) for revision_id in revision_ids]

2129

stream = self.inventories.get_record_stream(keys, 'unordered', True)

2390

if not keys:

2391

return

2392

if order_as_requested:

2393

key_iter = iter(keys)

2394

next_key = key_iter.next()

2395

stream = self.inventories.get_record_stream(keys, ordering, True)

2130

2396

text_chunks = {}

2131

2397

for record in stream:

2132

2398

if record.storage_kind != 'absent':

2133

text_chunks[record.key] = record.get_bytes_as('chunked')

2399

chunks = record.get_bytes_as('chunked')

2400

if order_as_requested:

2401

text_chunks[record.key] = chunks

2402

else:

2403

yield ''.join(chunks), record.key[-1]

2134

2404

else:

2135

2405

raise errors.NoSuchRevision(self, record.key)

2136

for key in keys:

2137

chunks = text_chunks.pop(key)

2138

yield ''.join(chunks), key[-1]

2406

if order_as_requested:

2407

# Yield as many results as we can while preserving order.

2408

while next_key in text_chunks:

2409

chunks = text_chunks.pop(next_key)

2410

yield ''.join(chunks), next_key[-1]

2411

try:

2412

next_key = key_iter.next()

2413

except StopIteration:

2414

# We still want to fully consume the get_record_stream,

2415

# just in case it is not actually finished at this point

2416

next_key = None

2417

break

2139

2418

2140

2419

def deserialise_inventory(self, revision_id, xml):

2141

2420

"""Transform the xml into an inventory object.

2162

2441

@needs_read_lock

2163

2442

def get_inventory_xml(self, revision_id):

2164

2443

"""Get inventory XML as a file object."""

2165

texts = self._iter_inventory_xmls([revision_id])

2444

texts = self._iter_inventory_xmls([revision_id], 'unordered')

2166

2445

try:

2167

2446

text, revision_id = texts.next()

2168

2447

except StopIteration:

2175

2454

"""

2176

2455

return self.get_revision(revision_id).inventory_sha1

2177

2456

2457

def get_rev_id_for_revno(self, revno, known_pair):

2458

"""Return the revision id of a revno, given a later (revno, revid)

2459

pair in the same history.

2460

2461

:return: if found (True, revid). If the available history ran out

2462

before reaching the revno, then this returns

2463

(False, (closest_revno, closest_revid)).

2464

"""

2465

known_revno, known_revid = known_pair

2466

partial_history = [known_revid]

2467

distance_from_known = known_revno - revno

2468

if distance_from_known < 0:

2469

raise ValueError(

2470

'requested revno (%d) is later than given known revno (%d)'

2471

% (revno, known_revno))

2472

try:

2473

_iter_for_revno(

2474

self, partial_history, stop_index=distance_from_known)

2475

except errors.RevisionNotPresent, err:

2476

if err.revision_id == known_revid:

2477

# The start revision (known_revid) wasn't found.

2478

raise

2479

# This is a stacked repository with no fallbacks, or a there's a

2480

# left-hand ghost. Either way, even though the revision named in

2481

# the error isn't in this repo, we know it's the next step in this

2482

# left-hand history.

2483

partial_history.append(err.revision_id)

2484

if len(partial_history) <= distance_from_known:

2485

# Didn't find enough history to get a revid for the revno.

2486

earliest_revno = known_revno - len(partial_history) + 1

2487

return (False, (earliest_revno, partial_history[-1]))

2488

if len(partial_history) - 1 > distance_from_known:

2489

raise AssertionError('_iter_for_revno returned too much history')

2490

return (True, partial_history[-1])

2491

2178

2492

def iter_reverse_revision_history(self, revision_id):

2179

2493

"""Iterate backwards through revision ids in the lefthand history

2180

2494

2186

2500

while True:

2187

2501

if next_id in (None, _mod_revision.NULL_REVISION):

2188

2502

return

2503

try:

2504

parents = graph.get_parent_map([next_id])[next_id]

2505

except KeyError:

2506

raise errors.RevisionNotPresent(next_id, self)

2189

2507

yield next_id

2190

# Note: The following line may raise KeyError in the event of

2191

# truncated history. We decided not to have a try:except:raise

2192

# RevisionNotPresent here until we see a use for it, because of the

2193

# cost in an inner loop that is by its very nature O(history).

2194

# Robert Collins 20080326

2195

parents = graph.get_parent_map([next_id])[next_id]

2196

2508

if len(parents) == 0:

2197

2509

return

2198

2510

else:

2312

2624

keys = tsort.topo_sort(parent_map)

2313

2625

return [None] + list(keys)

2314

2626

2315

def pack(self):

2627

def pack(self, hint=None):

2316

2628

"""Compress the data within the repository.

2317

2629

2318

2630

This operation only makes sense for some repository types. For other

2321

2633

This stub method does not require a lock, but subclasses should use

2322

2634

@needs_write_lock as this is a long running call it's reasonable to

2323

2635

implicitly lock for the user.

2636

2637

:param hint: If not supplied, the whole repository is packed.

2638

If supplied, the repository may use the hint parameter as a

2639

hint for the parts of the repository to pack. A hint can be

2640

obtained from the result of commit_write_group(). Out of

2641

date hints are simply ignored, because concurrent operations

2642

can obsolete them rapidly.

2324

2643

"""

2325

2644

2326

2645

def get_transaction(self):

2327

2646

return self.control_files.get_transaction()

2328

2647

2329

2648

def get_parent_map(self, revision_ids):

2330

"""See graph._StackedParentsProvider.get_parent_map"""

2649

"""See graph.StackedParentsProvider.get_parent_map"""

2331

2650

# revisions index works in keys; this just works in revisions

2332

2651

# therefore wrap and unwrap

2333

2652

query_keys = []

2356

2675

parents_provider = self._make_parents_provider()

2357

2676

if (other_repository is not None and

2358

2677

not self.has_same_location(other_repository)):

2359

parents_provider = graph._StackedParentsProvider(

2678

parents_provider = graph.StackedParentsProvider(

2360

2679

[parents_provider, other_repository._make_parents_provider()])

2361

2680

return graph.Graph(parents_provider)

2362

2681

2363

def _get_versioned_file_checker(self, text_key_references=None):

2682

def _get_versioned_file_checker(self, text_key_references=None,

2683

ancestors=None):

2364

2684

"""Return an object suitable for checking versioned files.

2365

2685

2366

2686

:param text_key_references: if non-None, an already built

2368

2688

to whether they were referred to by the inventory of the

2369

2689

revision_id that they contain. If None, this will be

2370

2690

calculated.

2691

:param ancestors: Optional result from

2692

self.get_graph().get_parent_map(self.all_revision_ids()) if already

2693

available.

2371

2694

"""

2372

2695

return _VersionedFileChecker(self,

2373

text_key_references=text_key_references)

2696

text_key_references=text_key_references, ancestors=ancestors)

2374

2697

2375

2698

def revision_ids_to_search_result(self, result_set):

2376

2699

"""Convert a set of revision ids to a graph SearchResult."""

2426

2749

return record.get_bytes_as('fulltext')

2427

2750

2428

2751

@needs_read_lock

2429

def check(self, revision_ids=None):

2752

def check(self, revision_ids=None, callback_refs=None, check_repo=True):

2430

2753

"""Check consistency of all history of given revision_ids.

2431

2754

2432

2755

Different repository implementations should override _check().

2433

2756

2434

2757

:param revision_ids: A non-empty list of revision_ids whose ancestry

2435

2758

will be checked. Typically the last revision_id of a branch.

2759

:param callback_refs: A dict of check-refs to resolve and callback

2760

the check/_check method on the items listed as wanting the ref.

2761

see bzrlib.check.

2762

:param check_repo: If False do not check the repository contents, just

2763

calculate the data callback_refs requires and call them back.

2436

2764

"""

2437

return self._check(revision_ids)

2765

return self._check(revision_ids, callback_refs=callback_refs,

2766

check_repo=check_repo)

2438

2767

2439

def _check(self, revision_ids):

2440

result = check.Check(self)

2441

result.check()

2768

def _check(self, revision_ids, callback_refs, check_repo):

2769

result = check.Check(self, check_repo=check_repo)

2770

result.check(callback_refs)

2442

2771

return result

2443

2772

2444

2773

def _warn_if_deprecated(self):

2729

3058

# Does this format have < O(tree_size) delta generation. Used to hint what

2730

3059

# code path for commit, amongst other things.

2731

3060

fast_deltas = None

3061

# Does doing a pack operation compress data? Useful for the pack UI command

3062

# (so if there is one pack, the operation can still proceed because it may

3063

# help), and for fetching when data won't have come from the same

3064

# compressor.

3065

pack_compresses = False

3066

# Does the repository inventory storage understand references to trees?

3067

supports_tree_reference = None

2732

3068

2733

3069

def __str__(self):

2734

3070

return "<%s>" % self.__class__.__name__

2838

3174

raise NotImplementedError(self.network_name)

2839

3175

2840

3176

def check_conversion_target(self, target_format):

2841

raise NotImplementedError(self.check_conversion_target)

3177

if self.rich_root_data and not target_format.rich_root_data:

3178

raise errors.BadConversionTarget(

3179

'Does not support rich root data.', target_format,

3180

from_format=self)

3181

if (self.supports_tree_reference and

3182

not getattr(target_format, 'supports_tree_reference', False)):

3183

raise errors.BadConversionTarget(

3184

'Does not support nested trees', target_format,

3185

from_format=self)

2842

3186

2843

3187

def open(self, a_bzrdir, _found=False):

2844

3188

"""Return an instance of this format for the bzrdir a_bzrdir.

3003

3347

'RepositoryFormatCHK1',

3004

3348

)

3005

3349

3350

format_registry.register_lazy(

3351

'Bazaar development format - chk repository with bencode revision '

3352

'serialization (needs bzr.dev from 1.16)\n',

3353

'bzrlib.repofmt.groupcompress_repo',

3354

'RepositoryFormatCHK2',

3355

)

3356

format_registry.register_lazy(

3357

'Bazaar repository format 2a (needs bzr 1.16 or later)\n',

3358

'bzrlib.repofmt.groupcompress_repo',

3359

'RepositoryFormat2a',

3360

)

3361

3006

3362

3007

3363

class InterRepository(InterObject):

3008

3364

"""This class represents operations taking place between two repositories.

3064

3420

"""

3065

3421

target_graph = self.target.get_graph()

3066

3422

revision_ids = frozenset(revision_ids)

3067

# Fast path for the case where all the revisions are already in the

3068

# target repo.

3069

# (Although this does incur an extra round trip for the

3070

# fairly common case where the target doesn't already have the revision

3071

# we're pushing.)

3072

if set(target_graph.get_parent_map(revision_ids)) == revision_ids:

3073

return graph.SearchResult(revision_ids, set(), 0, set())

3074

3423

missing_revs = set()

3075

3424

source_graph = self.source.get_graph()

3076

3425

# ensure we don't pay silly lookup costs.

3356

3705

return self.source.revision_ids_to_search_result(result_set)

3357

3706

3358

3707

3359

class InterPackRepo(InterSameDataRepository):

3360

"""Optimised code paths between Pack based repositories."""

3361

3362

@classmethod

3363

def _get_repo_format_to_test(self):

3364

from bzrlib.repofmt import pack_repo

3365

return pack_repo.RepositoryFormatKnitPack6RichRoot()

3366

3367

@staticmethod

3368

def is_compatible(source, target):

3369

"""Be compatible with known Pack formats.

3370

3371

We don't test for the stores being of specific types because that

3372

could lead to confusing results, and there is no need to be

3373

overly general.

3374

3375

InterPackRepo does not support CHK based repositories.

3376

"""

3377

from bzrlib.repofmt.pack_repo import RepositoryFormatPack

3378

from bzrlib.repofmt.groupcompress_repo import RepositoryFormatCHK1

3379

try:

3380

are_packs = (isinstance(source._format, RepositoryFormatPack) and

3381

isinstance(target._format, RepositoryFormatPack))

3382

not_packs = (isinstance(source._format, RepositoryFormatCHK1) or

3383

isinstance(target._format, RepositoryFormatCHK1))

3384

except AttributeError:

3385

return False

3386

if not_packs or not are_packs:

3387

return False

3388

return InterRepository._same_model(source, target)

3389

3390

@needs_write_lock

3391

def fetch(self, revision_id=None, pb=None, find_ghosts=False,

3392

fetch_spec=None):

3393

"""See InterRepository.fetch()."""

3394

if (len(self.source._fallback_repositories) > 0 or

3395

len(self.target._fallback_repositories) > 0):

3396

# The pack layer is not aware of fallback repositories, so when

3397

# fetching from a stacked repository or into a stacked repository

3398

# we use the generic fetch logic which uses the VersionedFiles

3399

# attributes on repository.

3400

from bzrlib.fetch import RepoFetcher

3401

fetcher = RepoFetcher(self.target, self.source, revision_id,

3402

pb, find_ghosts, fetch_spec=fetch_spec)

3403

if fetch_spec is not None:

3404

if len(list(fetch_spec.heads)) != 1:

3405

raise AssertionError(

3406

"InterPackRepo.fetch doesn't support "

3407

"fetching multiple heads yet.")

3408

revision_id = list(fetch_spec.heads)[0]

3409

fetch_spec = None

3410

if revision_id is None:

3411

# TODO:

3412

# everything to do - use pack logic

3413

# to fetch from all packs to one without

3414

# inventory parsing etc, IFF nothing to be copied is in the target.

3415

# till then:

3416

source_revision_ids = frozenset(self.source.all_revision_ids())

3417

revision_ids = source_revision_ids - \

3418

frozenset(self.target.get_parent_map(source_revision_ids))

3419

revision_keys = [(revid,) for revid in revision_ids]

3420

index = self.target._pack_collection.revision_index.combined_index

3421

present_revision_ids = set(item[1][0] for item in

3422

index.iter_entries(revision_keys))

3423

revision_ids = set(revision_ids) - present_revision_ids

3424

# implementing the TODO will involve:

3425

# - detecting when all of a pack is selected

3426

# - avoiding as much as possible pre-selection, so the

3427

# more-core routines such as create_pack_from_packs can filter in

3428

# a just-in-time fashion. (though having a HEADS list on a

3429

# repository might make this a lot easier, because we could

3430

# sensibly detect 'new revisions' without doing a full index scan.

3431

elif _mod_revision.is_null(revision_id):

3432

# nothing to do:

3433

return (0, [])

3434

else:

3435

try:

3436

revision_ids = self.search_missing_revision_ids(revision_id,

3437

find_ghosts=find_ghosts).get_keys()

3438

except errors.NoSuchRevision:

3439

raise errors.InstallFailed([revision_id])

3440

if len(revision_ids) == 0:

3441

return (0, [])

3442

return self._pack(self.source, self.target, revision_ids)

3443

3444

def _pack(self, source, target, revision_ids):

3445

from bzrlib.repofmt.pack_repo import Packer

3446

packs = source._pack_collection.all_packs()

3447

pack = Packer(self.target._pack_collection, packs, '.fetch',

3448

revision_ids).pack()

3449

if pack is not None:

3450

self.target._pack_collection._save_pack_names()

3451

copied_revs = pack.get_revision_count()

3452

# Trigger an autopack. This may duplicate effort as we've just done

3453

# a pack creation, but for now it is simpler to think about as

3454

# 'upload data, then repack if needed'.

3455

self.target._pack_collection.autopack()

3456

return (copied_revs, [])

3457

else:

3458

return (0, [])

3459

3460

@needs_read_lock

3461

def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):

3462

"""See InterRepository.missing_revision_ids().

3463

3464

:param find_ghosts: Find ghosts throughout the ancestry of

3465

revision_id.

3466

"""

3467

if not find_ghosts and revision_id is not None:

3468

return self._walk_to_common_revisions([revision_id])

3469

elif revision_id is not None:

3470

# Find ghosts: search for revisions pointing from one repository to

3471

# the other, and vice versa, anywhere in the history of revision_id.

3472

graph = self.target.get_graph(other_repository=self.source)

3473

searcher = graph._make_breadth_first_searcher([revision_id])

3474

found_ids = set()

3475

while True:

3476

try:

3477

next_revs, ghosts = searcher.next_with_ghosts()

3478

except StopIteration:

3479

break

3480

if revision_id in ghosts:

3481

raise errors.NoSuchRevision(self.source, revision_id)

3482

found_ids.update(next_revs)

3483

found_ids.update(ghosts)

3484

found_ids = frozenset(found_ids)

3485

# Double query here: should be able to avoid this by changing the

3486

# graph api further.

3487

result_set = found_ids - frozenset(

3488

self.target.get_parent_map(found_ids))

3489

else:

3490

source_ids = self.source.all_revision_ids()

3491

# source_ids is the worst possible case we may need to pull.

3492

# now we want to filter source_ids against what we actually

3493

# have in target, but don't try to check for existence where we know

3494

# we do not have a revision as that would be pointless.

3495

target_ids = set(self.target.all_revision_ids())

3496

result_set = set(source_ids).difference(target_ids)

3497

return self.source.revision_ids_to_search_result(result_set)

3498

3499

3500

3708

class InterDifferingSerializer(InterRepository):

3501

3709

3502

3710

@classmethod

3509

3717

# This is redundant with format.check_conversion_target(), however that

3510

3718

# raises an exception, and we just want to say "False" as in we won't

3511

3719

# support converting between these formats.

3720

if 'IDS_never' in debug.debug_flags:

3721

return False

3512

3722

if source.supports_rich_root() and not target.supports_rich_root():

3513

3723

return False

3514

3724

if (source._format.supports_tree_reference

3515

3725

and not target._format.supports_tree_reference):

3516

3726

return False

3727

if target._fallback_repositories and target._format.supports_chks:

3728

# IDS doesn't know how to copy CHKs for the parent inventories it

3729

# adds to stacked repos.

3730

return False

3731

if 'IDS_always' in debug.debug_flags:

3732

return True

3733

# Only use this code path for local source and target. IDS does far

3734

# too much IO (both bandwidth and roundtrips) over a network.

3735

if not source.bzrdir.transport.base.startswith('file:///'):

3736

return False

3737

if not target.bzrdir.transport.base.startswith('file:///'):

3738

return False

3517

3739

return True

3518

3740

3519

def _get_delta_for_revision(self, tree, parent_ids, basis_id, cache):

3741

def _get_trees(self, revision_ids, cache):

3742

possible_trees = []

3743

for rev_id in revision_ids:

3744

if rev_id in cache:

3745

possible_trees.append((rev_id, cache[rev_id]))

3746

else:

3747

# Not cached, but inventory might be present anyway.

3748

try:

3749

tree = self.source.revision_tree(rev_id)

3750

except errors.NoSuchRevision:

3751

# Nope, parent is ghost.

3752

pass

3753

else:

3754

cache[rev_id] = tree

3755

possible_trees.append((rev_id, tree))

3756

return possible_trees

3757

3758

def _get_delta_for_revision(self, tree, parent_ids, possible_trees):

3520

3759

"""Get the best delta and base for this revision.

3521

3760

3522

3761

:return: (basis_id, delta)

3523

3762

"""

3524

possible_trees = [(parent_id, cache[parent_id])

3525

for parent_id in parent_ids

3526

if parent_id in cache]

3527

if len(possible_trees) == 0:

3528

# There either aren't any parents, or the parents aren't in the

3529

# cache, so just use the last converted tree

3530

possible_trees.append((basis_id, cache[basis_id]))

3531

3763

deltas = []

3764

# Generate deltas against each tree, to find the shortest.

3765

texts_possibly_new_in_tree = set()

3532

3766

for basis_id, basis_tree in possible_trees:

3533

3767

delta = tree.inventory._make_delta(basis_tree.inventory)

3768

for old_path, new_path, file_id, new_entry in delta:

3769

if new_path is None:

3770

# This file_id isn't present in the new rev, so we don't

3771

# care about it.

3772

continue

3773

if not new_path:

3774

# Rich roots are handled elsewhere...

3775

continue

3776

kind = new_entry.kind

3777

if kind != 'directory' and kind != 'file':

3778

# No text record associated with this inventory entry.

3779

continue

3780

# This is a directory or file that has changed somehow.

3781

texts_possibly_new_in_tree.add((file_id, new_entry.revision))

3534

3782

deltas.append((len(delta), basis_id, delta))

3535

3783

deltas.sort()

3536

3784

return deltas[0][1:]

3537

3785

3538

def _get_parent_keys(self, root_key, parent_map):

3539

"""Get the parent keys for a given root id."""

3540

root_id, rev_id = root_key

3541

# Include direct parents of the revision, but only if they used

3542

# the same root_id.

3543

parent_keys = []

3544

for parent_id in parent_map[rev_id]:

3545

if parent_id == _mod_revision.NULL_REVISION:

3546

continue

3547

if parent_id not in self._revision_id_to_root_id:

3548

# We probably didn't read this revision, go spend the

3549

# extra effort to actually check

3550

try:

3551

tree = self.source.revision_tree(parent_id)

3552

except errors.NoSuchRevision:

3553

# Ghost, fill out _revision_id_to_root_id in case we

3554

# encounter this again.

3555

# But set parent_root_id to None since we don't really know

3556

parent_root_id = None

3557

else:

3558

parent_root_id = tree.get_root_id()

3559

self._revision_id_to_root_id[parent_id] = None

3560

else:

3561

parent_root_id = self._revision_id_to_root_id[parent_id]

3562

if root_id == parent_root_id or parent_root_id is None:

3563

parent_keys.append((root_id, parent_id))

3564

return tuple(parent_keys)

3786

def _fetch_parent_invs_for_stacking(self, parent_map, cache):

3787

"""Find all parent revisions that are absent, but for which the

3788

inventory is present, and copy those inventories.

3565

3789

3566

def _new_root_data_stream(self, root_keys_to_create, parent_map):

3567

for root_key in root_keys_to_create:

3568

parent_keys = self._get_parent_keys(root_key, parent_map)

3569

yield versionedfile.FulltextContentFactory(root_key,

3570

parent_keys, None, '')

3790

This is necessary to preserve correctness when the source is stacked

3791

without fallbacks configured. (Note that in cases like upgrade the

3792

source may not have _fallback_repositories even though it is

3793

stacked.)

3794

"""

3795

parent_revs = set()

3796

for parents in parent_map.values():

3797

parent_revs.update(parents)

3798

present_parents = self.source.get_parent_map(parent_revs)

3799

absent_parents = set(parent_revs).difference(present_parents)

3800

parent_invs_keys_for_stacking = self.source.inventories.get_parent_map(

3801

(rev_id,) for rev_id in absent_parents)

3802

parent_inv_ids = [key[-1] for key in parent_invs_keys_for_stacking]

3803

for parent_tree in self.source.revision_trees(parent_inv_ids):

3804

current_revision_id = parent_tree.get_revision_id()

3805

parents_parents_keys = parent_invs_keys_for_stacking[

3806

(current_revision_id,)]

3807

parents_parents = [key[-1] for key in parents_parents_keys]

3808

basis_id = _mod_revision.NULL_REVISION

3809

basis_tree = self.source.revision_tree(basis_id)

3810

delta = parent_tree.inventory._make_delta(basis_tree.inventory)

3811

self.target.add_inventory_by_delta(

3812

basis_id, delta, current_revision_id, parents_parents)

3813

cache[current_revision_id] = parent_tree

3571

3814

3572

3815

def _fetch_batch(self, revision_ids, basis_id, cache):

3573

3816

"""Fetch across a few revisions.

3587

3830

pending_deltas = []

3588

3831

pending_revisions = []

3589

3832

parent_map = self.source.get_parent_map(revision_ids)

3833

self._fetch_parent_invs_for_stacking(parent_map, cache)

3590

3834

for tree in self.source.revision_trees(revision_ids):

3835

# Find an inventory delta for this revision.

3836

# Find text entries that need to be copied, too.

3591

3837

current_revision_id = tree.get_revision_id()

3592

3838

parent_ids = parent_map.get(current_revision_id, ())

3839

parent_trees = self._get_trees(parent_ids, cache)

3840

possible_trees = list(parent_trees)

3841

if len(possible_trees) == 0:

3842

# There either aren't any parents, or the parents are ghosts,

3843

# so just use the last converted tree.

3844

possible_trees.append((basis_id, cache[basis_id]))

3593

3845

basis_id, delta = self._get_delta_for_revision(tree, parent_ids,

3594

basis_id, cache)

3846

possible_trees)

3847

revision = self.source.get_revision(current_revision_id)

3848

pending_deltas.append((basis_id, delta,

3849

current_revision_id, revision.parent_ids))

3595

3850

if self._converting_to_rich_root:

3596

3851

self._revision_id_to_root_id[current_revision_id] = \

3597

3852

tree.get_root_id()

3598

# Find text entries that need to be copied

3853

# Determine which texts are present in this revision but not in

3854

# any of the available parents.

3855

texts_possibly_new_in_tree = set()

3599

3856

for old_path, new_path, file_id, entry in delta:

3600

if new_path is not None:

3601

if not new_path:

3602

# This is the root

3603

if not self.target.supports_rich_root():

3604

# The target doesn't support rich root, so we don't

3605

# copy

3606

continue

3607

if self._converting_to_rich_root:

3608

# This can't be copied normally, we have to insert

3609

# it specially

3610

root_keys_to_create.add((file_id, entry.revision))

3611

continue

3612

text_keys.add((file_id, entry.revision))

3613

revision = self.source.get_revision(current_revision_id)

3614

pending_deltas.append((basis_id, delta,

3615

current_revision_id, revision.parent_ids))

3857

if new_path is None:

3858

# This file_id isn't present in the new rev

3859

continue

3860

if not new_path:

3861

# This is the root

3862

if not self.target.supports_rich_root():

3863

# The target doesn't support rich root, so we don't

3864

# copy

3865

continue

3866

if self._converting_to_rich_root:

3867

# This can't be copied normally, we have to insert

3868

# it specially

3869

root_keys_to_create.add((file_id, entry.revision))

3870

continue

3871

kind = entry.kind

3872

texts_possibly_new_in_tree.add((file_id, entry.revision))

3873

for basis_id, basis_tree in possible_trees:

3874

basis_inv = basis_tree.inventory

3875

for file_key in list(texts_possibly_new_in_tree):

3876

file_id, file_revision = file_key

3877

try:

3878

entry = basis_inv[file_id]

3879

except errors.NoSuchId:

3880

continue

3881

if entry.revision == file_revision:

3882

texts_possibly_new_in_tree.remove(file_key)

3883

text_keys.update(texts_possibly_new_in_tree)

3616

3884

pending_revisions.append(revision)

3617

3885

cache[current_revision_id] = tree

3618

3886

basis_id = current_revision_id

3620

3888

from_texts = self.source.texts

3621

3889

to_texts = self.target.texts

3622

3890

if root_keys_to_create:

3623

root_stream = self._new_root_data_stream(root_keys_to_create,

3624

parent_map)

3891

from bzrlib.fetch import _new_root_data_stream

3892

root_stream = _new_root_data_stream(

3893

root_keys_to_create, self._revision_id_to_root_id, parent_map,

3894

self.source)

3625

3895

to_texts.insert_record_stream(root_stream)

3626

3896

to_texts.insert_record_stream(from_texts.get_record_stream(

3627

3897

text_keys, self.target._format._fetch_order,

3634

3904

# for the new revisions that we are about to insert. We do this

3635

3905

# before adding the revisions so that no revision is added until

3636

3906

# all the inventories it may depend on are added.

3907

# Note that this is overzealous, as we may have fetched these in an

3908

# earlier batch.

3637

3909

parent_ids = set()

3638

3910

revision_ids = set()

3639

3911

for revision in pending_revisions:

3642

3914

parent_ids.difference_update(revision_ids)

3643

3915

parent_ids.discard(_mod_revision.NULL_REVISION)

3644

3916

parent_map = self.source.get_parent_map(parent_ids)

3645

for parent_tree in self.source.revision_trees(parent_ids):

3646

basis_id, delta = self._get_delta_for_revision(tree, parent_ids, basis_id, cache)

3917

# we iterate over parent_map and not parent_ids because we don't

3918

# want to try copying any revision which is a ghost

3919

for parent_tree in self.source.revision_trees(parent_map):

3647

3920

current_revision_id = parent_tree.get_revision_id()

3648

3921

parents_parents = parent_map[current_revision_id]

3922

possible_trees = self._get_trees(parents_parents, cache)

3923

if len(possible_trees) == 0:

3924

# There either aren't any parents, or the parents are

3925

# ghosts, so just use the last converted tree.

3926

possible_trees.append((basis_id, cache[basis_id]))

3927

basis_id, delta = self._get_delta_for_revision(parent_tree,

3928

parents_parents, possible_trees)

3649

3929

self.target.add_inventory_by_delta(

3650

3930

basis_id, delta, current_revision_id, parents_parents)

3651

3931

# insert signatures and revisions

3665

3945

3666

3946

:param revision_ids: The list of revisions to fetch. Must be in

3667

3947

topological order.

3668

:param pb: A ProgressBar

3948

:param pb: A ProgressTask

3669

3949

:return: None

3670

3950

"""

3671

3951

basis_id, basis_tree = self._get_basis(revision_ids[0])

3673

3953

cache = lru_cache.LRUCache(100)

3674

3954

cache[basis_id] = basis_tree

3675

3955

del basis_tree # We don't want to hang on to it here

3956

hints = []

3676

3957

for offset in range(0, len(revision_ids), batch_size):

3677

3958

self.target.start_write_group()

3678

3959

try:

3684

3965

self.target.abort_write_group()

3685

3966

raise

3686

3967

else:

3687

self.target.commit_write_group()

3968

hint = self.target.commit_write_group()

3969

if hint:

3970

hints.extend(hint)

3971

if hints and self.target._format.pack_compresses:

3972

self.target.pack(hint=hints)

3688

3973

pb.update('Transferring revisions', len(revision_ids),

3689

3974

len(revision_ids))

3690

3975

3711

3996

# Walk through all revisions; get inventory deltas, copy referenced

3712

3997

# texts that delta references, insert the delta, revision and

3713

3998

# signature.

3714

first_rev = self.source.get_revision(revision_ids[0])

3715

3999

if pb is None:

3716

4000

my_pb = ui.ui_factory.nested_progress_bar()

3717

4001

pb = my_pb

3754

4038

InterRepository.register_optimiser(InterSameDataRepository)

3755

4039

InterRepository.register_optimiser(InterWeaveRepo)

3756

4040

InterRepository.register_optimiser(InterKnitRepo)

3757

InterRepository.register_optimiser(InterPackRepo)

3758

4041

3759

4042

3760

4043

class CopyConverter(object):

3841

4124

3842

4125

class _VersionedFileChecker(object):

3843

4126

3844

def __init__(self, repository, text_key_references=None):

4127

def __init__(self, repository, text_key_references=None, ancestors=None):

3845

4128

self.repository = repository

3846

4129

self.text_index = self.repository._generate_text_key_index(

3847

text_key_references=text_key_references)

4130

text_key_references=text_key_references, ancestors=ancestors)

3848

4131

3849

4132

def calculate_file_version_parents(self, text_key):

3850

4133

"""Calculate the correct parents for a file version according to

3868

4151

revision_id) tuples for versions that are present in this versioned

3869

4152

file, but not used by the corresponding inventory.

3870

4153

"""

4154

local_progress = None

4155

if progress_bar is None:

4156

local_progress = ui.ui_factory.nested_progress_bar()

4157

progress_bar = local_progress

4158

try:

4159

return self._check_file_version_parents(texts, progress_bar)

4160

finally:

4161

if local_progress:

4162

local_progress.finished()

4163

4164

def _check_file_version_parents(self, texts, progress_bar):

4165

"""See check_file_version_parents."""

3871

4166

wrong_parents = {}

3872

4167

self.file_ids = set([file_id for file_id, _ in

3873

4168

self.text_index.iterkeys()])

3874

4169

# text keys is now grouped by file_id

3875

n_weaves = len(self.file_ids)

3876

files_in_revisions = {}

3877

revisions_of_files = {}

3878

4170

n_versions = len(self.text_index)

3879

4171

progress_bar.update('loading text store', 0, n_versions)

3880

4172

parent_map = self.repository.texts.get_parent_map(self.text_index)

3882

4174

text_keys = self.repository.texts.keys()

3883

4175

unused_keys = frozenset(text_keys) - set(self.text_index)

3884

4176

for num, key in enumerate(self.text_index.iterkeys()):

3885

if progress_bar is not None:

3886

progress_bar.update('checking text graph', num, n_versions)

4177

progress_bar.update('checking text graph', num, n_versions)

3887

4178

correct_parents = self.calculate_file_version_parents(key)

3888

4179

try:

3889

4180

knit_parents = parent_map[key]

3938

4229

try:

3939

4230

if resume_tokens:

3940

4231

self.target_repo.resume_write_group(resume_tokens)

4232

is_resume = True

3941

4233

else:

3942

4234

self.target_repo.start_write_group()

4235

is_resume = False

3943

4236

try:

3944

4237

# locked_insert_stream performs a commit|suspend.

3945

return self._locked_insert_stream(stream, src_format)

4238

return self._locked_insert_stream(stream, src_format, is_resume)

3946

4239

except:

3947

4240

self.target_repo.abort_write_group(suppress_errors=True)

3948

4241

raise

3949

4242

finally:

3950

4243

self.target_repo.unlock()

3951

4244

3952

def _locked_insert_stream(self, stream, src_format):

4245

def _locked_insert_stream(self, stream, src_format, is_resume):

3953

4246

to_serializer = self.target_repo._format._serializer

3954

4247

src_serializer = src_format._serializer

4248

new_pack = None

3955

4249

if to_serializer == src_serializer:

3956

4250

# If serializers match and the target is a pack repository, set the

3957

4251

# write cache size on the new pack. This avoids poor performance

3971

4265

else:

3972

4266

new_pack.set_write_cache_size(1024*1024)

3973

4267

for substream_type, substream in stream:

4268

if 'stream' in debug.debug_flags:

4269

mutter('inserting substream: %s', substream_type)

3974

4270

if substream_type == 'texts':

3975

4271

self.target_repo.texts.insert_record_stream(substream)

3976

4272

elif substream_type == 'inventories':

3980

4276

else:

3981

4277

self._extract_and_insert_inventories(

3982

4278

substream, src_serializer)

4279

elif substream_type == 'inventory-deltas':

4280

self._extract_and_insert_inventory_deltas(

4281

substream, src_serializer)

3983

4282

elif substream_type == 'chk_bytes':

3984

4283

# XXX: This doesn't support conversions, as it assumes the

3985

4284

# conversion was done in the fetch code.

3998

4297

self.target_repo.signatures.insert_record_stream(substream)

3999

4298

else:

4000

4299

raise AssertionError('kaboom! %s' % (substream_type,))

4300

# Done inserting data, and the missing_keys calculations will try to

4301

# read back from the inserted data, so flush the writes to the new pack

4302

# (if this is pack format).

4303

if new_pack is not None:

4304

new_pack._write_data('', flush=True)

4305

# Find all the new revisions (including ones from resume_tokens)

4306

missing_keys = self.target_repo.get_missing_parent_inventories(

4307

check_for_missing_texts=is_resume)

4001

4308

try:

4002

missing_keys = set()

4003

4309

for prefix, versioned_file in (

4004

4310

('texts', self.target_repo.texts),

4005

4311

('inventories', self.target_repo.inventories),

4006

4312

('revisions', self.target_repo.revisions),

4007

4313

('signatures', self.target_repo.signatures),

4314

('chk_bytes', self.target_repo.chk_bytes),

4008

4315

4316

if versioned_file is None:

4317

continue

4009

4318

missing_keys.update((prefix,) + key for key in

4010

4319

versioned_file.get_missing_compression_parent_keys())

4011

4320

except NotImplementedError:

4020

4329

# missing keys can handle suspending a write group).

4021

4330

write_group_tokens = self.target_repo.suspend_write_group()

4022

4331

return write_group_tokens, missing_keys

4023

self.target_repo.commit_write_group()

4332

hint = self.target_repo.commit_write_group()

4333

if (to_serializer != src_serializer and

4334

self.target_repo._format.pack_compresses):

4335

self.target_repo.pack(hint=hint)

4024

4336

return [], set()

4025

4337

4026

def _extract_and_insert_inventories(self, substream, serializer):

4338

def _extract_and_insert_inventory_deltas(self, substream, serializer):

4339

target_rich_root = self.target_repo._format.rich_root_data

4340

target_tree_refs = self.target_repo._format.supports_tree_reference

4341

for record in substream:

4342

# Insert the delta directly

4343

inventory_delta_bytes = record.get_bytes_as('fulltext')

4344

deserialiser = inventory_delta.InventoryDeltaDeserializer()

4345

try:

4346

parse_result = deserialiser.parse_text_bytes(

4347

inventory_delta_bytes)

4348

except inventory_delta.IncompatibleInventoryDelta, err:

4349

trace.mutter("Incompatible delta: %s", err.msg)

4350

raise errors.IncompatibleRevision(self.target_repo._format)

4351

basis_id, new_id, rich_root, tree_refs, inv_delta = parse_result

4352

revision_id = new_id

4353

parents = [key[0] for key in record.parents]

4354

self.target_repo.add_inventory_by_delta(

4355

basis_id, inv_delta, revision_id, parents)

4356

4357

def _extract_and_insert_inventories(self, substream, serializer,

4358

parse_delta=None):

4027

4359

"""Generate a new inventory versionedfile in target, converting data.

4028

4360

4029

4361

The inventory is retrieved from the source, (deserializing it), and

4030

4362

stored in the target (reserializing it in a different format).

4031

4363

"""

4364

target_rich_root = self.target_repo._format.rich_root_data

4365

target_tree_refs = self.target_repo._format.supports_tree_reference

4032

4366

for record in substream:

4367

# It's not a delta, so it must be a fulltext in the source

4368

# serializer's format.

4033

4369

bytes = record.get_bytes_as('fulltext')

4034

4370

revision_id = record.key[0]

4035

4371

inv = serializer.read_inventory_from_string(bytes, revision_id)

4036

4372

parents = [key[0] for key in record.parents]

4037

4373

self.target_repo.add_inventory(revision_id, inv, parents)

4374

# No need to keep holding this full inv in memory when the rest of

4375

# the substream is likely to be all deltas.

4376

del inv

4038

4377

4039

4378

def _extract_and_insert_revisions(self, substream, serializer):

4040

4379

for record in substream:

4089

4428

return [('signatures', signatures), ('revisions', revisions)]

4090

4429

4091

4430

def _generate_root_texts(self, revs):

4092

"""This will be called by __fetch between fetching weave texts and

4431

"""This will be called by get_stream between fetching weave texts and

4093

4432

fetching the inventory weave.

4094

4095

Subclasses should override this if they need to generate root texts

4096

after fetching weave texts.

4097

4433

"""

4098

4434

if self._rich_root_upgrade():

4099

4435

import bzrlib.fetch

4106

4442

phase = 'file'

4107

4443

revs = search.get_keys()

4108

4444

graph = self.from_repository.get_graph()

4109

revs = list(graph.iter_topo_order(revs))

4445

revs = tsort.topo_sort(graph.get_parent_map(revs))

4110

4446

data_to_fetch = self.from_repository.item_keys_introduced_by(revs)

4111

4447

text_keys = []

4112

4448

for knit_kind, file_id, revisions in data_to_fetch:

4131

4467

# will be valid.

4132

4468

for _ in self._generate_root_texts(revs):

4133

4469

yield _

4134

# NB: This currently reopens the inventory weave in source;

4135

# using a single stream interface instead would avoid this.

4136

from_weave = self.from_repository.inventories

4137

4470

# we fetch only the referenced inventories because we do not

4138

4471

# know for unselected inventories whether all their required

4139

4472

# texts are present in the other repository - it could be

4158

4491

keys['texts'] = set()

4159

4492

keys['revisions'] = set()

4160

4493

keys['inventories'] = set()

4494

keys['chk_bytes'] = set()

4161

4495

keys['signatures'] = set()

4162

4496

for key in missing_keys:

4163

4497

keys[key[0]].add(key[1:])

4170

4504

keys['revisions'],))

4171

4505

for substream_kind, keys in keys.iteritems():

4172

4506

vf = getattr(self.from_repository, substream_kind)

4507

if vf is None and keys:

4508

raise AssertionError(

4509

"cannot fill in keys for a versioned file we don't"

4510

" have: %s needs %s" % (substream_kind, keys))

4511

if not keys:

4512

# No need to stream something we don't have

4513

continue

4514

if substream_kind == 'inventories':

4515

# Some missing keys are genuinely ghosts, filter those out.

4516

present = self.from_repository.inventories.get_parent_map(keys)

4517

revs = [key[0] for key in present]

4518

# Get the inventory stream more-or-less as we do for the

4519

# original stream; there's no reason to assume that records

4520

# direct from the source will be suitable for the sink. (Think

4521

# e.g. 2a -> 1.9-rich-root).

4522

for info in self._get_inventory_stream(revs, missing=True):

4523

yield info

4524

continue

4525

4173

4526

# Ask for full texts always so that we don't need more round trips

4174

4527

# after this stream.

4175

stream = vf.get_record_stream(keys,

4176

self.to_format._fetch_order, True)

4528

# Some of the missing keys are genuinely ghosts, so filter absent

4529

# records. The Sink is responsible for doing another check to

4530

# ensure that ghosts don't introduce missing data for future

4531

# fetches.

4532

stream = versionedfile.filter_absent(vf.get_record_stream(keys,

4533

self.to_format._fetch_order, True))

4177

4534

yield substream_kind, stream

4178

4535

4179

4536

def inventory_fetch_order(self):

4186

4543

return (not self.from_repository._format.rich_root_data and

4187

4544

self.to_format.rich_root_data)

4188

4545

4189

def _get_inventory_stream(self, revision_ids):

4546

def _get_inventory_stream(self, revision_ids, missing=False):

4190

4547

from_format = self.from_repository._format

4191

if (from_format.supports_chks and self.to_format.supports_chks

4192

and (from_format._serializer == self.to_format._serializer)):

4193

# Both sides support chks, and they use the same serializer, so it

4194

# is safe to transmit the chk pages and inventory pages across

4195

# as-is.

4196

return self._get_chk_inventory_stream(revision_ids)

4197

elif (not from_format.supports_chks):

4198

# Source repository doesn't support chks. So we can transmit the

4199

# inventories 'as-is' and either they are just accepted on the

4200

# target, or the Sink will properly convert it.

4201

return self._get_simple_inventory_stream(revision_ids)

4548

if (from_format.supports_chks and self.to_format.supports_chks and

4549

from_format.network_name() == self.to_format.network_name()):

4550

raise AssertionError(

4551

"this case should be handled by GroupCHKStreamSource")

4552

elif 'forceinvdeltas' in debug.debug_flags:

4553

return self._get_convertable_inventory_stream(revision_ids,

4554

delta_versus_null=missing)

4555

elif from_format.network_name() == self.to_format.network_name():

4556

# Same format.

4557

return self._get_simple_inventory_stream(revision_ids,

4558

missing=missing)

4559

elif (not from_format.supports_chks and not self.to_format.supports_chks

4560

and from_format._serializer == self.to_format._serializer):

4561

# Essentially the same format.

4562

return self._get_simple_inventory_stream(revision_ids,

4563

missing=missing)

4202

4564

else:

4203

# XXX: Hack to make not-chk->chk fetch: copy the inventories as

4204

# inventories. Note that this should probably be done somehow

4205

# as part of bzrlib.repository.StreamSink. Except JAM couldn't

4206

# figure out how a non-chk repository could possibly handle

4207

# deserializing an inventory stream from a chk repo, as it

4208

# doesn't have a way to understand individual pages.

4209

return self._get_convertable_inventory_stream(revision_ids)

4565

# Any time we switch serializations, we want to use an

4566

# inventory-delta based approach.

4567

return self._get_convertable_inventory_stream(revision_ids,

4568

delta_versus_null=missing)

4210

4569

4211

def _get_simple_inventory_stream(self, revision_ids):

4570

def _get_simple_inventory_stream(self, revision_ids, missing=False):

4571

# NB: This currently reopens the inventory weave in source;

4572

# using a single stream interface instead would avoid this.

4212

4573

from_weave = self.from_repository.inventories

4574

if missing:

4575

delta_closure = True

4576

else:

4577

delta_closure = not self.delta_on_metadata()

4213

4578

yield ('inventories', from_weave.get_record_stream(

4214

4579

[(rev_id,) for rev_id in revision_ids],

4215

self.inventory_fetch_order(),

4216

not self.delta_on_metadata()))

4217

4218

def _get_chk_inventory_stream(self, revision_ids):

4219

"""Fetch the inventory texts, along with the associated chk maps."""

4220

# We want an inventory outside of the search set, so that we can filter

4221

# out uninteresting chk pages. For now we use

4222

# _find_revision_outside_set, but if we had a Search with cut_revs, we

4223

# could use that instead.

4224

start_rev_id = self.from_repository._find_revision_outside_set(

4225

revision_ids)

4226

start_rev_key = (start_rev_id,)

4227

inv_keys_to_fetch = [(rev_id,) for rev_id in revision_ids]

4228

if start_rev_id != _mod_revision.NULL_REVISION:

4229

inv_keys_to_fetch.append((start_rev_id,))

4230

# Any repo that supports chk_bytes must also support out-of-order

4231

# insertion. At least, that is how we expect it to work

4232

# We use get_record_stream instead of iter_inventories because we want

4233

# to be able to insert the stream as well. We could instead fetch

4234

# allowing deltas, and then iter_inventories, but we don't know whether

4235

# source or target is more 'local' anway.

4236

inv_stream = self.from_repository.inventories.get_record_stream(

4237

inv_keys_to_fetch, 'unordered',

4238

True) # We need them as full-texts so we can find their references

4239

uninteresting_chk_roots = set()

4240

interesting_chk_roots = set()

4241

def filter_inv_stream(inv_stream):

4242

for idx, record in enumerate(inv_stream):

4243

### child_pb.update('fetch inv', idx, len(inv_keys_to_fetch))

4244

bytes = record.get_bytes_as('fulltext')

4245

chk_inv = inventory.CHKInventory.deserialise(

4246

self.from_repository.chk_bytes, bytes, record.key)

4247

if record.key == start_rev_key:

4248

uninteresting_chk_roots.add(chk_inv.id_to_entry.key())

4249

p_id_map = chk_inv.parent_id_basename_to_file_id

4250

if p_id_map is not None:

4251

uninteresting_chk_roots.add(p_id_map.key())

4252

else:

4253

yield record

4254

interesting_chk_roots.add(chk_inv.id_to_entry.key())

4255

p_id_map = chk_inv.parent_id_basename_to_file_id

4256

if p_id_map is not None:

4257

interesting_chk_roots.add(p_id_map.key())

4258

### pb.update('fetch inventory', 0, 2)

4259

yield ('inventories', filter_inv_stream(inv_stream))

4260

# Now that we have worked out all of the interesting root nodes, grab

4261

# all of the interesting pages and insert them

4262

### pb.update('fetch inventory', 1, 2)

4263

interesting = chk_map.iter_interesting_nodes(

4264

self.from_repository.chk_bytes, interesting_chk_roots,

4265

uninteresting_chk_roots)

4266

def to_stream_adapter():

4267

"""Adapt the iter_interesting_nodes result to a single stream.

4268

4269

iter_interesting_nodes returns records as it processes them, along

4270

with keys. However, we only want to return the records themselves.

4271

"""

4272

for record, items in interesting:

4273

if record is not None:

4274

yield record

4275

# XXX: We could instead call get_record_stream(records.keys())

4276

# ATM, this will always insert the records as fulltexts, and

4277

# requires that you can hang on to records once you have gone

4278

# on to the next one. Further, it causes the target to

4279

# recompress the data. Testing shows it to be faster than

4280

# requesting the records again, though.

4281

yield ('chk_bytes', to_stream_adapter())

4282

### pb.update('fetch inventory', 2, 2)

4283

4284

def _get_convertable_inventory_stream(self, revision_ids):

4285

# XXX: One of source or target is using chks, and they don't have

4286

# compatible serializations. The StreamSink code expects to be

4287

# able to convert on the target, so we need to put

4288

# bytes-on-the-wire that can be converted

4289

yield ('inventories', self._stream_invs_as_fulltexts(revision_ids))

4290

4291

def _stream_invs_as_fulltexts(self, revision_ids):

4580

self.inventory_fetch_order(), delta_closure))

4581

4582

def _get_convertable_inventory_stream(self, revision_ids,

4583

delta_versus_null=False):

4584

# The source is using CHKs, but the target either doesn't or it has a

4585

# different serializer. The StreamSink code expects to be able to

4586

# convert on the target, so we need to put bytes-on-the-wire that can

4587

# be converted. That means inventory deltas (if the remote is <1.19,

4588

# RemoteStreamSink will fallback to VFS to insert the deltas).

4589

yield ('inventory-deltas',

4590

self._stream_invs_as_deltas(revision_ids,

4591

delta_versus_null=delta_versus_null))

4592

4593

def _stream_invs_as_deltas(self, revision_ids, delta_versus_null=False):

4594

"""Return a stream of inventory-deltas for the given rev ids.

4595

4596

:param revision_ids: The list of inventories to transmit

4597

:param delta_versus_null: Don't try to find a minimal delta for this

4598

entry, instead compute the delta versus the NULL_REVISION. This

4599

effectively streams a complete inventory. Used for stuff like

4600

filling in missing parents, etc.

4601

"""

4292

4602

from_repo = self.from_repository

4293

from_serializer = from_repo._format._serializer

4294

4603

revision_keys = [(rev_id,) for rev_id in revision_ids]

4295

4604

parent_map = from_repo.inventories.get_parent_map(revision_keys)

4296

for inv in self.from_repository.iter_inventories(revision_ids):

4297

# XXX: This is a bit hackish, but it works. Basically,

4298

# CHKSerializer 'accidentally' supports

4299

# read/write_inventory_to_string, even though that is never

4300

# the format that is stored on disk. It *does* give us a

4301

# single string representation for an inventory, so live with

4302

# it for now.

4303

# This would be far better if we had a 'serialized inventory

4304

# delta' form. Then we could use 'inventory._make_delta', and

4305

# transmit that. This would both be faster to generate, and

4306

# result in fewer bytes-on-the-wire.

4307

as_bytes = from_serializer.write_inventory_to_string(inv)

4605

# XXX: possibly repos could implement a more efficient iter_inv_deltas

4606

# method...

4607

inventories = self.from_repository.iter_inventories(

4608

revision_ids, 'topological')

4609

format = from_repo._format

4610

invs_sent_so_far = set([_mod_revision.NULL_REVISION])

4611

inventory_cache = lru_cache.LRUCache(50)

4612

null_inventory = from_repo.revision_tree(

4613

_mod_revision.NULL_REVISION).inventory

4614

# XXX: ideally the rich-root/tree-refs flags would be per-revision, not

4615

# per-repo (e.g. streaming a non-rich-root revision out of a rich-root

4616

# repo back into a non-rich-root repo ought to be allowed)

4617

serializer = inventory_delta.InventoryDeltaSerializer(

4618

versioned_root=format.rich_root_data,

4619

tree_references=format.supports_tree_reference)

4620

for inv in inventories:

4308

4621

key = (inv.revision_id,)

4309

4622

parent_keys = parent_map.get(key, ())

4623

delta = None

4624

if not delta_versus_null and parent_keys:

4625

# The caller did not ask for complete inventories and we have

4626

# some parents that we can delta against. Make a delta against

4627

# each parent so that we can find the smallest.

4628

parent_ids = [parent_key[0] for parent_key in parent_keys]

4629

for parent_id in parent_ids:

4630

if parent_id not in invs_sent_so_far:

4631

# We don't know that the remote side has this basis, so

4632

# we can't use it.

4633

continue

4634

if parent_id == _mod_revision.NULL_REVISION:

4635

parent_inv = null_inventory

4636

else:

4637

parent_inv = inventory_cache.get(parent_id, None)

4638

if parent_inv is None:

4639

parent_inv = from_repo.get_inventory(parent_id)

4640

candidate_delta = inv._make_delta(parent_inv)

4641

if (delta is None or

4642

len(delta) > len(candidate_delta)):

4643

delta = candidate_delta

4644

basis_id = parent_id

4645

if delta is None:

4646

# Either none of the parents ended up being suitable, or we

4647

# were asked to delta against NULL

4648

basis_id = _mod_revision.NULL_REVISION

4649

delta = inv._make_delta(null_inventory)

4650

invs_sent_so_far.add(inv.revision_id)

4651

inventory_cache[inv.revision_id] = inv

4652

delta_serialized = ''.join(

4653

serializer.delta_to_lines(basis_id, key[-1], delta))

4310

4654

yield versionedfile.FulltextContentFactory(

4311

key, parent_keys, None, as_bytes)

4655

key, parent_keys, None, delta_serialized)

4656

4657

4658

def _iter_for_revno(repo, partial_history_cache, stop_index=None,

4659

stop_revision=None):

4660

"""Extend the partial history to include a given index

4661

4662

If a stop_index is supplied, stop when that index has been reached.

4663

If a stop_revision is supplied, stop when that revision is

4664

encountered. Otherwise, stop when the beginning of history is

4665

reached.

4666

4667

:param stop_index: The index which should be present. When it is

4668

present, history extension will stop.

4669

:param stop_revision: The revision id which should be present. When

4670

it is encountered, history extension will stop.

4671

"""

4672

start_revision = partial_history_cache[-1]

4673

iterator = repo.iter_reverse_revision_history(start_revision)

4674

try:

4675

#skip the last revision in the list

4676

iterator.next()

4677

while True:

4678

if (stop_index is not None and

4679

len(partial_history_cache) > stop_index):

4680

break

4681

if partial_history_cache[-1] == stop_revision:

4682

break

4683

revision_id = iterator.next()

4684

partial_history_cache.append(revision_id)

4685

except StopIteration:

4686

# No more history

4687

return

4312

4688

Older »