# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
from cStringIO import StringIO

from bzrlib.lazy_import import lazy_import
lazy_import(globals(), """
from bzrlib import (
    revision as _mod_revision,
    )
from bzrlib.bundle import serializer
from bzrlib.revisiontree import RevisionTree
from bzrlib.store.versioned import VersionedFileStore
from bzrlib.testament import Testament
""")
from bzrlib.decorators import needs_read_lock, needs_write_lock
from bzrlib.inter import InterObject
from bzrlib.inventory import (
    Inventory,
    InventoryDirectory,
    ROOT_ID,
    entry_factory,
    )
from bzrlib import registry
from bzrlib.symbol_versioning import (
from bzrlib.trace import (
    log_exception_quietly, note, mutter, mutter_callsite, warning)

# Old formats display a warning, but only once
_deprecation_warning_done = False


class CommitBuilder(object):
    """Provides an interface to build up a commit.

    This allows describing a tree to be committed without needing to
    know the internals of the format of the repository.
    """

    # all clients should supply tree roots.
    record_root_entry = True
    # the default CommitBuilder does not manage trees whose root is versioned.
    _versioned_root = False

    def __init__(self, repository, parents, config, timestamp=None,
                 timezone=None, committer=None, revprops=None,
                 revision_id=None):
        """Initialize a CommitBuilder.

        :param repository: Repository to commit to.
        :param parents: Revision ids of the parents of the new revision.
        :param config: Configuration to use.
        :param timestamp: Optional timestamp recorded for commit.
        :param timezone: Optional timezone for timestamp.
        :param committer: Optional committer to set for commit.
        :param revprops: Optional dictionary of revision properties.
        :param revision_id: Optional revision id.
        """
        self._config = config

        if committer is None:
            self._committer = self._config.username()
        else:
            self._committer = committer

        self.new_inventory = Inventory(None)
        self._new_revision_id = revision_id
        self.parents = parents
        self.repository = repository

        self._revprops = {}
        if revprops is not None:
            self._validate_revprops(revprops)
            self._revprops.update(revprops)

        if timestamp is None:
            timestamp = time.time()
        # Restrict resolution to 1ms
        self._timestamp = round(timestamp, 3)

        if timezone is None:
            self._timezone = osutils.local_time_offset()
        else:
            self._timezone = int(timezone)

        self._generate_revision_if_needed()
        self.__heads = graph.HeadsCache(repository.get_graph()).heads
        self._basis_delta = []
        # API compatibility, older code that used CommitBuilder did not call
        # .record_delete(), which means the delta that is computed would not be
        # valid. Callers that will call record_delete() should call
        # .will_record_deletes() to indicate that.
        self._recording_deletes = False
        # memo'd check for no-op commits.
        self._any_changes = False

    def any_changes(self):
        """Return True if any entries were changed.

        This includes merge-only changes. It is the core for the --unchanged
        detection in commit.

        :return: True if any changes have occurred.
        """
        return self._any_changes

    def _validate_unicode_text(self, text, context):
        """Verify things like commit messages don't have bogus characters."""
        if '\r' in text:
            raise ValueError('Invalid value for %s: %r' % (context, text))

    def _validate_revprops(self, revprops):
        for key, value in revprops.iteritems():
            # We know that the XML serializers do not round trip '\r'
            # correctly, so refuse to accept them
            if not isinstance(value, basestring):
                raise ValueError('revision property (%s) is not a valid'
                                 ' (unicode) string: %r' % (key, value))
            self._validate_unicode_text(value,
                                        'revision property (%s)' % (key,))

    def commit(self, message):
        """Make the actual commit.

        :return: The revision id of the recorded revision.
        """
        self._validate_unicode_text(message, 'commit message')
        rev = _mod_revision.Revision(
                       timestamp=self._timestamp,
                       timezone=self._timezone,
                       committer=self._committer,
                       message=message,
                       inventory_sha1=self.inv_sha1,
                       revision_id=self._new_revision_id,
                       properties=self._revprops)
        rev.parent_ids = self.parents
        self.repository.add_revision(self._new_revision_id, rev,
            self.new_inventory, self._config)
        self.repository.commit_write_group()
        return self._new_revision_id
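
    # Illustrative sketch (not part of the class): the expected lifecycle of
    # a CommitBuilder, assuming a write-locked repository `repo` that is in a
    # write group, plus caller-supplied `branch`, `parents`, `config`, `tree`
    # and per-entry data:
    #
    #   builder = repo.get_commit_builder(branch, parents, config)
    #   for path, ie in entries_to_commit:
    #       builder.record_entry_contents(ie, parent_invs, path, tree,
    #           content_summary)
    #   builder.finish_inventory()
    #   rev_id = builder.commit('commit message')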

    def abort(self):
        """Abort the commit that is being built.
        """
        self.repository.abort_write_group()

    def revision_tree(self):
        """Return the tree that was just committed.

        After calling commit() this can be called to get a RevisionTree
        representing the newly committed tree. This is preferred to
        calling Repository.revision_tree() because that may require
        deserializing the inventory, while we already have a copy in
        memory.
        """
        if self.new_inventory is None:
            self.new_inventory = self.repository.get_inventory(
                self._new_revision_id)
        return RevisionTree(self.repository, self.new_inventory,
                            self._new_revision_id)

    def finish_inventory(self):
        """Tell the builder that the inventory is finished.

        :return: The inventory id in the repository, which can be used with
            repository.get_inventory.
        """
        if self.new_inventory is None:
            # an inventory delta was accumulated without creating a new
            # inventory.
            basis_id = self.basis_delta_revision
            self.inv_sha1 = self.repository.add_inventory_by_delta(
                basis_id, self._basis_delta, self._new_revision_id,
                self.parents)
        else:
            if self.new_inventory.root is None:
                raise AssertionError('Root entry should be supplied to'
                    ' record_entry_contents, as of bzr 0.10.')
                self.new_inventory.add(InventoryDirectory(ROOT_ID, '', None))
            self.new_inventory.revision_id = self._new_revision_id
            self.inv_sha1 = self.repository.add_inventory(
                self._new_revision_id,
                self.new_inventory,
                self.parents
                )
        return self._new_revision_id

    def _gen_revision_id(self):
        """Return new revision-id."""
        return generate_ids.gen_revision_id(self._config.username(),
                                            self._timestamp)

    def _generate_revision_if_needed(self):
        """Create a revision id if None was supplied.

        If the repository cannot support user-specified revision ids
        they should override this function and raise CannotSetRevisionId
        if _new_revision_id is not None.

        :raises: CannotSetRevisionId
        """
        if self._new_revision_id is None:
            self._new_revision_id = self._gen_revision_id()
            self.random_revid = True
        else:
            self.random_revid = False

    def _heads(self, file_id, revision_ids):
        """Calculate the graph heads for revision_ids in the graph of file_id.

        This can use either a per-file graph or a global revision graph as we
        have an identity relationship between the two graphs.
        """
        return self.__heads(revision_ids)

    def _check_root(self, ie, parent_invs, tree):
        """Helper for record_entry_contents.

        :param ie: An entry being added.
        :param parent_invs: The inventories of the parent revisions of the
            commit.
        :param tree: The tree that is being committed.
        """
        # In this revision format, root entries have no knit or weave. When
        # serializing out to disk and back in, root.revision is always
        # the new revision_id.
        ie.revision = self._new_revision_id

    def _require_root_change(self, tree):
        """Enforce an appropriate root object change.

        This is called once when record_iter_changes is called, if and only if
        the root was not in the delta calculated by record_iter_changes.

        :param tree: The tree which is being committed.
        """
        # NB: if there are no parents then this method is not called, so no
        # need to guard on parents having length.
        entry = entry_factory['directory'](tree.path2id(''), '',
            None)
        entry.revision = self._new_revision_id
        self._basis_delta.append(('', '', entry.file_id, entry))

    def _get_delta(self, ie, basis_inv, path):
        """Get a delta against the basis inventory for ie."""
        if ie.file_id not in basis_inv:
            # add
            result = (None, path, ie.file_id, ie)
            self._basis_delta.append(result)
            return result
        elif ie != basis_inv[ie.file_id]:
            # common but altered
            # TODO: avoid this id2path call.
            result = (basis_inv.id2path(ie.file_id), path, ie.file_id, ie)
            self._basis_delta.append(result)
            return result
        else:
            # common, unaltered
            return None

    def get_basis_delta(self):
        """Return the complete inventory delta versus the basis inventory.

        This has been built up with the calls to record_delete and
        record_entry_contents. The client must have already called
        will_record_deletes() to indicate that they will be generating a
        complete delta.

        :return: An inventory delta, suitable for use with apply_delta, or
            Repository.add_inventory_by_delta, etc.
        """
        if not self._recording_deletes:
            raise AssertionError("recording deletes not activated.")
        return self._basis_delta

    def record_delete(self, path, file_id):
        """Record that a delete occurred against a basis tree.

        This is an optional API - when used it adds items to the basis_delta
        being accumulated by the commit builder. It cannot be called unless the
        method will_record_deletes() has been called to inform the builder that
        a delta is being supplied.

        :param path: The path of the thing deleted.
        :param file_id: The file id that was deleted.
        """
        if not self._recording_deletes:
            raise AssertionError("recording deletes not activated.")
        delta = (path, None, file_id, None)
        self._basis_delta.append(delta)
        self._any_changes = True
        return delta

    def will_record_deletes(self):
        """Tell the commit builder that deletes are being notified.

        This enables the accumulation of an inventory delta; for the resulting
        commit to be valid, deletes against the basis MUST be recorded via
        builder.record_delete().
        """
        self._recording_deletes = True
        try:
            basis_id = self.parents[0]
        except IndexError:
            basis_id = _mod_revision.NULL_REVISION
        self.basis_delta_revision = basis_id
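
    # Illustrative sketch (assumed caller code, not part of the class): to
    # supply a delta, deletes must be announced before they are recorded:
    #
    #   builder.will_record_deletes()
    #   builder.record_delete('doomed-path', 'doomed-file-id')
    #   ...record the remaining entries...
    #   delta = builder.get_basis_delta()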

    def record_entry_contents(self, ie, parent_invs, path, tree,
        content_summary):
        """Record the content of ie from tree into the commit if needed.

        Side effect: sets ie.revision when unchanged

        :param ie: An inventory entry present in the commit.
        :param parent_invs: The inventories of the parent revisions of the
            commit.
        :param path: The path the entry is at in the tree.
        :param tree: The tree which contains this entry and should be used to
            obtain content.
        :param content_summary: Summary data from the tree about the paths
            content - stat, length, exec, sha/link target. This is only
            accessed when the entry has a revision of None - that is when it is
            a candidate to commit.
        :return: A tuple (change_delta, version_recorded, fs_hash).
            change_delta is an inventory_delta change for this entry against
            the basis tree of the commit, or None if no change occurred against
            the basis tree.
            version_recorded is True if a new version of the entry has been
            recorded. For instance, committing a merge where a file was only
            changed on the other side will return (delta, False).
            fs_hash is either None, or the hash details for the path (currently
            a tuple of the contents sha1 and the statvalue returned by
            tree.get_file_with_stat()).
        """
        if self.new_inventory.root is None:
            if ie.parent_id is not None:
                raise errors.RootMissing()
            self._check_root(ie, parent_invs, tree)
        if ie.revision is None:
            kind = content_summary[0]
        else:
            # ie is carried over from a prior commit
            kind = ie.kind
        # XXX: repository specific check for nested tree support goes here - if
        # the repo doesn't want nested trees we skip it ?
        if (kind == 'tree-reference' and
            not self.repository._format.supports_tree_reference):
            # mismatch between commit builder logic and repository:
            # this needs the entry creation pushed down into the builder.
            raise NotImplementedError('Missing repository subtree support.')
        self.new_inventory.add(ie)

        # TODO: slow, take it out of the inner loop.
        try:
            basis_inv = parent_invs[0]
        except IndexError:
            basis_inv = Inventory(root_id=None)

        # ie.revision is always None if the InventoryEntry is considered
        # for committing. We may record the previous parents revision if the
        # content is actually unchanged against a sole head.
        if ie.revision is not None:
            if not self._versioned_root and path == '':
                # repositories that do not version the root set the root's
                # revision to the new commit even when no change occurs (more
                # specifically, they do not record a revision on the root; and
                # the rev id is assigned to the root during deserialisation -
                # this masks when a change may have occurred against the basis.
                # To match this we always issue a delta, because the revision
                # of the root will always be changing.
                if ie.file_id in basis_inv:
                    delta = (basis_inv.id2path(ie.file_id), path,
                        ie.file_id, ie)
                else:
                    # add
                    delta = (None, path, ie.file_id, ie)
                self._basis_delta.append(delta)
                return delta, False, None
            else:
                # we don't need to commit this, because the caller already
                # determined that an existing revision of this file is
                # appropriate. If it's not being considered for committing then
                # it and all its parents to the root must be unaltered so
                # no-change against the basis.
                if ie.revision == self._new_revision_id:
                    raise AssertionError("Impossible situation, a skipped "
                        "inventory entry (%r) claims to be modified in this "
                        "commit (%r).", (ie, self._new_revision_id))
                return None, False, None
        # XXX: Friction: parent_candidates should return a list not a dict
        #      so that we don't have to walk the inventories again.
        parent_candidate_entries = ie.parent_candidates(parent_invs)
        head_set = self._heads(ie.file_id, parent_candidate_entries.keys())
        heads = []
        for inv in parent_invs:
            if ie.file_id in inv:
                old_rev = inv[ie.file_id].revision
                if old_rev in head_set:
                    heads.append(inv[ie.file_id].revision)
                    head_set.remove(inv[ie.file_id].revision)

        store = False
        # now we check to see if we need to write a new record to the
        # file-graph.
        # We write a new entry unless there is one head to the ancestors, and
        # the kind-derived content is unchanged.

        # Cheapest check first: no ancestors, or more than one head in the
        # ancestors, we write a new node.
        if len(heads) != 1:
            store = True
        if not store:
            # There is a single head, look it up for comparison
            parent_entry = parent_candidate_entries[heads[0]]
            # if the non-content specific data has changed, we'll be writing a
            # node:
            if (parent_entry.parent_id != ie.parent_id or
                parent_entry.name != ie.name):
                store = True
        # now we need to do content specific checks:
        if not store:
            # if the kind changed the content obviously has
            if kind != parent_entry.kind:
                store = True
        # Stat cache fingerprint feedback for the caller - None as we usually
        # don't generate one.
        fingerprint = None
        if kind == 'file':
            if content_summary[2] is None:
                raise ValueError("Files must not have executable = None")
            if not store:
                if (# if the file length changed we have to store:
                    parent_entry.text_size != content_summary[1] or
                    # if the exec bit has changed we have to store:
                    parent_entry.executable != content_summary[2]):
                    store = True
                elif parent_entry.text_sha1 == content_summary[3]:
                    # all meta and content is unchanged (using a hash cache
                    # hit to check the sha)
                    ie.revision = parent_entry.revision
                    ie.text_size = parent_entry.text_size
                    ie.text_sha1 = parent_entry.text_sha1
                    ie.executable = parent_entry.executable
                    return self._get_delta(ie, basis_inv, path), False, None
                else:
                    # Either there is only a hash change (no hash cache entry,
                    # or same size content change), or there is no change on
                    # this file at all.
                    # Provide the parent's hash to the store layer, so that if
                    # the content is unchanged we will not store a new node.
                    nostore_sha = parent_entry.text_sha1
            if store:
                # We want to record a new node regardless of the presence or
                # absence of a content change in the file.
                nostore_sha = None
            ie.executable = content_summary[2]
            file_obj, stat_value = tree.get_file_with_stat(ie.file_id, path)
            try:
                lines = file_obj.readlines()
            finally:
                file_obj.close()
            try:
                ie.text_sha1, ie.text_size = self._add_text_to_weave(
                    ie.file_id, lines, heads, nostore_sha)
                # Let the caller know we generated a stat fingerprint.
                fingerprint = (ie.text_sha1, stat_value)
            except errors.ExistingContent:
                # Turns out that the file content was unchanged, and we were
                # only going to store a new node if it was changed. Carry over
                # the entry.
                ie.revision = parent_entry.revision
                ie.text_size = parent_entry.text_size
                ie.text_sha1 = parent_entry.text_sha1
                ie.executable = parent_entry.executable
                return self._get_delta(ie, basis_inv, path), False, None
        elif kind == 'directory':
            if not store:
                # all data is meta here, nothing specific to directory, so
                # carry over:
                ie.revision = parent_entry.revision
                return self._get_delta(ie, basis_inv, path), False, None
            lines = []
            self._add_text_to_weave(ie.file_id, lines, heads, None)
        elif kind == 'symlink':
            current_link_target = content_summary[3]
            if not store:
                # symlink target is not generic metadata, check if it has
                # changed.
                if current_link_target != parent_entry.symlink_target:
                    store = True
            if not store:
                # unchanged, carry over.
                ie.revision = parent_entry.revision
                ie.symlink_target = parent_entry.symlink_target
                return self._get_delta(ie, basis_inv, path), False, None
            ie.symlink_target = current_link_target
            lines = []
            self._add_text_to_weave(ie.file_id, lines, heads, None)
        elif kind == 'tree-reference':
            if not store:
                if content_summary[3] != parent_entry.reference_revision:
                    store = True
            if not store:
                # unchanged, carry over.
                ie.reference_revision = parent_entry.reference_revision
                ie.revision = parent_entry.revision
                return self._get_delta(ie, basis_inv, path), False, None
            ie.reference_revision = content_summary[3]
            lines = []
            self._add_text_to_weave(ie.file_id, lines, heads, None)
        else:
            raise NotImplementedError('unknown kind')
        ie.revision = self._new_revision_id
        self._any_changes = True
        return self._get_delta(ie, basis_inv, path), True, fingerprint

    def record_iter_changes(self, tree, basis_revision_id, iter_changes,
        _entry_factory=entry_factory):
        """Record a new tree via iter_changes.

        :param tree: The tree to obtain text contents from for changed objects.
        :param basis_revision_id: The revision id of the tree the iter_changes
            has been generated against. Currently assumed to be the same
            as self.parents[0] - if it is not, errors may occur.
        :param iter_changes: An iter_changes iterator with the changes to apply
            to basis_revision_id. The iterator must not include any items with
            a current kind of None - missing items must be either filtered out
            or errored-on before record_iter_changes sees the item.
        :param _entry_factory: Private method to bind entry_factory locally for
            performance.
        :return: A generator of (file_id, relpath, fs_hash) tuples for use with
            tree._observed_sha1.
        """
        # Create an inventory delta based on deltas between all the parents and
        # deltas between all the parent inventories. We use inventory deltas
        # between the inventory objects because iter_changes masks
        # last-changed-field only changes.
        # Repository specific:
        # file_id -> change map, change is fileid, paths, changed, versioneds,
        # parents, names, kinds, executables
        merged_ids = {}
        # {file_id -> revision_id -> inventory entry, for entries in parent
        # trees that are not parents[0]
        parent_entries = {}
        ghost_basis = False
        try:
            revtrees = list(self.repository.revision_trees(self.parents))
        except errors.NoSuchRevision:
            # one or more ghosts, slow path.
            revtrees = []
            for revision_id in self.parents:
                try:
                    revtrees.append(self.repository.revision_tree(revision_id))
                except errors.NoSuchRevision:
                    if not revtrees:
                        basis_revision_id = _mod_revision.NULL_REVISION
                        ghost_basis = True
                    revtrees.append(self.repository.revision_tree(
                        _mod_revision.NULL_REVISION))
        # The basis inventory from a repository
        if revtrees:
            basis_inv = revtrees[0].inventory
        else:
            basis_inv = self.repository.revision_tree(
                _mod_revision.NULL_REVISION).inventory
        if len(self.parents) > 0:
            if basis_revision_id != self.parents[0] and not ghost_basis:
                raise Exception(
                    "arbitrary basis parents not yet supported with merges")
            for revtree in revtrees[1:]:
                for change in revtree.inventory._make_delta(basis_inv):
                    if change[1] is None:
                        # Not present in this parent.
                        continue
                    if change[2] not in merged_ids:
                        if change[0] is not None:
                            basis_entry = basis_inv[change[2]]
                            merged_ids[change[2]] = [
                                # basis revid
                                basis_entry.revision,
                                # new tree revid
                                change[3].revision]
                            parent_entries[change[2]] = {
                                # basis parent
                                basis_entry.revision:basis_entry,
                                # this parent
                                change[3].revision:change[3],
                                }
                        else:
                            merged_ids[change[2]] = [change[3].revision]
                            parent_entries[change[2]] = {change[3].revision:change[3]}
                    else:
                        merged_ids[change[2]].append(change[3].revision)
                        parent_entries[change[2]][change[3].revision] = change[3]
        # Setup the changes from the tree:
        # changes maps file_id -> (change, [parent revision_ids])
        changes = {}
        for change in iter_changes:
            # This probably looks up in basis_inv way too much.
            if change[1][0] is not None:
                head_candidate = [basis_inv[change[0]].revision]
            else:
                head_candidate = []
            changes[change[0]] = change, merged_ids.get(change[0],
                head_candidate)
        unchanged_merged = set(merged_ids) - set(changes)
        # Extend the changes dict with synthetic changes to record merges of
        # texts.
        for file_id in unchanged_merged:
            # Record a merged version of these items that did not change vs the
            # basis. This can be either identical parallel changes, or a revert
            # of a specific file after a merge. The recorded content will be
            # that of the current tree (which is the same as the basis), but
            # the per-file graph will reflect a merge.
            # NB:XXX: We are reconstructing path information we had, this
            # should be preserved instead.
            # inv delta change: (file_id, (path_in_source, path_in_target),
            #   changed_content, versioned, parent, name, kind,
            #   executable)
            try:
                basis_entry = basis_inv[file_id]
            except errors.NoSuchId:
                # a change from basis->some_parents but file_id isn't in basis
                # so was new in the merge, which means it must have changed
                # from basis -> current, and as it hasn't the add was reverted
                # by the user. So we discard this change.
                pass
            else:
                change = (file_id,
                    (basis_inv.id2path(file_id), tree.id2path(file_id)),
                    False, (True, True),
                    (basis_entry.parent_id, basis_entry.parent_id),
                    (basis_entry.name, basis_entry.name),
                    (basis_entry.kind, basis_entry.kind),
                    (basis_entry.executable, basis_entry.executable))
                changes[file_id] = (change, merged_ids[file_id])
        # changes contains tuples with the change and a set of inventory
        # candidates for the file.
        # inv delta is:
        # old_path, new_path, file_id, new_inventory_entry
        seen_root = False # Is the root in the basis delta?
        inv_delta = self._basis_delta
        modified_rev = self._new_revision_id
        for change, head_candidates in changes.values():
            if change[3][1]: # versioned in target.
                # Several things may be happening here:
                # We may have a fork in the per-file graph
                #  - record a change with the content from tree
                # We may have a change against < all trees
                #  - carry over the tree that hasn't changed
                # We may have a change against all trees
                #  - record the change with the content from tree
                kind = change[6][1]
                file_id = change[0]
                entry = _entry_factory[kind](file_id, change[5][1],
                    change[4][1])
                head_set = self._heads(change[0], set(head_candidates))
                heads = []
                # Preserve ordering.
                for head_candidate in head_candidates:
                    if head_candidate in head_set:
                        heads.append(head_candidate)
                        head_set.remove(head_candidate)
                carried_over = False
                if len(heads) == 1:
                    # Could be a carry-over situation:
                    parent_entry_revs = parent_entries.get(file_id, None)
                    if parent_entry_revs:
                        parent_entry = parent_entry_revs.get(heads[0], None)
                    else:
                        parent_entry = None
                    if parent_entry is None:
                        # The parent iter_changes was called against is the one
                        # that is the per-file head, so any change is relevant
                        # iter_changes is valid.
                        carry_over_possible = False
                    else:
                        # could be a carry over situation
                        # A change against the basis may just indicate a merge,
                        # we need to check the content against the source of the
                        # merge to determine if it was changed after the merge
                        # or carried over.
                        if (parent_entry.kind != entry.kind or
                            parent_entry.parent_id != entry.parent_id or
                            parent_entry.name != entry.name):
                            # Metadata common to all entries has changed
                            # against per-file parent
                            carry_over_possible = False
                        else:
                            carry_over_possible = True
                        # per-type checks for changes against the parent_entry
                        # are done below.
                else:
                    # Cannot be a carry-over situation
                    carry_over_possible = False
                # Populate the entry in the delta
                if kind == 'file':
                    # XXX: There is still a small race here: If someone reverts
                    # the content of a file after iter_changes examines and
                    # decides it has changed, we will unconditionally record a
                    # new version even if some other process reverts it while
                    # commit is running (with the revert happening after
                    # iter_changes did its examination).
                    if change[7][1]:
                        entry.executable = True
                    else:
                        entry.executable = False
                    if (carry_over_possible and
                        parent_entry.executable == entry.executable):
                        # Check the file length, content hash after reading
                        # the file.
                        nostore_sha = parent_entry.text_sha1
                    else:
                        nostore_sha = None
                    file_obj, stat_value = tree.get_file_with_stat(file_id, change[1][1])
                    try:
                        lines = file_obj.readlines()
                    finally:
                        file_obj.close()
                    try:
                        entry.text_sha1, entry.text_size = self._add_text_to_weave(
                            file_id, lines, heads, nostore_sha)
                        yield file_id, change[1][1], (entry.text_sha1, stat_value)
                    except errors.ExistingContent:
                        # No content change against a carry_over parent
                        # Perhaps this should also yield a fs hash update?
                        carried_over = True
                        entry.text_size = parent_entry.text_size
                        entry.text_sha1 = parent_entry.text_sha1
                elif kind == 'symlink':
                    entry.symlink_target = tree.get_symlink_target(file_id)
                    if (carry_over_possible and
                        parent_entry.symlink_target == entry.symlink_target):
                        carried_over = True
                    else:
                        self._add_text_to_weave(change[0], [], heads, None)
                elif kind == 'directory':
                    if carry_over_possible:
                        carried_over = True
                    else:
                        # Nothing to set on the entry.
                        # XXX: split into the Root and nonRoot versions.
                        if change[1][1] != '' or self.repository.supports_rich_root():
                            self._add_text_to_weave(change[0], [], heads, None)
                elif kind == 'tree-reference':
                    if not self.repository._format.supports_tree_reference:
                        # This isn't quite sane as an error, but we shouldn't
                        # ever see this code path in practice: trees don't
                        # permit references when the repo doesn't support tree
                        # references.
                        raise errors.UnsupportedOperation(tree.add_reference,
                            self.repository)
                    reference_revision = tree.get_reference_revision(change[0])
                    entry.reference_revision = reference_revision
                    if (carry_over_possible and
                        parent_entry.reference_revision == reference_revision):
                        carried_over = True
                    else:
                        self._add_text_to_weave(change[0], [], heads, None)
                else:
                    raise AssertionError('unknown kind %r' % kind)
                if not carried_over:
                    entry.revision = modified_rev
                else:
                    entry.revision = parent_entry.revision
            else:
                entry = None
            new_path = change[1][1]
            inv_delta.append((change[1][0], new_path, change[0], entry))
            if new_path == '':
                seen_root = True
        self.new_inventory = None
        if len(inv_delta):
            self._any_changes = True
        if not seen_root:
            # housekeeping root entry changes do not affect no-change commits.
            self._require_root_change(tree)
        self.basis_delta_revision = basis_revision_id

    def _add_text_to_weave(self, file_id, new_lines, parents, nostore_sha):
        # Note: as we read the content directly from the tree, we know it's not
        # been turned into unicode or badly split - but a broken tree
        # implementation could give us bad output from readlines() so this is
        # not a guarantee of safety. What would be better is always checking
        # the content during test suite execution. RBC 20070912
        parent_keys = tuple((file_id, parent) for parent in parents)
        return self.repository.texts.add_lines(
            (file_id, self._new_revision_id), parent_keys, new_lines,
            nostore_sha=nostore_sha, random_id=self.random_revid,
            check_content=False)[0:2]


class RootCommitBuilder(CommitBuilder):
    """This commitbuilder actually records the root id"""

    # the root entry gets versioned properly by this builder.
    _versioned_root = True

    def _check_root(self, ie, parent_invs, tree):
        """Helper for record_entry_contents.

        :param ie: An entry being added.
        :param parent_invs: The inventories of the parent revisions of the
            commit.
        :param tree: The tree that is being committed.
        """

    def _require_root_change(self, tree):
        """Enforce an appropriate root object change.

        This is called once when record_iter_changes is called, if and only if
        the root was not in the delta calculated by record_iter_changes.

        :param tree: The tree which is being committed.
        """
        # versioned roots do not change unless the tree found a change.


######################################################################
# Repositories


class Repository(object):
    """Repository holding history for one or more branches.

    The repository holds and retrieves historical information including
    revisions and file history. It's normally accessed only by the Branch,
    which views a particular line of development through that history.

    The Repository builds on top of some byte storage facilities (the
    revisions, signatures, inventories and texts attributes) and a Transport,
    which respectively provide byte storage and a means to access the
    (possibly remote) disk.

    The byte storage facilities are addressed via tuples, which we refer to
    as 'keys' throughout the code base. Revision_keys, inventory_keys and
    signature_keys are all 1-tuples: (revision_id,). text_keys are two-tuples:
    (file_id, revision_id). We use this interface because it allows low
    friction with the underlying code that implements disk indices, network
    encoding and other parts of bzrlib.
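
    For example (illustrative, following the tuple shapes above)::

        revision_key = ('rev-id-1',)
        text_key = ('file-id-1', 'rev-id-1')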

    :ivar revisions: A bzrlib.versionedfile.VersionedFiles instance containing
        the serialised revisions for the repository. This can be used to obtain
        revision graph information or to access raw serialised revisions.
        The result of trying to insert data into the repository via this store
        is undefined: it should be considered read-only except for implementors
        of repositories.
    :ivar signatures: A bzrlib.versionedfile.VersionedFiles instance containing
        the serialised signatures for the repository. This can be used to
        obtain access to raw serialised signatures. The result of trying to
        insert data into the repository via this store is undefined: it should
        be considered read-only except for implementors of repositories.
    :ivar inventories: A bzrlib.versionedfile.VersionedFiles instance containing
        the serialised inventories for the repository. This can be used to
        obtain unserialised inventories. The result of trying to insert data
        into the repository via this store is undefined: it should be
        considered read-only except for implementors of repositories.
    :ivar texts: A bzrlib.versionedfile.VersionedFiles instance containing the
        texts of files and directories for the repository. This can be used to
        obtain file texts or file graphs. Note that Repository.iter_file_bytes
        is usually a better interface for accessing file texts.
        The result of trying to insert data into the repository via this store
        is undefined: it should be considered read-only except for implementors
        of repositories.
    :ivar _transport: Transport for file access to repository, typically
        pointing to .bzr/repository.
    """

    # What class to use for a CommitBuilder. Often it's simpler to change this
    # in a Repository class subclass rather than to override
    # get_commit_builder.
    _commit_builder_class = CommitBuilder
    # The search regex used by xml based repositories to determine what things
    # were changed in a single commit.
    _file_ids_altered_regex = lazy_regex.lazy_compile(
        r'file_id="(?P<file_id>[^"]+)"'
        r'.* revision="(?P<revision_id>[^"]+)"'
        )
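
    # For example (illustrative): an xml inventory line such as
    #   <file file_id="foo-id" name="foo" revision="rev-1"/>
    # matches with groups file_id='foo-id' and revision_id='rev-1'.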

    def abort_write_group(self, suppress_errors=False):
        """Abort the contents accrued within the current write group.

        :param suppress_errors: if true, abort_write_group will catch and log
            unexpected errors that happen during the abort, rather than
            allowing them to propagate. Defaults to False.

        :seealso: start_write_group.
        """
        if self._write_group is not self.get_transaction():
            # has an unlock or relock occurred ?
            raise errors.BzrError('mismatched lock context and write group.')
        try:
            self._abort_write_group()
        except Exception, exc:
            self._write_group = None
            if not suppress_errors:
                raise
            mutter('abort_write_group failed')
            log_exception_quietly()
            note('bzr: ERROR (ignored): %s', exc)
        self._write_group = None

    def _abort_write_group(self):
        """Template method for per-repository write group cleanup.

        This is called during abort before the write group is considered to be
        finished and should cleanup any internal state accrued during the write
        group. There is no requirement that data handed to the repository be
        *not* made available - this is not a rollback - but neither should any
        attempt be made to ensure that data added is fully committed. Abort is
        invoked when an error has occurred so further disk or network operations
        may not be possible or may error and if possible should not be
        attempted.
        """

    def add_fallback_repository(self, repository):
        """Add a repository to use for looking up data not held locally.

        :param repository: A repository.
        """
        if not self._format.supports_external_lookups:
            raise errors.UnstackableRepositoryFormat(self._format, self.base)
        self._check_fallback_repository(repository)
        self._fallback_repositories.append(repository)
        self.texts.add_fallback_versioned_files(repository.texts)
        self.inventories.add_fallback_versioned_files(repository.inventories)
        self.revisions.add_fallback_versioned_files(repository.revisions)
        self.signatures.add_fallback_versioned_files(repository.signatures)

    def _check_fallback_repository(self, repository):
        """Check that this repository can fallback to repository safely.

        Raise an error if not.

        :param repository: A repository to fallback to.
        """
        return InterRepository._assert_same_model(self, repository)

    def add_inventory(self, revision_id, inv, parents):
        """Add the inventory inv to the repository as revision_id.

        :param parents: The revision ids of the parents that revision_id
                        is known to have and are in the repository already.

        :returns: The validator (which is a sha1 digest, though what is sha'd
            is repository format specific) of the serialized inventory.
        """
        if not self.is_in_write_group():
            raise AssertionError("%r not in write group" % (self,))
        _mod_revision.check_not_reserved_id(revision_id)
        if not (inv.revision_id is None or inv.revision_id == revision_id):
            raise AssertionError(
                "Mismatch between inventory revision"
                " id and insertion revid (%r, %r)"
                % (inv.revision_id, revision_id))
        if inv.root is None:
            raise AssertionError()
        inv_lines = self._serialise_inventory_to_lines(inv)
        return self._inventory_add_lines(revision_id, parents,
            inv_lines, check_content=False)

    def add_inventory_by_delta(self, basis_revision_id, delta, new_revision_id,
                               parents):
        """Add a new inventory expressed as a delta against another revision.

        :param basis_revision_id: The inventory id the delta was created
            against. (This does not have to be a direct parent.)
        :param delta: The inventory delta (see Inventory.apply_delta for
            details.)
        :param new_revision_id: The revision id that the inventory is being
            added for.
        :param parents: The revision ids of the parents that revision_id is
            known to have and are in the repository already. These are supplied
            for repositories that depend on the inventory graph for revision
            graph access, as well as for those that pun ancestry with delta
            compression.

        :returns: (validator, new_inv)
            The validator (which is a sha1 digest, though what is sha'd is
            repository format specific) of the serialized inventory, and the
            resulting inventory.
        """
        if not self.is_in_write_group():
            raise AssertionError("%r not in write group" % (self,))
        _mod_revision.check_not_reserved_id(new_revision_id)
        basis_tree = self.revision_tree(basis_revision_id)
        basis_tree.lock_read()
        try:
            # Note that this mutates the inventory of basis_tree, which not all
            # inventory implementations may support: A better idiom would be to
            # return a new inventory, but as there is no revision tree cache in
            # repository this is safe for now - RBC 20081013
            basis_inv = basis_tree.inventory
            basis_inv.apply_delta(delta)
            basis_inv.revision_id = new_revision_id
            return (self.add_inventory(new_revision_id, basis_inv, parents),
                    basis_inv)
        finally:
            basis_tree.unlock()

    def _inventory_add_lines(self, revision_id, parents, lines,
        check_content=True):
        """Store lines in inv_vf and return the sha1 of the inventory."""
        parents = [(parent,) for parent in parents]
        return self.inventories.add_lines((revision_id,), parents, lines,
            check_content=check_content)[0]

    def add_revision(self, revision_id, rev, inv=None, config=None):
        """Add rev to the revision store as revision_id."""

        dest_repo = a_bzrdir.open_repository()
        return dest_repo

    def _get_sink(self):
        """Return a sink for streaming into this repository."""
        return StreamSink(self)

    def _get_source(self, to_format):
        """Return a source for streaming from this repository."""
        return StreamSource(self, to_format)

    @needs_read_lock
    def has_revision(self, revision_id):
        """True if this repository has a copy of the revision."""
        return revision_id in self.has_revisions((revision_id,))

    @needs_read_lock
    def has_revisions(self, revision_ids):
        """Probe to find out the presence of multiple revisions.

        :param revision_ids: An iterable of revision_ids.
        :return: A set of the revision_ids that were present.
        """
        parent_map = self.revisions.get_parent_map(
            [(rev_id,) for rev_id in revision_ids])
        result = set()
        if _mod_revision.NULL_REVISION in revision_ids:
            result.add(_mod_revision.NULL_REVISION)
        result.update([key[0] for key in parent_map])
        return result
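
    # Illustrative usage (assumed revision ids): probing several revisions at
    # once, where 'ghost-rev' is absent from the repository:
    #
    #   present = repo.has_revisions(['rev-1', 'ghost-rev'])
    #   # -> set(['rev-1'])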

    @needs_read_lock
    def get_revision(self, revision_id):
        """Return the Revision object for a named revision."""
        return self.get_revisions([revision_id])[0]

    @needs_read_lock
    def get_revision_reconcile(self, revision_id):
        """'reconcile' helper routine that allows access to a revision always.

        This variant of get_revision does not cross check the weave graph
        against the revision one as get_revision does: but it should only
        be used by reconcile, or reconcile-alike commands that are correcting
        or testing the revision graph.
        """
        return self._get_revisions([revision_id])[0]

    @needs_read_lock
    def get_revisions(self, revision_ids):
        """Get many revisions at once."""
        return self._get_revisions(revision_ids)

    @needs_read_lock
    def _get_revisions(self, revision_ids):
        """Core work logic to get many revisions without sanity checks."""
        for rev_id in revision_ids:
            if not rev_id or not isinstance(rev_id, basestring):
                raise errors.InvalidRevisionId(revision_id=rev_id, branch=self)
        keys = [(key,) for key in revision_ids]
        stream = self.revisions.get_record_stream(keys, 'unordered', True)
        revs = {}
        for record in stream:
            if record.storage_kind == 'absent':
                raise errors.NoSuchRevision(self, record.key[0])
            text = record.get_bytes_as('fulltext')
            rev = self._serializer.read_revision_from_string(text)
            revs[record.key[0]] = rev
        return [revs[revid] for revid in revision_ids]

    @needs_read_lock
    def get_revision_xml(self, revision_id):
        # TODO: jam 20070210 This shouldn't be necessary since get_revision
        #       would have already done it.
        # TODO: jam 20070210 Just use _serializer.write_revision_to_string()
        # TODO: this can't just be replaced by:
        # return self._serializer.write_revision_to_string(
        #     self.get_revision(revision_id))
        # as cStringIO preserves the encoding unlike write_revision_to_string
        # or some other call down the path.
        rev = self.get_revision(revision_id)
        rev_tmp = cStringIO.StringIO()
        # the current serializer..
        self._serializer.write_revision(rev, rev_tmp)
        rev_tmp.seek(0)
        return rev_tmp.getvalue()

    def get_deltas_for_revisions(self, revisions, specific_fileids=None):
"""Produce a generator of revision deltas.
1657
493
Note that the input is a sequence of REVISIONS, not revision_ids.
1658
494
Trees will be held in memory until the generator exits.
1659
495
Each delta is relative to the revision's lefthand predecessor.
1661
:param specific_fileids: if not None, the result is filtered
1662
so that only those file-ids, their parents and their
1663
children are included.
1665
# Get the revision-ids of interest
1666
497
required_trees = set()
1667
498
for revision in revisions:
1668
499
required_trees.add(revision.revision_id)
1669
500
required_trees.update(revision.parent_ids[:1])
1671
# Get the matching filtered trees. Note that it's more
1672
# efficient to pass filtered trees to changes_from() rather
1673
# than doing the filtering afterwards. changes_from() could
1674
# arguably do the filtering itself but it's path-based, not
1675
# file-id based, so filtering before or afterwards is
1677
if specific_fileids is None:
1678
trees = dict((t.get_revision_id(), t) for
1679
t in self.revision_trees(required_trees))
1681
trees = dict((t.get_revision_id(), t) for
1682
t in self._filtered_revision_trees(required_trees,
1685
# Calculate the deltas
501
trees = dict((t.get_revision_id(), t) for
502
t in self.revision_trees(required_trees))
1686
503
for revision in revisions:
1687
504
if not revision.parent_ids:
1688
old_tree = self.revision_tree(_mod_revision.NULL_REVISION)
505
old_tree = self.revision_tree(None)
1690
507
old_tree = trees[revision.parent_ids[0]]
1691
508
yield trees[revision.revision_id].changes_from(old_tree)

    @needs_read_lock
    def get_revision_delta(self, revision_id, specific_fileids=None):
        """Return the delta for one revision.

        The delta is relative to the left-hand predecessor of the
        revision.

        :param specific_fileids: if not None, the result is filtered
            so that only those file-ids, their parents and their
            children are included.
        """
        r = self.get_revision(revision_id)
        return list(self.get_deltas_for_revisions([r],
            specific_fileids=specific_fileids))[0]

    @needs_write_lock
    def store_revision_signature(self, gpg_strategy, plaintext, revision_id):
        signature = gpg_strategy.sign(plaintext)
        self.add_signature_text(revision_id, signature)

    @needs_write_lock
    def add_signature_text(self, revision_id, signature):
        self.signatures.add_lines((revision_id,), (),
            osutils.split_lines(signature))

    def find_text_key_references(self):
        """Find the text key references within the repository.

        :return: A dictionary mapping text keys ((fileid, revision_id) tuples)
            to whether they were referred to by the inventory of the
            revision_id that they contain. The inventory texts from all present
            revision ids are assessed to generate this report.
        """
        revision_keys = self.revisions.keys()
        w = self.inventories
        pb = ui.ui_factory.nested_progress_bar()
        try:
            return self._find_text_key_references_from_xml_inventory_lines(
                w.iter_lines_added_or_present_in_keys(revision_keys, pb=pb))
        finally:
            pb.finished()

    def _find_text_key_references_from_xml_inventory_lines(self,
        line_iterator):
        """Core routine for extracting references to texts from inventories.

        This performs the translation of xml lines to revision ids.

        :param line_iterator: An iterator of lines, origin_version_id
        :return: A dictionary mapping text keys ((fileid, revision_id) tuples)
            to whether they were referred to by the inventory of the
            revision_id that they contain. Note that if that revision_id was
            not part of the line_iterator's output then False will be given -
            even though it may actually refer to that key.
        """
        if not self._serializer.support_altered_by_hack:
            raise AssertionError(
                "_find_text_key_references_from_xml_inventory_lines only "
                "supported for branches which store inventory as unnested xml"
                ", not on %r" % self)
        result = {}

        # this code needs to read every new line in every inventory for the
        # inventories [revision_ids]. Seeing a line twice is ok. Seeing a line
        # not present in one of those inventories is unnecessary but not
        # harmful because we are filtering by the revision id marker in the
        # inventory lines : we only select file ids altered in one of those
        # revisions. We don't need to see all lines in the inventory because
        # only those added in an inventory in rev X can contain a revision=X
        # line.
        unescape_revid_cache = {}
        unescape_fileid_cache = {}

        # Move several functions to be local variables, since this is a loop
        # which is run a lot.
        search = self._file_ids_altered_regex.search
        unescape = _unescape_xml
        setdefault = result.setdefault
        for line, line_key in line_iterator:
            match = search(line)
            if match is None:
                continue
            # One call to match.group() returning multiple items is quite a
            # bit faster than 2 calls to match.group() each returning 1
            file_id, revision_id = match.group('file_id', 'revision_id')

            # Inlining the cache lookups helps a lot when you make 170,000
            # lines and 350k ids, versus 8.4 unique ids.
            # Using a cache helps in 2 ways:
            #   1) Avoids unnecessary decoding calls
            #   2) Re-uses cached strings, which helps in future set and
            #      equality checks.
            # (2) is enough that removing encoding entirely along with
            # the cache (so we are using plain strings) results in no
            # performance improvement.
            try:
                revision_id = unescape_revid_cache[revision_id]
            except KeyError:
                unescaped = unescape(revision_id)
                unescape_revid_cache[revision_id] = unescaped
                revision_id = unescaped

            # Note that unconditionally unescaping means that we deserialise
            # every fileid, which for general 'pull' is not great, but we don't
            # really want to have so many fulltexts that this matters anyway.
            # RBC 20071114.
            try:
                file_id = unescape_fileid_cache[file_id]
            except KeyError:
                unescaped = unescape(file_id)
                unescape_fileid_cache[file_id] = unescaped
                file_id = unescaped

            key = (file_id, revision_id)
            setdefault(key, False)
            if revision_id == line_key[-1]:
                result[key] = True
        return result

    def _inventory_xml_lines_for_keys(self, keys):
        """Get a line iterator of the sort needed for finding references.

        Not relevant for non-xml inventory repositories.

        Ghosts in revision_keys are ignored.

        :param revision_keys: The revision keys for the inventories to inspect.
        :return: An iterator over (inventory line, revid) for the fulltexts of
            all of the xml inventories specified by revision_keys.
        """
        stream = self.inventories.get_record_stream(keys, 'unordered', True)
        for record in stream:
            if record.storage_kind != 'absent':
                chunks = record.get_bytes_as('chunked')
                revid = record.key[-1]
                lines = osutils.chunks_to_lines(chunks)
                for line in lines:
                    yield line, revid

    def _find_file_ids_from_xml_inventory_lines(self, line_iterator,
        revision_ids):
        """Helper routine for fileids_altered_by_revision_ids.

        This performs the translation of xml lines to revision ids.

        :param line_iterator: An iterator of lines, origin_version_id
        :param revision_ids: The revision ids to filter for. This should be a
            set or other type which supports efficient __contains__ lookups, as
            the revision id from each parsed line will be looked up in the
            revision_ids filter.
        :return: a dictionary mapping altered file-ids to an iterable of
            revision_ids. Each altered file-id has the exact revision_ids that
            altered it listed explicitly.
        """
        seen = set(self._find_text_key_references_from_xml_inventory_lines(
                line_iterator).iterkeys())
        # Note that revision_ids are revision keys.
        parent_maps = self.revisions.get_parent_map(revision_ids)
        parents = set()
        map(parents.update, parent_maps.itervalues())
        parents.difference_update(revision_ids)
        parent_seen = set(self._find_text_key_references_from_xml_inventory_lines(
            self._inventory_xml_lines_for_keys(parents)))
        new_keys = seen - parent_seen
        result = {}
        setdefault = result.setdefault
        for key in new_keys:
            setdefault(key[0], set()).add(key[-1])
        return result

    def fileids_altered_by_revision_ids(self, revision_ids, _inv_weave=None):
        """Find the file ids and versions affected by revisions.

        :param revisions: an iterable containing revision ids.
        :param _inv_weave: The inventory weave from this repository or None.
            If None, the inventory weave will be opened automatically.
        :return: a dictionary mapping altered file-ids to an iterable of
            revision_ids. Each altered file-id has the exact revision_ids that
            altered it listed explicitly.
        """
        selected_keys = set((revid,) for revid in revision_ids)
        w = _inv_weave or self.inventories
        pb = ui.ui_factory.nested_progress_bar()
        try:
            return self._find_file_ids_from_xml_inventory_lines(
                w.iter_lines_added_or_present_in_keys(
                    selected_keys, pb=pb),
                selected_keys)
        finally:
            pb.finished()

    def iter_files_bytes(self, desired_files):
        """Iterate through file versions.

        Files will not necessarily be returned in the order they occur in
        desired_files. No specific order is guaranteed.

        Yields pairs of identifier, bytes_iterator. identifier is an opaque
        value supplied by the caller as part of desired_files. It should
        uniquely identify the file version in the caller's context. (Examples:
        an index number or a TreeTransform trans_id.)

        bytes_iterator is an iterable of bytestrings for the file. The
        kind of iterable and length of the bytestrings are unspecified, but for
        this implementation, it is a list of bytes produced by
        VersionedFile.get_record_stream().

        :param desired_files: a list of (file_id, revision_id, identifier)
            triples
        """
        text_keys = {}
        for file_id, revision_id, callable_data in desired_files:
            text_keys[(file_id, revision_id)] = callable_data
        for record in self.texts.get_record_stream(text_keys, 'unordered', True):
            if record.storage_kind == 'absent':
                raise errors.RevisionNotPresent(record.key, self)
            yield text_keys[record.key], record.get_bytes_as('chunked')
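
    # Illustrative usage (assumed file and revision ids): fetch two file
    # texts, keyed by an opaque identifier chosen by the caller:
    #
    #   desired_files = [('file-id-1', 'rev-1', 'id-a'),
    #                    ('file-id-2', 'rev-1', 'id-b')]
    #   for identifier, chunks in repo.iter_files_bytes(desired_files):
    #       text = ''.join(chunks)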

    def _generate_text_key_index(self, text_key_references=None,
        ancestors=None):
        """Generate a new text key index for the repository.

        This is an expensive function that will take considerable time to run.

        :return: A dict mapping text keys ((file_id, revision_id) tuples) to a
            list of parents, also text keys. When a given key has no parents,
            the parents list will be [NULL_REVISION].
        """
        # All revisions, to find inventory parents.
        if ancestors is None:
            graph = self.get_graph()
            ancestors = graph.get_parent_map(self.all_revision_ids())
        if text_key_references is None:
            text_key_references = self.find_text_key_references()
        pb = ui.ui_factory.nested_progress_bar()
        try:
            return self._do_generate_text_key_index(ancestors,
                text_key_references, pb)
        finally:
            pb.finished()
    def _do_generate_text_key_index(self, ancestors, text_key_references, pb):
        """Helper for _generate_text_key_index to avoid deep nesting."""
        revision_order = tsort.topo_sort(ancestors)
        invalid_keys = set()
        revision_keys = {}
        for revision_id in revision_order:
            revision_keys[revision_id] = set()
        text_count = len(text_key_references)
        # a cache of the text keys to allow reuse; costs a dict of all the
        # keys, but saves a 2-tuple for every child of a given key.
        text_key_cache = {}
        for text_key, valid in text_key_references.iteritems():
            if not valid:
                invalid_keys.add(text_key)
            else:
                revision_keys[text_key[1]].add(text_key)
            text_key_cache[text_key] = text_key
        del text_key_references
        text_index = {}
        text_graph = graph.Graph(graph.DictParentsProvider(text_index))
        NULL_REVISION = _mod_revision.NULL_REVISION
        # Set a cache with a size of 10 - this suffices for bzr.dev but may be
        # too small for large or very branchy trees. However, for 55K path
        # trees, it would be easy to use too much memory trivially. Ideally we
        # could gauge this by looking at available real memory etc, but this is
        # always a tricky proposition.
        inventory_cache = lru_cache.LRUCache(10)
        batch_size = 10 # should be ~150MB on a 55K path tree
        batch_count = len(revision_order) / batch_size + 1
        processed_texts = 0
        pb.update("Calculating text parents", processed_texts, text_count)
        for offset in xrange(batch_count):
            to_query = revision_order[offset * batch_size:(offset + 1) *
                batch_size]
            if not to_query:
                break
            for rev_tree in self.revision_trees(to_query):
                revision_id = rev_tree.get_revision_id()
                parent_ids = ancestors[revision_id]
                for text_key in revision_keys[revision_id]:
                    pb.update("Calculating text parents", processed_texts)
                    processed_texts += 1
                    candidate_parents = []
                    for parent_id in parent_ids:
                        parent_text_key = (text_key[0], parent_id)
                        try:
                            check_parent = parent_text_key not in \
                                revision_keys[parent_id]
                        except KeyError:
                            # the parent parent_id is a ghost:
                            check_parent = False
                            # truncate the derived graph against this ghost.
                            parent_text_key = None
                        if check_parent:
                            # look at the parent commit details inventories to
                            # determine possible candidates in the per file graph.
                            try:
                                inv = inventory_cache[parent_id]
                            except KeyError:
                                inv = self.revision_tree(parent_id).inventory
                                inventory_cache[parent_id] = inv
                            parent_entry = inv._byid.get(text_key[0], None)
                            if parent_entry is not None:
                                parent_text_key = (
                                    text_key[0], parent_entry.revision)
                            else:
                                parent_text_key = None
                        if parent_text_key is not None:
                            candidate_parents.append(
                                text_key_cache[parent_text_key])
                    parent_heads = text_graph.heads(candidate_parents)
                    new_parents = list(parent_heads)
                    new_parents.sort(key=lambda x:candidate_parents.index(x))
                    if new_parents == []:
                        new_parents = [NULL_REVISION]
                    text_index[text_key] = new_parents
        for text_key in invalid_keys:
            text_index[text_key] = [NULL_REVISION]
        return text_index
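    # Shape sketch (illustrative, not from the original source): the computed
    # index maps (file_id, revision_id) text keys to their per-file parent
    # keys, for example:
    #
    #   {('f-id', 'rev-2'): [('f-id', 'rev-1')],
    #    ('f-id', 'rev-1'): [NULL_REVISION]}
    #
    # Keys that no inventory references are truncated to [NULL_REVISION].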
    def item_keys_introduced_by(self, revision_ids, _files_pb=None):
        """Get an iterable listing the keys of all the data introduced by a set
        of revision IDs.

        The keys will be ordered so that the corresponding items can be safely
        fetched and inserted in that order.

        :returns: An iterable producing tuples of (knit-kind, file-id,
            versions).  knit-kind is one of 'file', 'inventory', 'signatures',
            'revisions'.  file-id is None unless knit-kind is 'file'.
        """
        # XXX: it's a bit weird to control the inventory weave caching in this
        # generator. Ideally the caching would be done in fetch.py I think. Or
        # maybe this generator should explicitly have the contract that it
        # should not be iterated until the previously yielded item has been
        # processed.
        inv_w = self.inventories

        # file ids that changed
        file_ids = self.fileids_altered_by_revision_ids(revision_ids, inv_w)
        count = 0
        num_file_ids = len(file_ids)
        for file_id, altered_versions in file_ids.iteritems():
            if _files_pb is not None:
                _files_pb.update("fetch texts", count, num_file_ids)
            count += 1
            yield ("file", file_id, altered_versions)
        # We're done with the files_pb. Note that it finished by the caller,
        # just as it was created by the caller.
        del _files_pb

        # inventory
        yield ("inventory", None, revision_ids)

        # signatures
        # XXX: Note ATM no callers actually pay attention to this return
        #      instead they just use the list of revision ids and ignore
        #      missing sigs. Consider removing this work entirely
        revisions_with_signatures = set(self.signatures.get_parent_map(
            [(r,) for r in revision_ids]))
        revisions_with_signatures = set(
            [r for (r,) in revisions_with_signatures])
        revisions_with_signatures.intersection_update(revision_ids)
        yield ("signatures", None, revisions_with_signatures)

        # revisions
        yield ("revisions", None, revision_ids)
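    # Consumption sketch (illustrative only; `source_repo` and the revision
    # ids are assumptions): a fetcher could drive the generator like this,
    # copying items in exactly the yielded order:
    #
    #   for knit_kind, file_id, versions in source_repo.item_keys_introduced_by(
    #           ['rev-1', 'rev-2']):
    #       if knit_kind == 'file':
    #           pass # copy the texts in `versions` for `file_id`
    #       else:
    #           pass # 'inventory', then 'signatures', then 'revisions'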
    @needs_read_lock
    def get_inventory(self, revision_id):
        """Get Inventory object by revision id."""
        return self.iter_inventories([revision_id]).next()
    def iter_inventories(self, revision_ids):
        """Get many inventories by revision_ids.

        This will buffer some or all of the texts used in constructing the
        inventories in memory, but will only parse a single inventory at a
        time.

        :param revision_ids: The expected revision ids of the inventories.
        :return: An iterator of inventories.
        """
        if ((None in revision_ids)
            or (_mod_revision.NULL_REVISION in revision_ids)):
            raise ValueError('cannot get null revision inventory')
        return self._iter_inventories(revision_ids)

    def _iter_inventories(self, revision_ids):
        """single-document based inventory iteration."""
        for text, revision_id in self._iter_inventory_xmls(revision_ids):
            yield self.deserialise_inventory(revision_id, text)

    def _iter_inventory_xmls(self, revision_ids):
        keys = [(revision_id,) for revision_id in revision_ids]
        stream = self.inventories.get_record_stream(keys, 'unordered', True)
        text_chunks = {}
        for record in stream:
            if record.storage_kind != 'absent':
                text_chunks[record.key] = record.get_bytes_as('chunked')
            else:
                raise errors.NoSuchRevision(self, record.key)
        for key in keys:
            chunks = text_chunks.pop(key)
            yield ''.join(chunks), key[-1]
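    # Usage sketch (illustrative, assuming `repo` is read-locked and both
    # revisions exist); None or NULL_REVISION entries raise ValueError before
    # any parsing happens:
    #
    #   for inv in repo.iter_inventories(['rev-1', 'rev-2']):
    #       print inv.revision_id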
    def deserialise_inventory(self, revision_id, xml):
        """Transform the xml into an inventory object.

        :param revision_id: The expected revision id of the inventory.
        :param xml: A serialised inventory.
        """
        result = self._serializer.read_inventory_from_string(xml, revision_id,
                    entry_cache=self._inventory_entry_cache)
        if result.revision_id != revision_id:
            raise AssertionError('revision id mismatch %s != %s' % (
                result.revision_id, revision_id))
        return result
    def serialise_inventory(self, inv):
        return self._serializer.write_inventory_to_string(inv)

    def _serialise_inventory_to_lines(self, inv):
        return self._serializer.write_inventory_to_lines(inv)

    def get_serializer_format(self):
        return self._serializer.format_num
    @needs_read_lock
    def get_inventory_xml(self, revision_id):
        """Get inventory XML as a string."""
        texts = self._iter_inventory_xmls([revision_id])
        try:
            text, revision_id = texts.next()
        except StopIteration:
            raise errors.HistoryMissing(self, 'inventory', revision_id)
        return text
    @needs_read_lock
    def get_inventory_sha1(self, revision_id):
        """Return the sha1 hash of the inventory entry
        """
        return self.get_revision(revision_id).inventory_sha1
    def iter_reverse_revision_history(self, revision_id):
        """Iterate backwards through revision ids in the lefthand history

        :param revision_id: The revision id to start with.  All its lefthand
            ancestors will be traversed.
        """
        graph = self.get_graph()
        next_id = revision_id
        while True:
            if next_id in (None, _mod_revision.NULL_REVISION):
                return
            yield next_id
            # Note: The following line may raise KeyError in the event of
            # truncated history. We decided not to have a try:except:raise
            # RevisionNotPresent here until we see a use for it, because of the
            # cost in an inner loop that is by its very nature O(history).
            # Robert Collins 20080326
            parents = graph.get_parent_map([next_id])[next_id]
            if len(parents) == 0:
                return
            else:
                next_id = parents[0]
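    # Walk sketch (illustrative): starting from an assumed tip 'rev-3' whose
    # lefthand ancestry is rev-1 <- rev-2 <- rev-3, this yields
    # 'rev-3', 'rev-2', 'rev-1' and stops at the revision with no parents:
    #
    #   history = list(repo.iter_reverse_revision_history('rev-3'))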
        reconciler.reconcile()
        return reconciler
    def _refresh_data(self):
        """Helper called from lock_* to ensure coherency with disk.

        The default implementation does nothing; it is however possible
        for repositories to maintain loaded indices across multiple locks
        by checking inside their implementation of this method to see
        whether their indices are still valid. This depends of course on
        the disk format being validatable in this manner. This method is
        also called by the refresh_data() public interface to cause a refresh
        to occur while in a write lock so that data inserted by a smart server
        push operation is visible on the client's instance of the physical
        repository.
        """
    @needs_read_lock
    def revision_tree(self, revision_id):
        """Return Tree for a revision on this branch.

        `revision_id` may be NULL_REVISION for the empty tree revision.
        """
        revision_id = _mod_revision.ensure_null(revision_id)
        # TODO: refactor this to use an existing revision object
        # so we don't need to read it in twice.
        if revision_id == _mod_revision.NULL_REVISION:
            return RevisionTree(self, Inventory(root_id=None),
                                _mod_revision.NULL_REVISION)
        else:
            inv = self.get_revision_inventory(revision_id)
            return RevisionTree(self, inv, revision_id)
    def revision_trees(self, revision_ids):
        """Return Trees for revisions in this repository.

        :param revision_ids: a sequence of revision-ids;
          a revision-id may not be None or 'null:'
        """
        inventories = self.iter_inventories(revision_ids)
        for inv in inventories:
            yield RevisionTree(self, inv, inv.revision_id)
    def _filtered_revision_trees(self, revision_ids, file_ids):
        """Return Tree for a revision on this branch with only some files.

        :param revision_ids: a sequence of revision-ids;
          a revision-id may not be None or 'null:'
        :param file_ids: if not None, the result is filtered
          so that only those file-ids, their parents and their
          children are included.
        """
        inventories = self.iter_inventories(revision_ids)
        for inv in inventories:
            # Should we introduce a FilteredRevisionTree class rather
            # than pre-filter the inventory here?
            filtered_inv = inv.filter(file_ids)
            yield RevisionTree(self, filtered_inv, filtered_inv.revision_id)
"""Return Tree for a revision on this branch.
812
`revision_id` may not be None or 'null:'"""
813
assert None not in revision_ids
814
assert _mod_revision.NULL_REVISION not in revision_ids
815
texts = self.get_inventory_weave().get_texts(revision_ids)
816
for text, revision_id in zip(texts, revision_ids):
817
inv = self.deserialise_inventory(revision_id, text)
818
yield RevisionTree(self, inv, revision_id)
2250
820
    @needs_read_lock
    def get_ancestry(self, revision_id, topo_sorted=True):
        """Return a list of revision-ids integrated by a revision.

        The first element of the list is always None, indicating the origin
        revision.  This might change when we have history horizons, or
        perhaps we should have a new API.

        This is topologically sorted.
        """
        if _mod_revision.is_null(revision_id):
            return [None]
        if not self.has_revision(revision_id):
            raise errors.NoSuchRevision(self, revision_id)
        graph = self.get_graph()
        keys = set()
        search = graph._make_breadth_first_searcher([revision_id])
        while True:
            try:
                found, ghosts = search.next_with_ghosts()
            except StopIteration:
                break
            keys.update(found)
        if _mod_revision.NULL_REVISION in keys:
            keys.remove(_mod_revision.NULL_REVISION)
        if topo_sorted:
            parent_map = graph.get_parent_map(keys)
            keys = tsort.topo_sort(parent_map)
        return [None] + list(keys)
"""Compress the data within the repository.
2283
This operation only makes sense for some repository types. For other
2284
types it should be a no-op that just returns.
2286
This stub method does not require a lock, but subclasses should use
2287
@needs_write_lock as this is a long running call its reasonable to
2288
implicitly lock for the user.
835
w = self.get_inventory_weave()
836
candidates = w.get_ancestry(revision_id)
837
return [None] + candidates # self._eliminate_revisions_not_present(candidates)
840
    @needs_read_lock
    def print_file(self, file, revision_id):
        """Print `file` to stdout.

        FIXME RBC 20060125 as John Meinel points out this is a bad api
        - it writes to stdout, it assumes that that is valid etc. Fix
        by creating a new more flexible convenience function.
        """
        tree = self.revision_tree(revision_id)
        # use inventory as it was in that revision
        file_id = tree.inventory.path2id(file)
        if not file_id:
            # TODO: jam 20060427 Write a test for this code path
            #       it had a bug in it, and was raising the wrong
            #       exception.
            raise errors.BzrError("%r is not present in revision %s" % (file, revision_id))
        tree.print_file(file_id)
    def get_transaction(self):
        return self.control_files.get_transaction()
    def get_parent_map(self, revision_ids):
        """See graph._StackedParentsProvider.get_parent_map"""
        # revisions index works in keys; this just works in revisions
        # therefore wrap and unwrap
        query_keys = []
        result = {}
        for revision_id in revision_ids:
            if revision_id == _mod_revision.NULL_REVISION:
                result[revision_id] = ()
            elif revision_id is None:
                raise ValueError('get_parent_map(None) is not valid')
            else:
                query_keys.append((revision_id ,))
        for ((revision_id,), parent_keys) in \
                self.revisions.get_parent_map(query_keys).iteritems():
            if parent_keys:
                result[revision_id] = tuple(parent_revid
                    for (parent_revid,) in parent_keys)
            else:
                result[revision_id] = (_mod_revision.NULL_REVISION,)
        return result
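    # Result-shape sketch (illustrative ids): ghosts are simply absent from
    # the result, NULL_REVISION maps to (), and a revision whose only parent
    # is the origin maps to (NULL_REVISION,):
    #
    #   repo.get_parent_map(['rev-2', 'null:', 'ghost-rev'])
    #   # -> {'rev-2': ('rev-1',), 'null:': ()}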
    def _make_parents_provider(self):
        return self

    def get_graph(self, other_repository=None):
        """Return the graph walker for this repository format"""
        parents_provider = self._make_parents_provider()
        if (other_repository is not None and
            not self.has_same_location(other_repository)):
            parents_provider = graph._StackedParentsProvider(
                [parents_provider, other_repository._make_parents_provider()])
        return graph.Graph(parents_provider)
    def _get_versioned_file_checker(self, text_key_references=None):
        """Return an object suitable for checking versioned files.

        :param text_key_references: if non-None, an already built
            dictionary mapping text keys ((fileid, revision_id) tuples)
            to whether they were referred to by the inventory of the
            revision_id that they contain. If None, this will be
            calculated.
        """
        return _VersionedFileChecker(self,
            text_key_references=text_key_references)
    def revision_ids_to_search_result(self, result_set):
        """Convert a set of revision ids to a graph SearchResult."""
        result_parents = set()
        for parents in self.get_graph().get_parent_map(
            result_set).itervalues():
            result_parents.update(parents)
        included_keys = result_set.intersection(result_parents)
        start_keys = result_set.difference(included_keys)
        exclude_keys = result_parents.difference(result_set)
        result = graph.SearchResult(start_keys, exclude_keys,
            len(result_set), result_set)
        return result
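    # Worked sketch (illustrative): for a history A -> B -> C and
    # result_set = set([B, C]), the parents seen are set([A, B]); B is both
    # present and a parent, so the search starts at C (start_keys), excludes
    # A (exclude_keys), and records a count of 2.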
    @needs_write_lock
    def set_make_working_trees(self, new_value):
        raise NotImplementedError(self.set_make_working_trees)
                            content is copied.
        :param pb: optional progress bar to use for progress reports. If not
            provided a default one will be created.
        :return: None.
        """
        from bzrlib.fetch import RepoFetcher
        f = RepoFetcher(to_repository=self.target,
                        from_repository=self.source,
                        last_revision=revision_id,
                        fetch_spec=fetch_spec,
                        pb=pb, find_ghosts=find_ghosts)
    def _walk_to_common_revisions(self, revision_ids):
        """Walk out from revision_ids in source to revisions target has.

        :param revision_ids: The start point for the search.
        :return: A set of revision ids.
        """
        target_graph = self.target.get_graph()
        revision_ids = frozenset(revision_ids)
        # Fast path for the case where all the revisions are already in the
        # target repo.
        # (Although this does incur an extra round trip for the
        # fairly common case where the target doesn't already have the revision
        # we're pushing.)
        if set(target_graph.get_parent_map(revision_ids)) == revision_ids:
            return graph.SearchResult(revision_ids, set(), 0, set())
        missing_revs = set()
        source_graph = self.source.get_graph()
        # ensure we don't pay silly lookup costs.
        searcher = source_graph._make_breadth_first_searcher(revision_ids)
        null_set = frozenset([_mod_revision.NULL_REVISION])
        searcher_exhausted = False
        while True:
            next_revs = set()
            ghosts = set()
            # Iterate the searcher until we have enough next_revs
            while len(next_revs) < self._walk_to_common_revisions_batch_size:
                try:
                    next_revs_part, ghosts_part = searcher.next_with_ghosts()
                    next_revs.update(next_revs_part)
                    ghosts.update(ghosts_part)
                except StopIteration:
                    searcher_exhausted = True
                    break
            # If there are ghosts in the source graph, and the caller asked for
            # them, make sure that they are present in the target.
            # We don't care about other ghosts as we can't fetch them and
            # haven't been asked to.
            ghosts_to_check = set(revision_ids.intersection(ghosts))
            revs_to_get = set(next_revs).union(ghosts_to_check)
            if revs_to_get:
                have_revs = set(target_graph.get_parent_map(revs_to_get))
                # we always have NULL_REVISION present.
                have_revs = have_revs.union(null_set)
                # Check if the target is missing any ghosts we need.
                ghosts_to_check.difference_update(have_revs)
                if ghosts_to_check:
                    # One of the caller's revision_ids is a ghost in both the
                    # source and the target.
                    raise errors.NoSuchRevision(
                        self.source, ghosts_to_check.pop())
                missing_revs.update(next_revs - have_revs)
                # Because we may have walked past the original stop point, make
                # sure everything is stopped
                stop_revs = searcher.find_seen_ancestors(have_revs)
                searcher.stop_searching_any(stop_revs)
            if searcher_exhausted:
                break
        return searcher.get_result()
    @needs_read_lock
    def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):
        """Return the revision ids that source has that target does not.

        These are returned in topological order.

        :param revision_id: only return revision ids included by this
                            revision_id.
        :param find_ghosts: If True find missing revisions in deep history
            rather than just finding the surface difference.
        :return: A bzrlib.graph.SearchResult.
        """
        # stop searching at found target revisions.
        if not find_ghosts and revision_id is not None:
            return self._walk_to_common_revisions([revision_id])
        # generic, possibly worst case, slow code path.
        target_ids = set(self.target.all_revision_ids())
        if revision_id is not None:
            source_ids = self.source.get_ancestry(revision_id)
            if source_ids[0] is not None:
                raise AssertionError()
            source_ids.pop(0)
        else:
            source_ids = self.source.all_revision_ids()
        result_set = set(source_ids).difference(target_ids)
        return self.source.revision_ids_to_search_result(result_set)
    @staticmethod
    def _same_model(source, target):
        """True if source and target have the same data representation.

        Note: this is always called on the base class; overriding it in a
        subclass will have no effect.
        """
        try:
            InterRepository._assert_same_model(source, target)
            return True
        except errors.IncompatibleRepositories, e:
            return False

    @staticmethod
    def _assert_same_model(source, target):
        """Raise an exception if two repositories do not use the same model.
        """
        if source.supports_rich_root() != target.supports_rich_root():
            raise errors.IncompatibleRepositories(source, target,
                "different rich-root support")
        if source._serializer != target._serializer:
            raise errors.IncompatibleRepositories(source, target,
                "different serializers")
class InterSameDataRepository(InterRepository):
    """Code for converting between repositories that represent the same data.

    Data format and model must match for this to work.
    """

    @classmethod
    def _get_repo_format_to_test(self):
        """Repository format for testing with.

        InterSameData can pull from subtree to subtree and from non-subtree to
        non-subtree, so we test this with the richest repository format.
        """
        from bzrlib.repofmt import knitrepo
        return knitrepo.RepositoryFormatKnit3()
    @staticmethod
    def is_compatible(source, target):
        return InterRepository._same_model(source, target)
    @needs_write_lock
    def copy_content(self, revision_id=None):
        """Make a complete copy of the content in self into destination.

        This copies both the repository's revision data, and configuration information
        such as the make_working_trees setting.

        This is a destructive operation! Do not use it on existing
        repositories.

        :param revision_id: Only copy the content needed to construct
                            revision_id and its parents.
        """
        try:
            self.target.set_make_working_trees(self.source.make_working_trees())
        except NotImplementedError:
            pass
        # but don't bother fetching if we have the needed data now.
        if (revision_id not in (None, _mod_revision.NULL_REVISION) and
            self.target.has_revision(revision_id)):
            return
        self.target.fetch(self.source, revision_id=revision_id)
class InterWeaveRepo(InterSameDataRepository):
    """Optimised code paths between Weave based repositories.

    This should be in bzrlib/repofmt/weaverepo.py but we have not yet
    implemented lazy inter-object optimisation.
    """
    @classmethod
    def _get_repo_format_to_test(self):
        from bzrlib.repofmt import weaverepo
        return weaverepo.RepositoryFormat7()
    @staticmethod
    def is_compatible(source, target):
        """Be compatible with known Knit formats.

        We don't test for the stores being of specific types because that
        could lead to confusing results, and there is no need to be
        overly general.
        """
        from bzrlib.repofmt.knitrepo import RepositoryFormatKnit
        try:
            are_knits = (isinstance(source._format, RepositoryFormatKnit) and
                isinstance(target._format, RepositoryFormatKnit))
        except AttributeError:
            return False
        return are_knits and InterRepository._same_model(source, target)
    @needs_read_lock
    def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):
        """See InterRepository.missing_revision_ids()."""
        if revision_id is not None:
            source_ids = self.source.get_ancestry(revision_id)
            if source_ids[0] is not None:
                raise AssertionError()
            source_ids.pop(0)
        else:
            source_ids = self.source.all_revision_ids()
        source_ids_set = set(source_ids)
        # source_ids is the worst possible case we may need to pull.
        # now we want to filter source_ids against what we actually
        # have in target, but don't try to check for existence where we know
        # we do not have a revision as that would be pointless.
        target_ids = set(self.target.all_revision_ids())
        possibly_present_revisions = target_ids.intersection(source_ids_set)
        actually_present_revisions = set(
            self.target._eliminate_revisions_not_present(possibly_present_revisions))
        required_revisions = source_ids_set.difference(actually_present_revisions)
        if revision_id is not None:
            # we used get_ancestry to determine source_ids then we are assured all
            # revisions referenced are present as they are installed in topological order.
            # and the tip revision was validated by get_ancestry.
            result_set = required_revisions
        else:
            # if we just grabbed the possibly available ids, then
            # we only have an estimate of whats available and need to validate
            # that against the revision records.
            result_set = set(
                self.source._eliminate_revisions_not_present(required_revisions))
        return self.source.revision_ids_to_search_result(result_set)
class InterPackRepo(InterSameDataRepository):
    """Optimised code paths between Pack based repositories."""

    @classmethod
    def _get_repo_format_to_test(self):
        from bzrlib.repofmt import pack_repo
        return pack_repo.RepositoryFormatKnitPack1()
    @staticmethod
    def is_compatible(source, target):
        """Be compatible with known Pack formats.

        We don't test for the stores being of specific types because that
        could lead to confusing results, and there is no need to be
        overly general.
        """
        from bzrlib.repofmt.pack_repo import RepositoryFormatPack
        try:
            are_packs = (isinstance(source._format, RepositoryFormatPack) and
                isinstance(target._format, RepositoryFormatPack))
        except AttributeError:
            return False
        return are_packs and InterRepository._same_model(source, target)
    @needs_write_lock
    def fetch(self, revision_id=None, pb=None, find_ghosts=False,
            fetch_spec=None):
        """See InterRepository.fetch()."""
        if (len(self.source._fallback_repositories) > 0 or
            len(self.target._fallback_repositories) > 0):
            # The pack layer is not aware of fallback repositories, so when
            # fetching from a stacked repository or into a stacked repository
            # we use the generic fetch logic which uses the VersionedFiles
            # attributes on repository.
            from bzrlib.fetch import RepoFetcher
            fetcher = RepoFetcher(self.target, self.source, revision_id,
                                  pb, find_ghosts, fetch_spec=fetch_spec)
        if fetch_spec is not None:
            if len(list(fetch_spec.heads)) != 1:
                raise AssertionError(
                    "InterPackRepo.fetch doesn't support "
                    "fetching multiple heads yet.")
            revision_id = list(fetch_spec.heads)[0]
            fetch_spec = None
        if revision_id is None:
            # TODO:
            # everything to do - use pack logic
            # to fetch from all packs to one without
            # inventory parsing etc, IFF nothing to be copied is in the target.
            # till then:
            source_revision_ids = frozenset(self.source.all_revision_ids())
            revision_ids = source_revision_ids - \
                frozenset(self.target.get_parent_map(source_revision_ids))
            revision_keys = [(revid,) for revid in revision_ids]
            index = self.target._pack_collection.revision_index.combined_index
            present_revision_ids = set(item[1][0] for item in
                index.iter_entries(revision_keys))
            revision_ids = set(revision_ids) - present_revision_ids
            # implementing the TODO will involve:
            # - detecting when all of a pack is selected
            # - avoiding as much as possible pre-selection, so the
            # more-core routines such as create_pack_from_packs can filter in
            # a just-in-time fashion. (though having a HEADS list on a
            # repository might make this a lot easier, because we could
            # sensibly detect 'new revisions' without doing a full index scan.
        elif _mod_revision.is_null(revision_id):
            # nothing to do:
            return (0, [])
        else:
            try:
                revision_ids = self.search_missing_revision_ids(revision_id,
                    find_ghosts=find_ghosts).get_keys()
            except errors.NoSuchRevision:
                raise errors.InstallFailed([revision_id])
            if len(revision_ids) == 0:
                return (0, [])
        return self._pack(self.source, self.target, revision_ids)

    def _pack(self, source, target, revision_ids):
        from bzrlib.repofmt.pack_repo import Packer
        packs = source._pack_collection.all_packs()
        pack = Packer(self.target._pack_collection, packs, '.fetch',
            revision_ids).pack()
        if pack is not None:
            self.target._pack_collection._save_pack_names()
            copied_revs = pack.get_revision_count()
            # Trigger an autopack. This may duplicate effort as we've just done
            # a pack creation, but for now it is simpler to think about as
            # 'upload data, then repack if needed'.
            self.target._pack_collection.autopack()
            return (copied_revs, [])
        else:
            return (0, [])
    @needs_read_lock
    def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):
        """See InterRepository.missing_revision_ids().

        :param find_ghosts: Find ghosts throughout the ancestry of
            revision_id.
        """
        if not find_ghosts and revision_id is not None:
            return self._walk_to_common_revisions([revision_id])
        elif revision_id is not None:
            # Find ghosts: search for revisions pointing from one repository to
            # the other, and vice versa, anywhere in the history of revision_id.
            graph = self.target.get_graph(other_repository=self.source)
            searcher = graph._make_breadth_first_searcher([revision_id])
            found_ids = set()
            while True:
                try:
                    next_revs, ghosts = searcher.next_with_ghosts()
                except StopIteration:
                    break
                if revision_id in ghosts:
                    raise errors.NoSuchRevision(self.source, revision_id)
                found_ids.update(next_revs)
                found_ids.update(ghosts)
            found_ids = frozenset(found_ids)
            # Double query here: should be able to avoid this by changing the
            # graph api further.
            result_set = found_ids - frozenset(
                self.target.get_parent_map(found_ids))
        else:
            source_ids = self.source.all_revision_ids()
            # source_ids is the worst possible case we may need to pull.
            # now we want to filter source_ids against what we actually
            # have in target, but don't try to check for existence where we know
            # we do not have a revision as that would be pointless.
            target_ids = set(self.target.all_revision_ids())
            result_set = set(source_ids).difference(target_ids)
        return self.source.revision_ids_to_search_result(result_set)
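    # Usage sketch (illustrative; `source` and `target` are assumed pack
    # repositories and 'tip-rev' a placeholder id):
    #
    #   inter = InterRepository.get(source, target)
    #   search = inter.search_missing_revision_ids('tip-rev', find_ghosts=True)
    #   missing = search.get_keys()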
class InterDifferingSerializer(InterKnitRepo):

    @classmethod
    def _get_repo_format_to_test(self):
        return None
    @staticmethod
    def is_compatible(source, target):
        """Be compatible with Knit2 source and Knit3 target"""
        if source.supports_rich_root() != target.supports_rich_root():
            return False
        # Ideally, we'd support fetching if the source had no tree references
        # even if it supported them...
        if (getattr(source._format, 'supports_tree_reference', False) and
            not getattr(target._format, 'supports_tree_reference', False)):
            return False
        return True
    def _get_delta_for_revision(self, tree, parent_ids, basis_id, cache):
        """Get the best delta and base for this revision.

        :return: (basis_id, delta)
        """
        possible_trees = [(parent_id, cache[parent_id])
                          for parent_id in parent_ids
                          if parent_id in cache]
        if len(possible_trees) == 0:
            # There either aren't any parents, or the parents aren't in the
            # cache, so just use the last converted tree
            possible_trees.append((basis_id, cache[basis_id]))
        deltas = []
        for basis_id, basis_tree in possible_trees:
            delta = tree.inventory._make_delta(basis_tree.inventory)
            deltas.append((len(delta), basis_id, delta))
        deltas.sort()
        return deltas[0][1:]
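    # Delta-shape sketch (illustrative): an inventory delta is a list of
    # (old_path, new_path, file_id, entry) tuples, and the shortest delta
    # against any cached parent tree wins. A single modified file looks like:
    #
    #   [('a.txt', 'a.txt', 'file-id-a', <updated InventoryFile entry>)]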
    def _fetch_batch(self, revision_ids, basis_id, cache):
        """Fetch across a few revisions.

        :param revision_ids: The revisions to copy
        :param basis_id: The revision_id of a tree that must be in cache, used
            as a basis for delta when no other base is available
        :param cache: A cache of RevisionTrees that we can use.
        :return: The revision_id of the last converted tree. The RevisionTree
            for it will be in cache
        """
        # Walk though all revisions; get inventory deltas, copy referenced
        # texts that delta references, insert the delta, revision and
        # signature.
        text_keys = set()
        pending_deltas = []
        pending_revisions = []
        parent_map = self.source.get_parent_map(revision_ids)
        for tree in self.source.revision_trees(revision_ids):
            current_revision_id = tree.get_revision_id()
            parent_ids = parent_map.get(current_revision_id, ())
            basis_id, delta = self._get_delta_for_revision(tree, parent_ids,
                                                           basis_id, cache)
            # Find text entries that need to be copied
            for old_path, new_path, file_id, entry in delta:
                if new_path is not None:
                    if not (new_path or self.target.supports_rich_root()):
                        # We don't copy the text for the root node unless the
                        # target supports_rich_root.
                        continue
                    text_keys.add((file_id, entry.revision))
            revision = self.source.get_revision(current_revision_id)
            pending_deltas.append((basis_id, delta,
                current_revision_id, revision.parent_ids))
            pending_revisions.append(revision)
            cache[current_revision_id] = tree
            basis_id = current_revision_id
        # Copy file texts
        from_texts = self.source.texts
        to_texts = self.target.texts
        to_texts.insert_record_stream(from_texts.get_record_stream(
            text_keys, self.target._format._fetch_order,
            not self.target._format._fetch_uses_deltas))
        # insert inventory deltas
        for delta in pending_deltas:
            self.target.add_inventory_by_delta(*delta)
        # insert signatures and revisions
        for revision in pending_revisions:
            try:
                signature = self.source.get_signature_text(
                    revision.revision_id)
                self.target.add_signature_text(revision.revision_id,
                    signature)
            except errors.NoSuchRevision:
                pass
            self.target.add_revision(revision.revision_id, revision)
        return basis_id
    def _fetch_all_revisions(self, revision_ids, pb):
        """Fetch everything for the list of revisions.

        :param revision_ids: The list of revisions to fetch. Must be in
            topological order.
        :param pb: A ProgressBar
        :return: None
        """
        basis_id, basis_tree = self._get_basis(revision_ids[0])
        batch_size = 100
        cache = lru_cache.LRUCache(100)
        cache[basis_id] = basis_tree
        del basis_tree # We don't want to hang on to it here
        for offset in range(0, len(revision_ids), batch_size):
            self.target.start_write_group()
            try:
                pb.update('Transferring revisions', offset,
                          len(revision_ids))
                batch = revision_ids[offset:offset+batch_size]
                basis_id = self._fetch_batch(batch, basis_id, cache)
            except:
                self.target.abort_write_group()
                raise
            else:
                self.target.commit_write_group()
        pb.update('Transferring revisions', len(revision_ids),
                  len(revision_ids))
    @needs_write_lock
    def fetch(self, revision_id=None, pb=None, find_ghosts=False,
            fetch_spec=None):
        """See InterRepository.fetch()."""
        if fetch_spec is not None:
            raise AssertionError("Not implemented yet...")
        revision_ids = self.target.search_missing_revision_ids(self.source,
            revision_id, find_ghosts=find_ghosts).get_keys()
        if not revision_ids:
            return 0, 0
        revision_ids = tsort.topo_sort(
            self.source.get_graph().get_parent_map(revision_ids))
        if pb is None:
            my_pb = ui.ui_factory.nested_progress_bar()
            pb = my_pb
        else:
            symbol_versioning.warn(
                symbol_versioning.deprecated_in((1, 14, 0))
                % "pb parameter to fetch()")
            my_pb = None
        try:
            self._fetch_all_revisions(revision_ids, pb)
        finally:
            if my_pb is not None:
                my_pb.finished()
        return len(revision_ids), 0
    def _get_basis(self, first_revision_id):
        """Get a revision and tree which exists in the target.

        This assumes that first_revision_id is selected for transmission
        because all other ancestors are already present. If we can't find an
        ancestor we fall back to NULL_REVISION since we know that is safe.

        :return: (basis_id, basis_tree)
        """
        first_rev = self.source.get_revision(first_revision_id)
        try:
            basis_id = first_rev.parent_ids[0]
            # only valid as a basis if the target has it
            self.target.get_revision(basis_id)
            # Try to get a basis tree - if its a ghost it will hit the
            # NoSuchRevision case.
            basis_tree = self.source.revision_tree(basis_id)
        except (IndexError, errors.NoSuchRevision):
            basis_id = _mod_revision.NULL_REVISION
            basis_tree = self.source.revision_tree(basis_id)
        return basis_id, basis_tree
InterRepository.register_optimiser(InterDifferingSerializer)
InterRepository.register_optimiser(InterSameDataRepository)
InterRepository.register_optimiser(InterWeaveRepo)
InterRepository.register_optimiser(InterKnitRepo)
InterRepository.register_optimiser(InterPackRepo)
class CopyConverter(object):
    """A repository conversion tool which just performs a copy of the content.

    This is slow but quite reliable.
    """

    def step(self, message):
        """Update the pb by a step."""
        self.count += 1
        self.pb.update(message, self.count, self.total)


_unescape_map = {
    'apos': "'",
    'quot': '"',
    'amp': '&',
    'lt': '<',
    'gt': '>',
}


def _unescaper(match, _map=_unescape_map):
    code = match.group(1)
    try:
        return _map[code]
    except KeyError:
        if not code.startswith('#'):
            raise
        return unichr(int(code[1:])).encode('utf8')


_unescape_re = None


def _unescape_xml(data):
    """Unescape predefined XML entities in a string of data."""
    global _unescape_re
    if _unescape_re is None:
        _unescape_re = re.compile('\&([^;]*);')
    return _unescape_re.sub(_unescaper, data)
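
# Illustrative sketch (not part of the original module): _unescape_xml turns
# the predefined XML entities back into characters, e.g.
#
#     _unescape_xml('a &amp; b &lt; c')   # -> 'a & b < c'
#     _unescape_xml('&#65;')              # -> 'A' (numeric references too)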


class _VersionedFileChecker(object):

    def __init__(self, repository, text_key_references=None):
        self.repository = repository
        self.text_index = self.repository._generate_text_key_index(
            text_key_references=text_key_references)

    def calculate_file_version_parents(self, text_key):
        """Calculate the correct parents for a file version according to
        the inventories.
        """
        parent_keys = self.text_index[text_key]
        if parent_keys == [_mod_revision.NULL_REVISION]:
            return ()
        return tuple(parent_keys)
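
    # Illustrative sketch (not part of the original module): text keys are
    # (file_id, revision_id) tuples, and a NULL_REVISION parent list maps to
    # the empty tuple, e.g. (assumed ids):
    #
    #     checker = _VersionedFileChecker(repo)
    #     checker.calculate_file_version_parents(('file-id', 'rev-2'))
    #     # -> ('rev-1',), or () for a first version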

    def check_file_version_parents(self, texts, progress_bar=None):
        """Check the parents stored in a versioned file are correct.

        It also detects file versions that are not referenced by their
        corresponding revision's inventory.

        :returns: A tuple of (wrong_parents, dangling_file_versions).
            wrong_parents is a dict mapping {revision_id: (stored_parents,
            correct_parents)} for each revision_id where the stored parents
            are not correct. dangling_file_versions is a set of (file_id,
            revision_id) tuples for versions that are present in this
            versioned file, but not used by the corresponding inventory.
        """
        wrong_parents = {}
        self.file_ids = set([file_id for file_id, _ in
            self.text_index.iterkeys()])
        # text keys is now grouped by file_id
        n_weaves = len(self.file_ids)
        files_in_revisions = {}
        revisions_of_files = {}
        n_versions = len(self.text_index)
        if progress_bar is not None:
            progress_bar.update('loading text store', 0, n_versions)
        parent_map = self.repository.texts.get_parent_map(self.text_index)
        # On unlistable transports this could well be empty/error...
        text_keys = self.repository.texts.keys()
        unused_keys = frozenset(text_keys) - set(self.text_index)
        for num, key in enumerate(self.text_index.iterkeys()):
            if progress_bar is not None:
                progress_bar.update('checking text graph', num, n_versions)
            correct_parents = self.calculate_file_version_parents(key)
            try:
                knit_parents = parent_map[key]
            except errors.RevisionNotPresent:
                # Missing text: record no stored parents rather than crashing.
                knit_parents = None
            if correct_parents != knit_parents:
                wrong_parents[key] = (knit_parents, correct_parents)
        return wrong_parents, unused_keys
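
# Illustrative sketch (not part of the original module): a consistency check
# over a repository's text graph might look like this (assumed setup):
#
#     repo.lock_read()
#     try:
#         checker = _VersionedFileChecker(repo)
#         wrong, unused = checker.check_file_version_parents(repo.texts)
#         for key, (stored, correct) in wrong.iteritems():
#             print 'bad parents for %r: %r != %r' % (key, stored, correct)
#     finally:
#         repo.unlock()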


def _old_get_graph(repository, revision_id):
    """DO NOT USE. That is all. I'm serious."""
    graph = repository.get_graph()
    revision_graph = dict(((key, value) for key, value in
        graph.iter_ancestry([revision_id]) if value is not None))
    return _strip_NULL_ghosts(revision_graph)


def _strip_NULL_ghosts(revision_graph):
    """Also don't use this. More compatibility code for unmigrated clients."""
    # Filter ghosts, and null:
    if _mod_revision.NULL_REVISION in revision_graph:
        del revision_graph[_mod_revision.NULL_REVISION]
    for key, parents in revision_graph.items():
        revision_graph[key] = tuple(parent for parent in parents if parent
            in revision_graph)
    return revision_graph
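
# Illustrative sketch (not part of the original module): ghosts (parents not
# present as keys) and NULL_REVISION are dropped in place, e.g.:
#
#     g = {'rev-2': ('rev-1', 'ghost-1'), 'rev-1': ('null:',)}
#     _strip_NULL_ghosts(g)
#     # -> {'rev-2': ('rev-1',), 'rev-1': ()}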


class StreamSink(object):
    """An object that can insert a stream into a repository.

    This interface handles the complexity of reserialising inventories and
    revisions from different formats, and allows unidirectional insertion into
    stacked repositories without looking for the missing basis parents
    beforehand.
    """

    def __init__(self, target_repo):
        self.target_repo = target_repo

    def insert_stream(self, stream, src_format, resume_tokens):
        """Insert a stream's content into the target repository.

        :param src_format: a bzr repository format.

        :return: a list of resume tokens and an iterable of keys for
            additional items required before the insertion can be completed.
        """
        self.target_repo.lock_write()
        try:
            if resume_tokens:
                self.target_repo.resume_write_group(resume_tokens)
            else:
                self.target_repo.start_write_group()
            try:
                # locked_insert_stream performs a commit|suspend.
                return self._locked_insert_stream(stream, src_format)
            except:
                self.target_repo.abort_write_group(suppress_errors=True)
                raise
        finally:
            self.target_repo.unlock()
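
    # Illustrative sketch (not part of the original module): the caller loops
    # until no keys are missing, resuming with the returned tokens (assumed
    # 'sink' and 'source' objects):
    #
    #     tokens, missing = sink.insert_stream(stream, src_format, [])
    #     while missing:
    #         stream = source.get_stream_for_missing_keys(missing)
    #         tokens, missing = sink.insert_stream(stream, src_format, tokens)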

    def _locked_insert_stream(self, stream, src_format):
        to_serializer = self.target_repo._format._serializer
        src_serializer = src_format._serializer
        if to_serializer == src_serializer:
            # If serializers match and the target is a pack repository, set
            # the write cache size on the new pack. This avoids poor
            # performance on transports where append is unbuffered (such as
            # RemoteTransport). This is safe to do because nothing should
            # read back from the target repository while a stream with
            # matching serialization is being inserted.
            # The exception is that a delta record from the source that should
            # be a fulltext may need to be expanded by the target (see
            # test_fetch_revisions_with_deltas_into_pack); but we take care to
            # explicitly flush any buffered writes first in that rare case.
            try:
                new_pack = self.target_repo._pack_collection._new_pack
            except AttributeError:
                # Not a pack repository
                pass
            else:
                new_pack.set_write_cache_size(1024*1024)
        for substream_type, substream in stream:
            if substream_type == 'texts':
                self.target_repo.texts.insert_record_stream(substream)
            elif substream_type == 'inventories':
                if src_serializer == to_serializer:
                    self.target_repo.inventories.insert_record_stream(
                        substream)
                else:
                    self._extract_and_insert_inventories(
                        substream, src_serializer)
            elif substream_type == 'revisions':
                # This may fallback to extract-and-insert more often than
                # required if the serializers are different only in terms of
                # the inventory.
                if src_serializer == to_serializer:
                    self.target_repo.revisions.insert_record_stream(
                        substream)
                else:
                    self._extract_and_insert_revisions(substream,
                        src_serializer)
            elif substream_type == 'signatures':
                self.target_repo.signatures.insert_record_stream(substream)
            else:
                raise AssertionError('kaboom! %s' % (substream_type,))
        missing_keys = set()
        for prefix, versioned_file in (
                ('texts', self.target_repo.texts),
                ('inventories', self.target_repo.inventories),
                ('revisions', self.target_repo.revisions),
                ('signatures', self.target_repo.signatures),
                ):
            try:
                missing_keys.update((prefix,) + key for key in
                    versioned_file.get_missing_compression_parent_keys())
            except NotImplementedError:
                # cannot even attempt suspending, and missing would have
                # failed during stream insertion.
                missing_keys = set()
                break
        if missing_keys:
            # suspend the write group and tell the caller what is missing. We
            # know we can suspend or else we would not have entered this code
            # path. (All repositories that can handle missing keys can handle
            # suspending a write group).
            write_group_tokens = self.target_repo.suspend_write_group()
            return write_group_tokens, missing_keys
        self.target_repo.commit_write_group()
        return [], set()
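
    # Illustrative sketch (not part of the original module): a stream is an
    # iterable of (substream_type, record_stream) pairs, e.g.
    #
    #     stream = [('texts', text_records), ('inventories', inv_records),
    #               ('signatures', sig_records), ('revisions', rev_records)]
    #
    # where each *_records is an insert_record_stream-compatible record
    # iterator (assumed names).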

    def _extract_and_insert_inventories(self, substream, serializer):
        """Generate a new inventory versionedfile in target, converting data.

        The inventory is retrieved from the source (deserializing it), and
        stored in the target (reserializing it in a different format).
        """
        for record in substream:
            bytes = record.get_bytes_as('fulltext')
            revision_id = record.key[0]
            inv = serializer.read_inventory_from_string(bytes, revision_id)
            parents = [key[0] for key in record.parents]
            self.target_repo.add_inventory(revision_id, inv, parents)

    def _extract_and_insert_revisions(self, substream, serializer):
        for record in substream:
            bytes = record.get_bytes_as('fulltext')
            revision_id = record.key[0]
            rev = serializer.read_revision_from_string(bytes)
            if rev.revision_id != revision_id:
                raise AssertionError(
                    'Mismatched revision id: %s != %s' % (rev, revision_id))
            self.target_repo.add_revision(revision_id, rev)

    def finished(self):
        if self.target_repo._format._fetch_reconcile:
            self.target_repo.reconcile()


class StreamSource(object):
    """A source of a stream for fetching between repositories."""

    def __init__(self, from_repository, to_format):
        """Create a StreamSource streaming from from_repository."""
        self.from_repository = from_repository
        self.to_format = to_format

    def delta_on_metadata(self):
        """Return True if deltas are permitted on metadata streams.

        That is on revisions and signatures.
        """
        src_serializer = self.from_repository._format._serializer
        target_serializer = self.to_format._serializer
        return (self.to_format._fetch_uses_deltas and
            src_serializer == target_serializer)

    def _fetch_revision_texts(self, revs):
        # fetch signatures first and then the revision texts
        # may need to be an InterRevisionStore call here.
        from_sf = self.from_repository.signatures
        # A missing signature is just skipped.
        keys = [(rev_id,) for rev_id in revs]
        signatures = versionedfile.filter_absent(from_sf.get_record_stream(
            keys,
            self.to_format._fetch_order,
            not self.to_format._fetch_uses_deltas))
        # If a revision has a delta, it is now expanded inside the
        # insert_record_stream code instead.
        from_rf = self.from_repository.revisions
        revisions = from_rf.get_record_stream(
            keys,
            self.to_format._fetch_order,
            not self.delta_on_metadata())
        return [('signatures', signatures), ('revisions', revisions)]

    def _generate_root_texts(self, revs):
        """This will be called by __fetch between fetching weave texts and
        fetching the inventory weave.

        Subclasses should override this if they need to generate root texts
        after fetching weave texts.
        """
        if self._rich_root_upgrade():
            import bzrlib.fetch
            return bzrlib.fetch.Inter1and2Helper(
                self.from_repository).generate_root_texts(revs)
        else:
            return []

    def get_stream(self, search):
        phase = 'file'
        revs = search.get_keys()
        graph = self.from_repository.get_graph()
        revs = list(graph.iter_topo_order(revs))
        data_to_fetch = self.from_repository.item_keys_introduced_by(revs)
        text_keys = []
        for knit_kind, file_id, revisions in data_to_fetch:
            if knit_kind != phase:
                phase = knit_kind
                # Make a new progress bar for this phase
            if knit_kind == "file":
                # Accumulate file texts
                text_keys.extend([(file_id, revision) for revision in
                    revisions])
            elif knit_kind == "inventory":
                # Now copy the file texts.
                from_texts = self.from_repository.texts
                yield ('texts', from_texts.get_record_stream(
                    text_keys, self.to_format._fetch_order,
                    not self.to_format._fetch_uses_deltas))
                # Cause an error if a text occurs after we have done the
                # copy.
                text_keys = None
                # Before we process the inventory we generate the root
                # texts (if necessary) so that the inventories reference
                # them.
                for _ in self._generate_root_texts(revs):
                    yield _
                # NB: This currently reopens the inventory weave in source;
                # using a single stream interface instead would avoid this.
                from_weave = self.from_repository.inventories
                # we fetch only the referenced inventories because we do not
                # know for unselected inventories whether all their required
                # texts are present in the other repository - it could be
                # corrupt.
                yield ('inventories', from_weave.get_record_stream(
                    [(rev_id,) for rev_id in revs],
                    self.inventory_fetch_order(),
                    not self.delta_on_metadata()))
            elif knit_kind == "signatures":
                # Nothing to do here; this will be taken care of when
                # _fetch_revision_texts happens.
                pass
            elif knit_kind == "revisions":
                for record in self._fetch_revision_texts(revs):
                    yield record
            else:
                raise AssertionError("Unknown knit kind %r" % knit_kind)

    def get_stream_for_missing_keys(self, missing_keys):
        # missing keys can only occur when we are byte copying and not
        # translating (because translation means we don't send
        # unreconstructable deltas ever).
        keys = {}
        keys['texts'] = set()
        keys['revisions'] = set()
        keys['inventories'] = set()
        keys['signatures'] = set()
        for key in missing_keys:
            keys[key[0]].add(key[1:])
        if len(keys['revisions']):
            # If we allowed copying revisions at this point, we could end up
            # copying a revision without copying its required texts: a
            # violation of the requirements for repository integrity.
            raise AssertionError(
                'cannot copy revisions to fill in missing deltas %s' % (
                    keys['revisions'],))
        for substream_kind, substream_keys in keys.iteritems():
            vf = getattr(self.from_repository, substream_kind)
            # Ask for full texts always so that we don't need more round
            # trips after this stream.
            stream = vf.get_record_stream(substream_keys,
                self.to_format._fetch_order, True)
            yield substream_kind, stream
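
    # Illustrative sketch (not part of the original module): missing keys are
    # prefixed tuples as produced by _locked_insert_stream above, e.g.
    #
    #     missing = set([('texts', ('file-id', 'rev-1')),
    #                    ('inventories', ('rev-1',))])
    #     for kind, stream in source.get_stream_for_missing_keys(missing):
    #         pass  # feed each substream back into the sink
    #
    # 'file-id', 'rev-1' and 'source' are assumed names.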

    def inventory_fetch_order(self):
        if self._rich_root_upgrade():
            return 'topological'
        else:
            return self.to_format._fetch_order

    def _rich_root_upgrade(self):
        return (not self.from_repository._format.rich_root_data and
            self.to_format.rich_root_data)
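
    # Illustrative sketch (not part of the original module): e.g. fetching
    # from a non-rich-root format (rich_root_data=False) into a rich-root
    # format (rich_root_data=True) makes _rich_root_upgrade() return True,
    # which forces the 'topological' inventory_fetch_order() above.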