~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/repository.py

Committer: Canonical.com Patch Queue Manager
Date: 2009-10-12 22:36:42 UTC
mfrom: (4736.1.1 2.1-static-tuple-py2.4-compat)
Revision ID: pqm@pqm.ubuntu.com-20091012223642-0seiqhjw7sa587dm

(jam) Some python2.4 fixes for the StaticTuple code.

files added:
BRANCH.TODO

COPYING.txt

INSTALL

bzr.ico

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/email_message.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/store/revision

bzrlib/store/versioned

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_script.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transform.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave_commands.py

bzrlib/win32utils.py

bzrlib/workingtree_4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

doc/Bazaar-Logo-For-Manuals.png

doc/default.css

doc/developers

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/conf.py

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/miscellaneous-notes.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/process.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/check-newsbugs.py

tools/generate_docs.py

tools/generate_release_notes.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-control.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/trace-revisions

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
NEWS.developers

build-api

bzrlib/clone.py

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/revfile.py

bzrlib/store/compressed_text.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

files renamed:
bzrlib/changeset.py => bzrlib/bundle/__init__.py

bzrlib/graph.py => bzrlib/deprecated_graph.py

bzr-man.py => bzrlib/doc_generate/autodoc_man.py

bzrlib/store/weave.py => bzrlib/store/versioned/__init__.py

bzrlib/selftest/ => bzrlib/tests/

bzrlib/selftest/testannotate.py => bzrlib/tests/blackbox/test_annotate.py

bzrlib/selftest/test_revision_info.py => bzrlib/tests/blackbox/test_revision_info.py

bzrlib/selftest/teststatus.py => bzrlib/tests/blackbox/test_status.py

bzrlib/selftest/blackbox.py => bzrlib/tests/blackbox/test_too_much.py

bzrlib/selftest/versioning.py => bzrlib/tests/blackbox/test_versioning.py

bzrlib/selftest/HTTPTestUtil.py => bzrlib/tests/http_utils.py

bzrlib/selftest/testbranch.py => bzrlib/tests/per_branch/test_branch.py

bzrlib/selftest/test_parent.py => bzrlib/tests/per_branch/test_parent.py

bzrlib/selftest/testrevprops.py => bzrlib/tests/per_repository/test_revision.py

bzrlib/selftest/testconfig.py => bzrlib/tests/test_config.py

bzrlib/selftest/testgraph.py => bzrlib/tests/test_deprecated_graph.py

bzrlib/selftest/testdiff.py => bzrlib/tests/test_diff.py

bzrlib/selftest/testfetch.py => bzrlib/tests/test_fetch.py

bzrlib/selftest/testhashcache.py => bzrlib/tests/test_hashcache.py

bzrlib/selftest/testidentitymap.py => bzrlib/tests/test_identitymap.py

bzrlib/selftest/testinv.py => bzrlib/tests/test_inv.py

bzrlib/selftest/testlog.py => bzrlib/tests/test_log.py

bzrlib/selftest/testmerge.py => bzrlib/tests/test_merge.py

bzrlib/selftest/testmerge3.py => bzrlib/tests/test_merge3.py

bzrlib/selftest/plugins.py => bzrlib/tests/test_plugins.py

bzrlib/selftest/testrevision.py => bzrlib/tests/test_revision.py

bzrlib/selftest/testrevisionnamespaces.py => bzrlib/tests/test_revisionspec.py

bzrlib/selftest/testsampler.py => bzrlib/tests/test_sampler.py

bzrlib/selftest/teststore.py => bzrlib/tests/test_store.py

bzrlib/selftest/testtestament.py => bzrlib/tests/test_testament.py

bzrlib/selftest/testtransactions.py => bzrlib/tests/test_transactions.py

bzrlib/selftest/testtransport.py => bzrlib/tests/test_transport.py

bzrlib/selftest/whitebox.py => bzrlib/tests/test_whitebox.py

bzrlib/selftest/testworkingtree.py => bzrlib/tests/test_workingtree.py

bzrlib/transport/http.py => bzrlib/transport/http/__init__.py

bzrlib/ui.py => bzrlib/ui/__init__.py

bzrlib/xml5.py => bzrlib/xml8.py

bzrlib/xml.py => bzrlib/xml_serializer.py

HACKING => doc/developers/HACKING.txt

tutorial.txt => doc/en/tutorials/tutorial.txt

files modified:
.bzrignore

.rsyncexclude

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/testament.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transport/__init__.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

contrib/bash/bzr.simple

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/zsh/_bzr

setup.py *

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/repository.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

import cStringIO

import re

import time

from bzrlib import (

bzrdir,

check,

chk_map,

debug,

errors,

fifo_cache,

generate_ids,

gpg,

graph,

inventory,

inventory_delta,

lazy_regex,

lockable_files,

lockdir,

lru_cache,

osutils,

revision as _mod_revision,

symbol_versioning,

tsort,

ui,

versionedfile,

)

from bzrlib.bundle import serializer

from bzrlib.revisiontree import RevisionTree

from bzrlib.store.versioned import VersionedFileStore

from bzrlib.testament import Testament

""")

from bzrlib.decorators import needs_read_lock, needs_write_lock, only_raises

from bzrlib.lock import _RelockDebugMixin

from bzrlib.inter import InterObject

from bzrlib.inventory import (

Inventory,

InventoryDirectory,

ROOT_ID,

entry_factory,

)

from bzrlib import registry

from bzrlib.trace import (

log_exception_quietly, note, mutter, mutter_callsite, warning)

# Old formats display a warning, but only once

_deprecation_warning_done = False

class CommitBuilder(object):

"""Provides an interface to build up a commit.

This allows describing a tree to be committed without needing to

know the internals of the format of the repository.

"""

# all clients should supply tree roots.

record_root_entry = True

# the default CommitBuilder does not manage trees whose root is versioned.

_versioned_root = False

def __init__(self, repository, parents, config, timestamp=None,
             timezone=None, committer=None, revprops=None,
             revision_id=None):
    """Initiate a CommitBuilder.

    :param repository: Repository to commit to.
    :param parents: Revision ids of the parents of the new revision.
    :param config: Configuration to use.
    :param timestamp: Optional timestamp recorded for commit.
    :param timezone: Optional timezone for timestamp.
    :param committer: Optional committer to set for commit.
    :param revprops: Optional dictionary of revision properties.
    :param revision_id: Optional revision id.
    :raises ValueError: If revprops fails _validate_revprops().
    """
    self._config = config

    # Fall back to the configured user name when no committer is given.
    if committer is None:
        self._committer = self._config.username()
    else:
        self._committer = committer

    self.new_inventory = Inventory(None)
    self._new_revision_id = revision_id
    self.parents = parents
    self.repository = repository

    # Validate before copying so a bad property leaves _revprops empty.
    self._revprops = {}
    if revprops is not None:
        self._validate_revprops(revprops)
        self._revprops.update(revprops)

    if timestamp is None:
        timestamp = time.time()
    # Restrict resolution to 1ms
    self._timestamp = round(timestamp, 3)

    if timezone is None:
        self._timezone = osutils.local_time_offset()
    else:
        self._timezone = int(timezone)

    # Must run after _timestamp is set: _gen_revision_id() reads it.
    self._generate_revision_if_needed()
    # Callable used by _heads() to compute graph heads.
    self.__heads = graph.HeadsCache(repository.get_graph()).heads
    self._basis_delta = []
    # API compatibility, older code that used CommitBuilder did not call
    # .record_delete(), which means the delta that is computed would not be
    # valid. Callers that will call record_delete() should call
    # .will_record_deletes() to indicate that.
    self._recording_deletes = False
    # memo'd check for no-op commits.
    self._any_changes = False

def any_changes(self):
    """Return True if any entries were changed.

    This includes merge-only changes. It is the core for the --unchanged
    detection in commit.

    :return: True if any changes have occurred.
    """
    # Flag is set by record_delete() and record_entry_contents().
    return self._any_changes

def _validate_unicode_text(self, text, context):

145

"""Verify things like commit messages don't have bogus characters."""

146

if '\r' in text:

147

raise ValueError('Invalid value for %s: %r' % (context, text))

148

149

def _validate_revprops(self, revprops):

150

for key, value in revprops.iteritems():

151

# We know that the XML serializers do not round trip '\r'

152

# correctly, so refuse to accept them

153

if not isinstance(value, basestring):

154

raise ValueError('revision property (%s) is not a valid'

155

' (unicode) string: %r' % (key, value))

156

self._validate_unicode_text(value,

157

'revision property (%s)' % (key,))

158

159

def commit(self, message):
    """Make the actual commit.

    Builds a Revision from the state accumulated on this builder, adds it
    to the repository and commits the repository write group.

    :param message: The commit message.
    :return: The revision id of the recorded revision.
    :raises ValueError: If message is rejected by
        _validate_unicode_text().
    """
    self._validate_unicode_text(message, 'commit message')
    # self.inv_sha1 is assigned by finish_inventory().
    rev = _mod_revision.Revision(
        timestamp=self._timestamp,
        timezone=self._timezone,
        committer=self._committer,
        message=message,
        inventory_sha1=self.inv_sha1,
        revision_id=self._new_revision_id,
        properties=self._revprops)
    rev.parent_ids = self.parents
    self.repository.add_revision(self._new_revision_id, rev,
                                 self.new_inventory, self._config)
    self.repository.commit_write_group()
    return self._new_revision_id

def abort(self):
    """Abort the commit that is being built.

    Aborts the repository's current write group.
    """
    self.repository.abort_write_group()

def revision_tree(self):
    """Return the tree that was just committed.

    After calling commit() this can be called to get a RevisionTree
    representing the newly committed tree. This is preferred to
    calling Repository.revision_tree() because that may require
    deserializing the inventory, while we already have a copy in
    memory.

    :return: A RevisionTree for the new revision id.
    """
    if self.new_inventory is None:
        # No in-memory inventory is held; load it from the repository and
        # keep it on the builder.
        self.new_inventory = self.repository.get_inventory(
            self._new_revision_id)
    return RevisionTree(self.repository, self.new_inventory,
                        self._new_revision_id)

def finish_inventory(self):
    """Tell the builder that the inventory is finished.

    Stores the inventory in the repository - as a delta against
    basis_delta_revision when new_inventory is None, otherwise as a full
    inventory - and keeps the value the repository returns in
    self.inv_sha1.

    :return: The inventory id in the repository, which can be used with
        repository.get_inventory.
    :raises AssertionError: If a full inventory was built without a root
        entry.
    """
    if self.new_inventory is None:
        # an inventory delta was accumulated without creating a new
        # inventory.
        basis_id = self.basis_delta_revision
        self.inv_sha1 = self.repository.add_inventory_by_delta(
            basis_id, self._basis_delta, self._new_revision_id,
            self.parents)
    else:
        if self.new_inventory.root is None:
            raise AssertionError('Root entry should be supplied to'
                                 ' record_entry_contents, as of bzr 0.10.')
        self.new_inventory.revision_id = self._new_revision_id
        self.inv_sha1 = self.repository.add_inventory(
            self._new_revision_id,
            self.new_inventory,
            self.parents
            )
    return self._new_revision_id

def _gen_revision_id(self):
    """Return new revision-id.

    The id is generated from the configured user name and this builder's
    timestamp.
    """
    return generate_ids.gen_revision_id(self._config.username(),
                                        self._timestamp)

def _generate_revision_if_needed(self):

231

"""Create a revision id if None was supplied.

232

233

If the repository can not support user-specified revision ids

234

they should override this function and raise CannotSetRevisionId

235

if _new_revision_id is not None.

236

237

:raises: CannotSetRevisionId

238

"""

239

if self._new_revision_id is None:

240

self._new_revision_id = self._gen_revision_id()

241

self.random_revid = True

242

else:

243

self.random_revid = False

244

245

def _heads(self, file_id, revision_ids):

246

"""Calculate the graph heads for revision_ids in the graph of file_id.

247

248

This can use either a per-file graph or a global revision graph as we

249

have an identity relationship between the two graphs.

250

"""

251

return self.__heads(revision_ids)

252

253

def _check_root(self, ie, parent_invs, tree):

254

"""Helper for record_entry_contents.

255

256

:param ie: An entry being added.

257

:param parent_invs: The inventories of the parent revisions of the

258

commit.

259

:param tree: The tree that is being committed.

260

"""

261

# In this revision format, root entries have no knit or weave When

262

# serializing out to disk and back in root.revision is always

263

# _new_revision_id

264

ie.revision = self._new_revision_id

265

266

def _require_root_change(self, tree):
    """Enforce an appropriate root object change.

    This is called once when record_iter_changes is called, if and only if
    the root was not in the delta calculated by record_iter_changes.

    Appends a delta item for the root directory, with its revision set to
    the new revision id, to the accumulated basis delta.

    :param tree: The tree which is being committed.
    """
    # NB: if there are no parents then this method is not called, so no
    # need to guard on parents having length.
    entry = entry_factory['directory'](tree.path2id(''), '',
                                       None)
    entry.revision = self._new_revision_id
    self._basis_delta.append(('', '', entry.file_id, entry))

def _get_delta(self, ie, basis_inv, path):

282

"""Get a delta against the basis inventory for ie."""

283

if ie.file_id not in basis_inv:

284

# add

285

result = (None, path, ie.file_id, ie)

286

self._basis_delta.append(result)

287

return result

288

elif ie != basis_inv[ie.file_id]:

289

# common but altered

290

# TODO: avoid tis id2path call.

291

result = (basis_inv.id2path(ie.file_id), path, ie.file_id, ie)

292

self._basis_delta.append(result)

293

return result

294

else:

295

# common, unaltered

296

return None

297

298

def get_basis_delta(self):
    """Return the complete inventory delta versus the basis inventory.

    This has been built up with the calls to record_delete and
    record_entry_contents. The client must have already called
    will_record_deletes() to indicate that they will be generating a
    complete delta.

    :return: An inventory delta, suitable for use with apply_delta, or
        Repository.add_inventory_by_delta, etc.
    :raises AssertionError: If will_record_deletes() has not been called.
    """
    if not self._recording_deletes:
        raise AssertionError("recording deletes not activated.")
    return self._basis_delta

def record_delete(self, path, file_id):
    """Record that a delete occurred against a basis tree.

    This is an optional API - when used it adds items to the basis_delta
    being accumulated by the commit builder. It cannot be called unless the
    method will_record_deletes() has been called to inform the builder that
    a delta is being supplied.

    :param path: The path of the thing deleted.
    :param file_id: The file id that was deleted.
    :return: The delta item that was recorded,
        (path, None, file_id, None).
    :raises AssertionError: If will_record_deletes() has not been called.
    """
    if not self._recording_deletes:
        raise AssertionError("recording deletes not activated.")
    delta = (path, None, file_id, None)
    self._basis_delta.append(delta)
    # A delete always counts as a change for any_changes().
    self._any_changes = True
    return delta

def will_record_deletes(self):
    """Tell the commit builder that deletes are being notified.

    This enables the accumulation of an inventory delta; for the resulting
    commit to be valid, deletes against the basis MUST be recorded via
    builder.record_delete().

    Also sets self.basis_delta_revision to the first parent, or to
    NULL_REVISION when there are no parents.
    """
    self._recording_deletes = True
    try:
        basis_id = self.parents[0]
    except IndexError:
        basis_id = _mod_revision.NULL_REVISION
    self.basis_delta_revision = basis_id

def record_entry_contents(self, ie, parent_invs, path, tree,
                          content_summary):
    """Record the content of ie from tree into the commit if needed.

    Side effect: sets ie.revision when unchanged

    :param ie: An inventory entry present in the commit.
    :param parent_invs: The inventories of the parent revisions of the
        commit.
    :param path: The path the entry is at in the tree.
    :param tree: The tree which contains this entry and should be used to
        obtain content.
    :param content_summary: Summary data from the tree about the paths
        content - stat, length, exec, sha/link target. This is only
        accessed when the entry has a revision of None - that is when it is
        a candidate to commit.
    :return: A tuple (change_delta, version_recorded, fs_hash).
        change_delta is an inventory_delta change for this entry against
        the basis tree of the commit, or None if no change occurred against
        the basis tree.
        version_recorded is True if a new version of the entry has been
        recorded. For instance, committing a merge where a file was only
        changed on the other side will return (delta, False, None).
        fs_hash is either None, or the hash details for the path (currently
        a tuple of the contents sha1 and the statvalue returned by
        tree.get_file_with_stat()).
    :raises errors.RootMissing: If the first entry recorded is not the
        root (it has a parent_id).
    :raises NotImplementedError: For a tree-reference when the repository
        format does not support them, or for an unknown kind.
    :raises AssertionError: If an entry that was not a candidate for
        committing already carries the new revision id, or a nested tree
        has no reference revision.
    :raises ValueError: If a file's executable flag in content_summary is
        None.
    """
    if self.new_inventory.root is None:
        if ie.parent_id is not None:
            raise errors.RootMissing()
        self._check_root(ie, parent_invs, tree)
    if ie.revision is None:
        kind = content_summary[0]
    else:
        # ie is carried over from a prior commit
        kind = ie.kind
    # XXX: repository specific check for nested tree support goes here - if
    # the repo doesn't want nested trees we skip it ?
    if (kind == 'tree-reference' and
            not self.repository._format.supports_tree_reference):
        # mismatch between commit builder logic and repository:
        # this needs the entry creation pushed down into the builder.
        raise NotImplementedError('Missing repository subtree support.')
    self.new_inventory.add(ie)

    # TODO: slow, take it out of the inner loop.
    try:
        basis_inv = parent_invs[0]
    except IndexError:
        basis_inv = Inventory(root_id=None)

    # ie.revision is always None if the InventoryEntry is considered
    # for committing. We may record the previous parents revision if the
    # content is actually unchanged against a sole head.
    if ie.revision is not None:
        if not self._versioned_root and path == '':
            # repositories that do not version the root set the root's
            # revision to the new commit even when no change occurs (more
            # specifically, they do not record a revision on the root; and
            # the rev id is assigned to the root during deserialisation -
            # this masks when a change may have occurred against the basis.
            # To match this we always issue a delta, because the revision
            # of the root will always be changing.
            if ie.file_id in basis_inv:
                delta = (basis_inv.id2path(ie.file_id), path,
                         ie.file_id, ie)
            else:
                # add
                delta = (None, path, ie.file_id, ie)
            self._basis_delta.append(delta)
            return delta, False, None
        else:
            # we don't need to commit this, because the caller already
            # determined that an existing revision of this file is
            # appropriate. If its not being considered for committing then
            # it and all its parents to the root must be unaltered so
            # no-change against the basis.
            if ie.revision == self._new_revision_id:
                # The arguments are interpolated with '%' so the message
                # is actually formatted.
                raise AssertionError("Impossible situation, a skipped "
                    "inventory entry (%r) claims to be modified in this "
                    "commit (%r)." % (ie, self._new_revision_id))
            return None, False, None
    # XXX: Friction: parent_candidates should return a list not a dict
    #      so that we don't have to walk the inventories again.
    parent_candidate_entries = ie.parent_candidates(parent_invs)
    head_set = self._heads(ie.file_id, parent_candidate_entries.keys())
    # Collect the heads in parent-inventory order, each one only once.
    heads = []
    for inv in parent_invs:
        if ie.file_id in inv:
            old_rev = inv[ie.file_id].revision
            if old_rev in head_set:
                heads.append(old_rev)
                head_set.remove(old_rev)

    store = False
    # now we check to see if we need to write a new record to the
    # file-graph.
    # We write a new entry unless there is one head to the ancestors, and
    # the kind-derived content is unchanged.

    # Cheapest check first: no ancestors, or more the one head in the
    # ancestors, we write a new node.
    if len(heads) != 1:
        store = True
    if not store:
        # There is a single head, look it up for comparison
        parent_entry = parent_candidate_entries[heads[0]]
        # if the non-content specific data has changed, we'll be writing a
        # node:
        if (parent_entry.parent_id != ie.parent_id or
                parent_entry.name != ie.name):
            store = True
    # now we need to do content specific checks:
    if not store:
        # if the kind changed the content obviously has
        if kind != parent_entry.kind:
            store = True
    # Stat cache fingerprint feedback for the caller - None as we usually
    # don't generate one.
    fingerprint = None
    if kind == 'file':
        if content_summary[2] is None:
            raise ValueError("Files must not have executable = None")
        if not store:
            # We can't trust a check of the file length because of content
            # filtering...
            if parent_entry.executable != content_summary[2]:
                # if the exec bit has changed we have to store:
                store = True
            elif parent_entry.text_sha1 == content_summary[3]:
                # all meta and content is unchanged (using a hash cache
                # hit to check the sha)
                ie.revision = parent_entry.revision
                ie.text_size = parent_entry.text_size
                ie.text_sha1 = parent_entry.text_sha1
                ie.executable = parent_entry.executable
                return self._get_delta(ie, basis_inv, path), False, None
            else:
                # Either there is only a hash change(no hash cache entry,
                # or same size content change), or there is no change on
                # this file at all.
                # Provide the parent's hash to the store layer, so that if
                # the content is unchanged we will not store a new node.
                nostore_sha = parent_entry.text_sha1
        if store:
            # We want to record a new node regardless of the presence or
            # absence of a content change in the file.
            nostore_sha = None
        ie.executable = content_summary[2]
        file_obj, stat_value = tree.get_file_with_stat(ie.file_id, path)
        try:
            text = file_obj.read()
        finally:
            file_obj.close()
        try:
            ie.text_sha1, ie.text_size = self._add_text_to_weave(
                ie.file_id, text, heads, nostore_sha)
            # Let the caller know we generated a stat fingerprint.
            fingerprint = (ie.text_sha1, stat_value)
        except errors.ExistingContent:
            # Turns out that the file content was unchanged, and we were
            # only going to store a new node if it was changed. Carry over
            # the entry.
            ie.revision = parent_entry.revision
            ie.text_size = parent_entry.text_size
            ie.text_sha1 = parent_entry.text_sha1
            ie.executable = parent_entry.executable
            return self._get_delta(ie, basis_inv, path), False, None
    elif kind == 'directory':
        if not store:
            # all data is meta here, nothing specific to directory, so
            # carry over:
            ie.revision = parent_entry.revision
            return self._get_delta(ie, basis_inv, path), False, None
        self._add_text_to_weave(ie.file_id, '', heads, None)
    elif kind == 'symlink':
        current_link_target = content_summary[3]
        if not store:
            # symlink target is not generic metadata, check if it has
            # changed.
            if current_link_target != parent_entry.symlink_target:
                store = True
        if not store:
            # unchanged, carry over.
            ie.revision = parent_entry.revision
            ie.symlink_target = parent_entry.symlink_target
            return self._get_delta(ie, basis_inv, path), False, None
        ie.symlink_target = current_link_target
        self._add_text_to_weave(ie.file_id, '', heads, None)
    elif kind == 'tree-reference':
        if not store:
            if content_summary[3] != parent_entry.reference_revision:
                store = True
        if not store:
            # unchanged, carry over.
            ie.reference_revision = parent_entry.reference_revision
            ie.revision = parent_entry.revision
            return self._get_delta(ie, basis_inv, path), False, None
        ie.reference_revision = content_summary[3]
        if ie.reference_revision is None:
            raise AssertionError("invalid content_summary for nested tree: %r"
                % (content_summary,))
        self._add_text_to_weave(ie.file_id, '', heads, None)
    else:
        raise NotImplementedError('unknown kind')
    ie.revision = self._new_revision_id
    self._any_changes = True
    return self._get_delta(ie, basis_inv, path), True, fingerprint

def record_iter_changes(self, tree, basis_revision_id, iter_changes,
    _entry_factory=entry_factory):
    """Record a new tree via iter_changes.

    This is a generator: the inventory delta is only accumulated in
    self._basis_delta as the generator is consumed.

    :param tree: The tree to obtain text contents from for changed objects.
    :param basis_revision_id: The revision id of the tree the iter_changes
        has been generated against. Currently assumed to be the same
        as self.parents[0] - if it is not, errors may occur.
    :param iter_changes: An iter_changes iterator with the changes to apply
        to basis_revision_id. The iterator must not include any items with
        a current kind of None - missing items must be either filtered out
        or errored-on before record_iter_changes sees the item.
    :param _entry_factory: Private method to bind entry_factory locally for
        performance.
    :return: A generator of (file_id, relpath, fs_hash) tuples for use with
        tree._observed_sha1.
    """
    # Create an inventory delta based on deltas between all the parents and
    # deltas between all the parent inventories. We use inventory deltas
    # between the inventory objects because iter_changes masks
    # last-changed-field only changes.
    # Working data:
    # file_id -> change map, change is fileid, paths, changed, versioneds,
    # parents, names, kinds, executables
    merged_ids = {}
    # {file_id -> revision_id -> inventory entry, for entries in parent
    # trees that are not parents[0]
    parent_entries = {}
    ghost_basis = False
    try:
        revtrees = list(self.repository.revision_trees(self.parents))
    except errors.NoSuchRevision:
        # one or more ghosts, slow path.
        revtrees = []
        for revision_id in self.parents:
            try:
                revtrees.append(self.repository.revision_tree(revision_id))
            except errors.NoSuchRevision:
                if not revtrees:
                    # The first parent itself is a ghost: treat the basis
                    # as the null revision.
                    basis_revision_id = _mod_revision.NULL_REVISION
                    ghost_basis = True
                # Every ghost parent is stood in for by the null tree.
                revtrees.append(self.repository.revision_tree(
                    _mod_revision.NULL_REVISION))
    # The basis inventory from a repository
    if revtrees:
        basis_inv = revtrees[0].inventory
    else:
        basis_inv = self.repository.revision_tree(
            _mod_revision.NULL_REVISION).inventory
    if len(self.parents) > 0:
        if basis_revision_id != self.parents[0] and not ghost_basis:
            raise Exception(
                "arbitrary basis parents not yet supported with merges")
        for revtree in revtrees[1:]:
            # Each delta item is (old_path, new_path, file_id, entry).
            for change in revtree.inventory._make_delta(basis_inv):
                if change[1] is None:
                    # Not present in this parent.
                    continue
                if change[2] not in merged_ids:
                    if change[0] is not None:
                        basis_entry = basis_inv[change[2]]
                        merged_ids[change[2]] = [
                            # basis revid
                            basis_entry.revision,
                            # new tree revid
                            change[3].revision]
                        parent_entries[change[2]] = {
                            # basis parent
                            basis_entry.revision:basis_entry,
                            # this parent
                            change[3].revision:change[3],
                            }
                    else:
                        merged_ids[change[2]] = [change[3].revision]
                        parent_entries[change[2]] = {change[3].revision:change[3]}
                else:
                    merged_ids[change[2]].append(change[3].revision)
                    parent_entries[change[2]][change[3].revision] = change[3]
    else:
        merged_ids = {}
    # Setup the changes from the tree:
    # changes maps file_id -> (change, [parent revision_ids])
    changes= {}
    for change in iter_changes:
        # This probably looks up in basis_inv way too much.
        if change[1][0] is not None:
            head_candidate = [basis_inv[change[0]].revision]
        else:
            head_candidate = []
        changes[change[0]] = change, merged_ids.get(change[0],
            head_candidate)
    unchanged_merged = set(merged_ids) - set(changes)
    # Extend the changes dict with synthetic changes to record merges of
    # texts.
    for file_id in unchanged_merged:
        # Record a merged version of these items that did not change vs the
        # basis. This can be either identical parallel changes, or a revert
        # of a specific file after a merge. The recorded content will be
        # that of the current tree (which is the same as the basis), but
        # the per-file graph will reflect a merge.
        # NB:XXX: We are reconstructing path information we had, this
        # should be preserved instead.
        # inv delta  change: (file_id, (path_in_source, path_in_target),
        #   changed_content, versioned, parent, name, kind,
        #   executable)
        try:
            basis_entry = basis_inv[file_id]
        except errors.NoSuchId:
            # a change from basis->some_parents but file_id isn't in basis
            # so was new in the merge, which means it must have changed
            # from basis -> current, and as it hasn't the add was reverted
            # by the user. So we discard this change.
            pass
        else:
            change = (file_id,
                (basis_inv.id2path(file_id), tree.id2path(file_id)),
                False, (True, True),
                (basis_entry.parent_id, basis_entry.parent_id),
                (basis_entry.name, basis_entry.name),
                (basis_entry.kind, basis_entry.kind),
                (basis_entry.executable, basis_entry.executable))
            changes[file_id] = (change, merged_ids[file_id])
    # changes contains tuples with the change and a set of inventory
    # candidates for the file.
    # inv delta is:
    # old_path, new_path, file_id, new_inventory_entry
    seen_root = False # Is the root in the basis delta?
    inv_delta = self._basis_delta
    modified_rev = self._new_revision_id
    for change, head_candidates in changes.values():
        if change[3][1]: # versioned in target.
            # Several things may be happening here:
            # We may have a fork in the per-file graph
            #  - record a change with the content from tree
            # We may have a change against < all trees
            #  - carry over the tree that hasn't changed
            # We may have a change against all trees
            #  - record the change with the content from tree
            kind = change[6][1]
            file_id = change[0]
            entry = _entry_factory[kind](file_id, change[5][1],
                change[4][1])
            head_set = self._heads(change[0], set(head_candidates))
            heads = []
            # Preserve ordering.
            for head_candidate in head_candidates:
                if head_candidate in head_set:
                    heads.append(head_candidate)
                    # Removing it means a repeated candidate is only
                    # recorded once.
                    head_set.remove(head_candidate)
            carried_over = False
            if len(heads) == 1:
                # Could be a carry-over situation:
                parent_entry_revs = parent_entries.get(file_id, None)
                if parent_entry_revs:
                    parent_entry = parent_entry_revs.get(heads[0], None)
                else:
                    parent_entry = None
                if parent_entry is None:
                    # The parent iter_changes was called against is the one
                    # that is the per-file head, so any change is relevant
                    # iter_changes is valid.
                    carry_over_possible = False
                else:
                    # could be a carry over situation
                    # A change against the basis may just indicate a merge,
                    # we need to check the content against the source of the
                    # merge to determine if it was changed after the merge
                    # or carried over.
                    if (parent_entry.kind != entry.kind or
                        parent_entry.parent_id != entry.parent_id or
                        parent_entry.name != entry.name):
                        # Metadata common to all entries has changed
                        # against per-file parent
                        carry_over_possible = False
                    else:
                        carry_over_possible = True
                    # per-type checks for changes against the parent_entry
                    # are done below.
            else:
                # Cannot be a carry-over situation
                carry_over_possible = False
            # Populate the entry in the delta
            if kind == 'file':
                # XXX: There is still a small race here: If someone reverts
                # the content of a file after iter_changes examines and
                # decides it has changed, we will unconditionally record a
                # new version even if some other process reverts it while
                # commit is running (with the revert happening after
                # iter_changes did its examination).
                if change[7][1]:
                    entry.executable = True
                else:
                    entry.executable = False
                if (carry_over_possible and
                    parent_entry.executable == entry.executable):
                    # Check the file length, content hash after reading
                    # the file.
                    nostore_sha = parent_entry.text_sha1
                else:
                    nostore_sha = None
                file_obj, stat_value = tree.get_file_with_stat(file_id, change[1][1])
                try:
                    text = file_obj.read()
                finally:
                    file_obj.close()
                try:
                    entry.text_sha1, entry.text_size = self._add_text_to_weave(
                        file_id, text, heads, nostore_sha)
                    yield file_id, change[1][1], (entry.text_sha1, stat_value)
                except errors.ExistingContent:
                    # No content change against a carry_over parent
                    # Perhaps this should also yield a fs hash update?
                    carried_over = True
                    entry.text_size = parent_entry.text_size
                    entry.text_sha1 = parent_entry.text_sha1
            elif kind == 'symlink':
                # Wants a path hint?
                entry.symlink_target = tree.get_symlink_target(file_id)
                if (carry_over_possible and
                    parent_entry.symlink_target == entry.symlink_target):
                    carried_over = True
                else:
                    self._add_text_to_weave(change[0], '', heads, None)
            elif kind == 'directory':
                if carry_over_possible:
                    carried_over = True
                else:
                    # Nothing to set on the entry.
                    # XXX: split into the Root and nonRoot versions.
                    if change[1][1] != '' or self.repository.supports_rich_root():
                        self._add_text_to_weave(change[0], '', heads, None)
            elif kind == 'tree-reference':
                if not self.repository._format.supports_tree_reference:
                    # This isn't quite sane as an error, but we shouldn't
                    # ever see this code path in practice: trees don't
                    # permit references when the repo doesn't support tree
                    # references.
                    raise errors.UnsupportedOperation(tree.add_reference,
                        self.repository)
                reference_revision = tree.get_reference_revision(change[0])
                entry.reference_revision = reference_revision
                if (carry_over_possible and
                    parent_entry.reference_revision == reference_revision):
                    carried_over = True
                else:
                    self._add_text_to_weave(change[0], '', heads, None)
            else:
                raise AssertionError('unknown kind %r' % kind)
            if not carried_over:
                entry.revision = modified_rev
            else:
                entry.revision = parent_entry.revision
        else:
            # Not versioned in the target: the delta records a removal.
            entry = None
        new_path = change[1][1]
        inv_delta.append((change[1][0], new_path, change[0], entry))
        if new_path == '':
            seen_root = True
    self.new_inventory = None
    if len(inv_delta):
        # This should perhaps be guarded by a check that the basis we
        # commit against is the basis for the commit and if not do a delta
        # against the basis.
        self._any_changes = True
    if not seen_root:
        # housekeeping root entry changes do not affect no-change commits.
        self._require_root_change(tree)
    self.basis_delta_revision = basis_revision_id

822

823

def _add_text_to_weave(self, file_id, new_text, parents, nostore_sha):
    """Add new_text to the repository's texts for file_id.

    The text is stored under the key (file_id, self._new_revision_id) with
    one (file_id, parent) parent key for each item of parents.

    :return: The first two items of the value returned by
        self.repository.texts._add_text.
    """
    parent_keys = tuple((file_id, parent_rev) for parent_rev in parents)
    text_key = (file_id, self._new_revision_id)
    add_result = self.repository.texts._add_text(
        text_key, parent_keys, new_text,
        nostore_sha=nostore_sha, random_id=self.random_revid)
    return add_result[0:2]

828

829

830

class RootCommitBuilder(CommitBuilder):
    """A commit builder that actually records the root id."""

    # This builder versions the root entry properly.
    _versioned_root = True

    def _check_root(self, ie, parent_invs, tree):
        """Helper for record_entry_contents; does nothing in this builder.

        :param ie: An entry being added.
        :param parent_invs: The inventories of the parent revisions of the
            commit.
        :param tree: The tree that is being committed.
        """
        return None

    def _require_root_change(self, tree):
        """Enforce an appropriate root object change.

        Called once from record_iter_changes, if and only if the root was
        not in the delta calculated by record_iter_changes.

        :param tree: The tree which is being committed.
        """
        # versioned roots do not change unless the tree found a change, so
        # there is nothing to do here.
        return None

854

855

856

######################################################################

857

# Repositories

858

859

860

class Repository(_RelockDebugMixin):

861

"""Repository holding history for one or more branches.

862

863

The repository holds and retrieves historical information including

864

revisions and file history. It's normally accessed only by the Branch,

865

which views a particular line of development through that history.

866

867

The Repository builds on top of some byte storage facilities (the revisions,

868

signatures, inventories, texts and chk_bytes attributes) and a Transport,

869

which respectively provide byte storage and a means to access the (possibly

870

remote) disk.

871

872

The byte storage facilities are addressed via tuples, which we refer to

873

as 'keys' throughout the code base. Revision_keys, inventory_keys and

874

signature_keys are all 1-tuples: (revision_id,). text_keys are two-tuples:

875

(file_id, revision_id). chk_bytes uses CHK keys - a 1-tuple with a single

876

byte string made up of a hash identifier and a hash value.

877

We use this interface because it allows low friction with the underlying

878

code that implements disk indices, network encoding and other parts of

879

bzrlib.

880

881

:ivar revisions: A bzrlib.versionedfile.VersionedFiles instance containing

882

the serialised revisions for the repository. This can be used to obtain

883

revision graph information or to access raw serialised revisions.

884

The result of trying to insert data into the repository via this store

885

is undefined: it should be considered read-only except for implementors

886

of repositories.

887

:ivar signatures: A bzrlib.versionedfile.VersionedFiles instance containing

888

the serialised signatures for the repository. This can be used to

889

obtain access to raw serialised signatures. The result of trying to

890

insert data into the repository via this store is undefined: it should

891

be considered read-only except for implementors of repositories.

892

:ivar inventories: A bzrlib.versionedfile.VersionedFiles instance containing

893

the serialised inventories for the repository. This can be used to

894

obtain unserialised inventories. The result of trying to insert data

895

into the repository via this store is undefined: it should be

896

considered read-only except for implementors of repositories.

897

:ivar texts: A bzrlib.versionedfile.VersionedFiles instance containing the

898

texts of files and directories for the repository. This can be used to

899

obtain file texts or file graphs. Note that Repository.iter_file_bytes

900

is usually a better interface for accessing file texts.

901

The result of trying to insert data into the repository via this store

902

is undefined: it should be considered read-only except for implementors

903

of repositories.

904

:ivar chk_bytes: A bzrlib.versionedfile.VersionedFiles instance containing

905

any data the repository chooses to store or have indexed by its hash.

906

The result of trying to insert data into the repository via this store

907

is undefined: it should be considered read-only except for implementors

908

of repositories.

909

:ivar _transport: Transport for file access to repository, typically

910

pointing to .bzr/repository.

911

"""

912

913

# What class to use for a CommitBuilder. Often it's simpler to change this

914

# in a Repository class subclass rather than to override

915

# get_commit_builder.

916

_commit_builder_class = CommitBuilder

917

# The search regex used by xml based repositories to determine what things

918

# were changed in a single commit.

919

_file_ids_altered_regex = lazy_regex.lazy_compile(

920

r'file_id="(?P<file_id>[^"]+)"'

921

r'.* revision="(?P<revision_id>[^"]+)"'

922

)

923

924

def abort_write_group(self, suppress_errors=False):
    """Abort the current write group.

    Verifies that the write group belongs to the current transaction,
    calls the _abort_write_group template method and then clears
    self._write_group.

    :param suppress_errors: if true, abort_write_group will catch and log
        unexpected errors that happen during the abort, rather than
        allowing them to propagate.  Defaults to False.
    :raises errors.BzrError: if the write group does not match the current
        transaction and suppress_errors is false.

    :seealso: start_write_group.
    """
    if self._write_group is not self.get_transaction():
        # has an unlock or relock occurred ?
        if suppress_errors:
            # Only log the mismatch; note that self._write_group is left
            # untouched on this path.
            mutter(
            '(suppressed) mismatched lock context and write group. %r, %r',
            self._write_group, self.get_transaction())
            return
        raise errors.BzrError(
            'mismatched lock context and write group. %r, %r' %
            (self._write_group, self.get_transaction()))
    try:
        self._abort_write_group()
    except Exception, exc:
        # The write group is considered finished even if the cleanup
        # itself failed.
        self._write_group = None
        if not suppress_errors:
            raise
        mutter('abort_write_group failed')
        log_exception_quietly()
        note('bzr: ERROR (ignored): %s', exc)
    self._write_group = None

953

954

def _abort_write_group(self):
    """Template method for per-repository write group cleanup.

    Called during abort, before the write group is considered finished.
    Implementations should clean up any internal state accrued during the
    write group. This is not a rollback: there is no requirement that data
    handed to the repository be *not* made available, but equally no
    attempt should be made to ensure that added data is fully committed.
    Abort is invoked when an error has occurred, so further disk or network
    operations may not be possible or may error, and if possible should
    not be attempted.

    The base implementation does nothing.
    """
    return None

966

967

def add_fallback_repository(self, repository):
    """Add a repository to use for looking up data not held locally.

    :param repository: A repository.
    :raises errors.UnstackableRepositoryFormat: if this repository's format
        does not support external lookups.

    Any error raised by _check_fallback_repository propagates; in that
    case the fallback is not added and any read lock taken on it here is
    released again.
    """
    if not self._format.supports_external_lookups:
        raise errors.UnstackableRepositoryFormat(self._format, self.base)
    locked_fallback = self.is_locked()
    if locked_fallback:
        # This repository will call fallback.unlock() when we transition to
        # the unlocked state, so we make sure to increment the lock count
        repository.lock_read()
    try:
        self._check_fallback_repository(repository)
    except:
        # The fallback was rejected, so it never reaches
        # _fallback_repositories and nothing would unlock it later:
        # release the lock taken above before re-raising.
        if locked_fallback:
            repository.unlock()
        raise
    self._fallback_repositories.append(repository)
    self.texts.add_fallback_versioned_files(repository.texts)
    self.inventories.add_fallback_versioned_files(repository.inventories)
    self.revisions.add_fallback_versioned_files(repository.revisions)
    self.signatures.add_fallback_versioned_files(repository.signatures)
    if self.chk_bytes is not None:
        self.chk_bytes.add_fallback_versioned_files(repository.chk_bytes)

986

987

def _check_fallback_repository(self, repository):
    """Check that this repository can safely fall back to repository.

    Delegates to InterRepository._assert_same_model and returns its
    result; an error is raised if the check fails.

    :param repository: A repository to fallback to.
    """
    check_result = InterRepository._assert_same_model(self, repository)
    return check_result

995

996

def add_inventory(self, revision_id, inv, parents):
    """Add the inventory inv to the repository as revision_id.

    :param revision_id: The revision id to store the inventory under.
    :param inv: The inventory to add; its revision_id must be None or
        equal to revision_id, and it must have a root.
    :param parents: The revision ids of the parents that revision_id
        is known to have and are in the repository already.

    :returns: The validator(which is a sha1 digest, though what is sha'd is
        repository format specific) of the serialized inventory.
    :raises AssertionError: if not in a write group, on a revision id
        mismatch, or if the inventory has no root.
    """
    if not self.is_in_write_group():
        raise AssertionError("%r not in write group" % (self,))
    _mod_revision.check_not_reserved_id(revision_id)
    if inv.revision_id is not None and inv.revision_id != revision_id:
        raise AssertionError(
            "Mismatch between inventory revision"
            " id and insertion revid (%r, %r)"
            % (inv.revision_id, revision_id))
    if inv.root is None:
        raise AssertionError()
    validator = self._add_inventory_checked(revision_id, inv, parents)
    return validator

1016

1017

def _add_inventory_checked(self, revision_id, inv, parents):
    """Add inv to the repository; the inputs have already been checked.

    Subclasses can override this to support different inventory styles.

    :seealso: add_inventory, for the contract.
    """
    serialised_lines = self._serialise_inventory_to_lines(inv)
    return self._inventory_add_lines(
        revision_id, parents, serialised_lines, check_content=False)

1027

1028

def add_inventory_by_delta(self, basis_revision_id, delta, new_revision_id,
                           parents, basis_inv=None, propagate_caches=False):
    """Add a new inventory expressed as a delta against another revision.

    See the inventory developers documentation for the theory behind
    inventory deltas.

    :param basis_revision_id: The inventory id the delta was created
        against. (This does not have to be a direct parent.)
    :param delta: The inventory delta (see Inventory.apply_delta for
        details).
    :param new_revision_id: The revision id that the inventory is being
        added for.
    :param parents: The revision ids of the parents that revision_id is
        known to have and are in the repository already. These are supplied
        for repositories that depend on the inventory graph for revision
        graph access, as well as for those that pun ancestry with delta
        compression.
    :param basis_inv: The basis inventory if it is already known,
        otherwise None.
    :param propagate_caches: If True, the caches for this inventory are
        copied to and updated for the result if possible. (Not consulted
        by this implementation.)

    :returns: (validator, new_inv)
        The validator(which is a sha1 digest, though what is sha'd is
        repository format specific) of the serialized inventory, and the
        resulting inventory.
    """
    if not self.is_in_write_group():
        raise AssertionError("%r not in write group" % (self,))
    _mod_revision.check_not_reserved_id(new_revision_id)
    basis_tree = self.revision_tree(basis_revision_id)
    basis_tree.lock_read()
    try:
        # Note that this mutates the inventory of basis_tree, which not all
        # inventory implementations may support: A better idiom would be to
        # return a new inventory, but as there is no revision tree cache in
        # repository this is safe for now - RBC 20081013
        if basis_inv is None:
            basis_inv = basis_tree.inventory
        basis_inv.apply_delta(delta)
        basis_inv.revision_id = new_revision_id
        validator = self.add_inventory(new_revision_id, basis_inv, parents)
        return (validator, basis_inv)
    finally:
        basis_tree.unlock()

1074

1075

def _inventory_add_lines(self, revision_id, parents, lines,
    check_content=True):
    """Store lines in self.inventories and return the sha1 of the inventory.

    The inventory is keyed by (revision_id,) and each parent by (parent,);
    the store's _access is flushed before returning.
    """
    parent_keys = [(parent_id,) for parent_id in parents]
    add_result = self.inventories.add_lines(
        (revision_id,), parent_keys, lines, check_content=check_content)
    sha1 = add_result[0]
    self.inventories._access.flush()
    return sha1

1083

1084

def add_revision(self, revision_id, rev, inv=None, config=None):
    """Add rev to the revision store as revision_id.

    :param revision_id: the revision id to use.
    :param rev: The revision object.
    :param inv: The inventory for the revision. if None, it will be looked
        up in the inventory storer
    :param config: If None no digital signature will be created.
        If supplied its signature_needed method will be used
        to determine if a signature should be made.
    """
    # TODO: jam 20070210 Shouldn't we check rev.revision_id and
    #       rev.parent_ids?
    _mod_revision.check_not_reserved_id(revision_id)
    if config is not None and config.signature_needed():
        if inv is None:
            inv = self.get_inventory(revision_id)
        plaintext = Testament(rev, inv).as_short_text()
        self.store_revision_signature(
            gpg.GPGStrategy(config), plaintext, revision_id)
    # check inventory present
    inventory_key = (revision_id,)
    if self.inventories.get_parent_map([inventory_key]):
        # Already stored: just record its sha1 on the revision.
        stored_sha1s = self.inventories.get_sha1s([inventory_key])
        rev.inventory_sha1 = stored_sha1s[inventory_key]
    elif inv is None:
        raise errors.WeaveRevisionNotPresent(revision_id,
                                             self.inventories)
    else:
        # yes, this is not suitable for adding with ghosts.
        rev.inventory_sha1 = self.add_inventory(revision_id, inv,
                                                rev.parent_ids)
    self._add_revision(rev)

1117

1118

def _add_revision(self, revision):
    """Serialise revision and store it in self.revisions.

    The revision is keyed by (revision.revision_id,) with one (parent,)
    key per entry of revision.parent_ids.
    """
    serialised = self._serializer.write_revision_to_string(revision)
    revision_key = (revision.revision_id,)
    parent_keys = tuple([(parent_id,) for parent_id in revision.parent_ids])
    self.revisions.add_lines(
        revision_key, parent_keys, osutils.split_lines(serialised))

1123

1124

def all_revision_ids(self):
    """Returns a list of all the revision ids in the repository.

    This is conceptually deprecated because code should generally work on
    the graph reachable from a particular revision, and ignore any other
    revisions that might be present.  There is no direct replacement
    method.

    When the 'evil' debug flag is set the call site is logged.
    """
    evil_debugging = 'evil' in debug.debug_flags
    if evil_debugging:
        mutter_callsite(2, "all_revision_ids is linear with history.")
    revision_ids = self._all_revision_ids()
    return revision_ids

1135

1136

def _all_revision_ids(self):
    """Returns a list of all the revision ids in the repository.

    These are in as much topological order as the underlying store can
    present.

    The base class has no implementation and raises NotImplementedError.
    """
    unimplemented = self._all_revision_ids
    raise NotImplementedError(unimplemented)

1143

1144

def break_lock(self):
    """Break a lock if one is present from another instance.

    Uses the ui factory to ask for confirmation if the lock may be from
    an active process.

    The work is delegated to self.control_files.break_lock().
    """
    control = self.control_files
    control.break_lock()

1151

1152

@needs_read_lock
def _eliminate_revisions_not_present(self, revision_ids):
    """Check every revision id in revision_ids to see if we have it.

    :param revision_ids: The revision ids to look up in this repository's
        graph.
    :return: The keys of the graph's parent map for revision_ids, i.e. the
        revision ids the graph knows about. This is a list (dict.keys()),
        not a set.
    """
    parent_map = self.get_graph().get_parent_map(revision_ids)
    # The old API returned a list, should this actually be a set?
    return parent_map.keys()

1163

1164

def _check_inventories(self, checker):
    """Check the inventories found from the revision scan.

    This is responsible for verifying the sha1 of inventories and
    creating a pending_keys set that covers data referenced by inventories.

    The work is done by _do_check_inventories under a nested progress bar,
    which is always finished afterwards.
    """
    progress = ui.ui_factory.nested_progress_bar()
    try:
        self._do_check_inventories(checker, progress)
    finally:
        progress.finished()

1175

1176

def _do_check_inventories(self, checker, bar):
    """Helper for _check_inventories.

    Drains checker.pending_keys, checking inventories first and then
    repeatedly checking whatever chk_bytes/texts keys become pending.
    Problems are appended to checker._report_items.

    :param checker: Object providing pending_keys (a dict keyed by
        (kind,) + key tuples) and a _report_items list.
    :param bar: Progress bar; only its update() method is used.
    """
    keys = {'chk_bytes':set(), 'inventories':set(), 'texts':set()}
    kinds = ['chk_bytes', 'texts']
    bar.update("inventories", 0, 2)
    current_keys = checker.pending_keys
    checker.pending_keys = {}
    # Accumulate current checks.
    for key in current_keys:
        if key[0] != 'inventories' and key[0] not in kinds:
            checker._report_items.append('unknown key type %r' % (key,))
            # There is no bucket for an unknown kind; skip it rather than
            # failing with a KeyError right after reporting it.
            continue
        keys[key[0]].add(key[1:])
    if keys['inventories']:
        # NB: output order *should* be roughly sorted - topo or
        # inverse topo depending on repository - either way decent
        # to just delta against. However, pre-CHK formats didn't
        # try to optimise inventory layout on disk. As such the
        # pre-CHK code path does not use inventory deltas.
        last_object = None
        for record in self.inventories.check(keys=keys['inventories']):
            if record.storage_kind == 'absent':
                checker._report_items.append(
                    'Missing inventory {%s}' % (record.key,))
            else:
                last_object = self._check_record('inventories', record,
                    checker, last_object,
                    current_keys[('inventories',) + record.key])
        del keys['inventories']
    else:
        return
    bar.update("texts", 1)
    while (checker.pending_keys or keys['chk_bytes']
        or keys['texts']):
        # Something to check.
        current_keys = checker.pending_keys
        checker.pending_keys = {}
        # Accumulate current checks.
        for key in current_keys:
            if key[0] not in kinds:
                checker._report_items.append('unknown key type %r' % (key,))
                # As above: nothing can be accumulated for this kind (the
                # 'inventories' bucket has been deleted by now).
                continue
            keys[key[0]].add(key[1:])
        # Check the outermost kind only - inventories || chk_bytes || texts
        for kind in kinds:
            if keys[kind]:
                last_object = None
                for record in getattr(self, kind).check(keys=keys[kind]):
                    if record.storage_kind == 'absent':
                        checker._report_items.append(
                            'Missing %s {%s}' % (kind, record.key,))
                    else:
                        # NOTE(review): item data is looked up in the
                        # current batch only; keys accumulated in an
                        # earlier batch would not be found - confirm.
                        last_object = self._check_record(kind, record,
                            checker, last_object, current_keys[(kind,) + record.key])
                keys[kind] = set()
                break

1232

1233

def _check_record(self, kind, record, checker, last_object, item_data):
    """Check a single record of the given kind from this repository.

    :param kind: 'inventories', 'chk_bytes' or 'texts'; anything else is
        reported to checker._report_items as an unknown key type.
    :param record: The record to check.
    :param checker: The checker collecting reports.
    :param last_object: For inventories, the previously checked inventory
        (or None); when given only the delta against it is checked.
    :param item_data: Passed through to _check_text for texts.
    :return: The deserialised inventory when kind is 'inventories' and the
        format has fast_deltas, otherwise None.
    """
    if kind == 'texts':
        self._check_text(record, checker, item_data)
        return None
    if kind == 'chk_bytes':
        # No code written to check chk_bytes for this repo format.
        checker._report_items.append(
            'unsupported key type chk_bytes for %s' % (record.key,))
        return None
    if kind != 'inventories':
        checker._report_items.append(
            'unknown key type %s for %s' % (kind, record.key))
        return None
    rev_id = record.key[0]
    inv = self.deserialise_inventory(rev_id,
        record.get_bytes_as('fulltext'))
    if last_object is None:
        # Nothing to delta against: check every entry.
        for path, ie in inv.iter_entries():
            ie.check(checker, rev_id, inv)
    else:
        for old_path, path, file_id, ie in inv._make_delta(last_object):
            if ie is not None:
                ie.check(checker, rev_id, inv)
    if self._format.fast_deltas:
        return inv
    return None

1259

1260

def _check_text(self, record, checker, item_data):
    """Check a single text.

    Extracts the record's content, computes its sha1 and, when item_data
    is supplied, reports a mismatch against item_data[1] to
    checker._report_items.
    """
    # Check it is extractable.
    # TODO: check length.
    storage_kind = record.storage_kind
    if storage_kind == 'chunked':
        chunks = record.get_bytes_as(storage_kind)
        sha1 = osutils.sha_strings(chunks)
        length = sum(map(len, chunks))
    else:
        content = record.get_bytes_as('fulltext')
        sha1 = osutils.sha_string(content)
        length = len(content)
    if not item_data or sha1 == item_data[1]:
        return
    checker._report_items.append(
        'sha1 mismatch: %s has sha1 %s expected %s referenced by %s' %
        (record.key, sha1, item_data[1], item_data[2]))

1276

1277

@staticmethod
def create(a_bzrdir):
    """Construct the current default format repository in a_bzrdir.

    :return: The result of initializing the default RepositoryFormat in
        a_bzrdir.
    """
    default_format = RepositoryFormat.get_default_format()
    return default_format.initialize(a_bzrdir)

1281

1282

def __init__(self, _format, a_bzrdir, control_files):
    """Instantiate a Repository.

    :param _format: The format of the repository on disk.
    :param a_bzrdir: The BzrDir of the repository.
    :param control_files: The control files object; its _transport
        becomes this repository's transport.

    In the future we will have a single api for all stores for
    getting file texts, inventories and revisions, then
    this construct will accept instances of those things.
    """
    super(Repository, self).__init__()
    self._format = _format
    # Public API attributes of Repository:
    self.bzrdir = a_bzrdir
    self.control_files = control_files
    transport = control_files._transport
    self._transport = transport
    self.base = transport.base
    # Flags consulted by tests.
    self._reconcile_does_inventory_gc = True
    self._reconcile_fixes_text_parents = False
    self._reconcile_backsup_inventory = True
    # not right yet - should be more semantically clear ?

    # TODO: make sure to construct the right store classes, etc, depending
    # on whether escaping is required.
    self._warn_if_deprecated()
    # No write group is open initially.
    self._write_group = None
    # Additional places to query for data.
    self._fallback_repositories = []
    # An InventoryEntry cache, used during deserialization
    self._inventory_entry_cache = fifo_cache.FIFOCache(10*1024)

1313

1314

def __repr__(self):

1315

if self._fallback_repositories:

1316

return '%s(%r, fallback_repositories=%r)' % (

1317

self.__class__.__name__,

1318

self.base,

1319

self._fallback_repositories)

1320

else:

1321

return '%s(%r)' % (self.__class__.__name__,

1322

self.base)

1323

1324

def _has_same_fallbacks(self, other_repo):

1325

"""Returns true if the repositories have the same fallbacks."""

1326

my_fb = self._fallback_repositories

1327

other_fb = other_repo._fallback_repositories

1328

if len(my_fb) != len(other_fb):

1329

return False

1330

for f, g in zip(my_fb, other_fb):

1331

if not f.has_same_location(g):

1332

return False

1333

return True

1334

1335

def has_same_location(self, other):
    """Return True if other is at the same location as this repository.

    Two repositories match when they are of exactly the same class and
    their transports have equal ``base`` values.

    This might return False even when two repository objects are accessing
    the same physical repository via different URLs.
    """
    if self.__class__ is other.__class__:
        return (self._transport.base == other._transport.base)
    return False

1345

1346

def is_in_write_group(self):
    """Report whether a write group is currently open.

    :seealso: start_write_group.
    """
    return not (self._write_group is None)

1352

1353

def is_locked(self):
    """Return the lock state reported by the control files."""
    control_files = self.control_files
    return control_files.is_locked()

1355

1356

def is_write_locked(self):
    """Return True if this object is write locked.

    That is: it is locked, and the control files' lock mode is 'w'.
    """
    locked = self.is_locked()
    if not locked:
        # Hand back the falsy is_locked() result unchanged.
        return locked
    return self.control_files._lock_mode == 'w'

1359

1360

def lock_write(self, token=None):
    """Lock this repository for writing.

    This causes caching within the repository object to start accumulating
    data during reads, and allows a 'write_group' to be obtained. Write
    groups must be used for actual data insertion.

    When the repository was not already locked, the lock is noted, each
    fallback repository is read locked and cached data is refreshed.

    :param token: if this is already locked, then lock_write will fail
        unless the token matches the existing lock.
    :returns: a token if this instance supports tokens, otherwise None.
    :raises TokenLockingNotSupported: when a token is given but this
        instance doesn't support using token locks.
    :raises MismatchedToken: if the specified token doesn't match the token
        of the existing lock.
    :seealso: start_write_group.

    A token should be passed in if you know that you have locked the object
    some other way, and need to synchronise this object's state with that
    fact.

    XXX: this docstring is duplicated in many places, e.g. lockable_files.py
    """
    already_locked = self.is_locked()
    lock_token = self.control_files.lock_write(token=token)
    if already_locked:
        return lock_token
    self._note_lock('w')
    for fallback in self._fallback_repositories:
        # Writes don't affect fallback repos
        fallback.lock_read()
    self._refresh_data()
    return lock_token

1391

1392

def lock_read(self):
    """Lock this repository for reading.

    When the repository was not already locked, the lock is noted, each
    fallback repository is read locked too and cached data is refreshed.
    """
    already_locked = self.is_locked()
    self.control_files.lock_read()
    if already_locked:
        return
    self._note_lock('r')
    for fallback in self._fallback_repositories:
        fallback.lock_read()
    self._refresh_data()

1400

1401

def get_physical_lock_status(self):
    """Return the physical lock status reported by the control files."""
    control_files = self.control_files
    return control_files.get_physical_lock_status()

1403

1404

def leave_lock_in_place(self):
    """Tell this repository not to release the physical lock when this
    object is unlocked.

    The request is forwarded to the control files.

    If lock_write doesn't return a token, then this method is not supported.
    """
    control_files = self.control_files
    control_files.leave_in_place()

1411

1412

def dont_leave_lock_in_place(self):
    """Tell this repository to release the physical lock when this
    object is unlocked, even if it didn't originally acquire it.

    The request is forwarded to the control files.

    If lock_write doesn't return a token, then this method is not supported.
    """
    control_files = self.control_files
    control_files.dont_leave_in_place()

1419

1420

@needs_read_lock
def gather_stats(self, revid=None, committers=None):
    """Gather statistics from a revision id.

    :param revid: The revision id to gather statistics from, if None, then
        no revision specific statistics are gathered.
    :param committers: Optional parameter controlling whether to grab
        a count of committers from the revision specific statistics.
    :return: A dictionary of statistics. Currently this contains:
        committers: The number of committers if requested.
        firstrev: A tuple with timestamp, timezone for the first revision
            read from the ancestry of revid, if revid is not the
            NULL_REVISION.
        latestrev: A tuple with timestamp, timezone for the last revision
            read from the ancestry of revid, if revid is not the
            NULL_REVISION.
        revisions: The total revision count in the repository; only
            present when the bzrdir's root transport is listable.
        (A 'size' entry is not currently filled in.)
    """
    stats = {}
    if revid and committers:
        stats['committers'] = 0
    if revid and revid != _mod_revision.NULL_REVISION:
        if committers:
            committer_names = set()
        ancestry = self.get_ancestry(revid)
        # pop the leading None
        ancestry.pop(0)
        oldest = None
        if not committers:
            # Only the two ends matter when committers are not counted,
            # so skip reading everything in between.
            ancestry = ancestry[0], ancestry[-1]
        for rev in self.get_revisions(ancestry):
            if not oldest:
                oldest = rev
            if committers:
                committer_names.add(rev.committer)
        newest = rev
        if committers:
            stats['committers'] = len(committer_names)
        stats['firstrev'] = (oldest.timestamp, oldest.timezone)
        stats['latestrev'] = (newest.timestamp, newest.timezone)

    # now gather global repository information
    # XXX: This is available for many repos regardless of listability.
    if self.bzrdir.root_transport.listable():
        # XXX: do we want to __define len__() ?
        # Maybe the versionedfiles object should provide a different
        # method to get the number of keys.
        stats['revisions'] = len(self.revisions.keys())
        # result['size'] = t
    return stats

1472

1473

def find_branches(self, using=False):
    """Find branches underneath this repository.

    This will include branches inside other branches.

    :param using: If True, list only branches using this repository.
    :return: A list of the branches found.
    """
    if using and not self.is_shared():
        # An unshared repository can only be used by the branch, if any,
        # in its own bzrdir.
        try:
            return [self.bzrdir.open_branch()]
        except errors.NotBranchError:
            return []

    class Evaluator(object):
        """Callable passed to find_bzrdirs as ``evaluate``.

        Returns a (flag, (branch, repository)) pair for each bzrdir.
        """

        def __init__(self):
            self.first_call = True

        def __call__(self, bzrdir):
            # On the first call, the parameter is always the bzrdir
            # containing the current repo.
            if not self.first_call:
                try:
                    repository = bzrdir.open_repository()
                except errors.NoRepositoryPresent:
                    pass
                else:
                    # Another repository lives here: report it with a
                    # False flag.
                    return False, (None, repository)
            self.first_call = False
            try:
                value = (bzrdir.open_branch(), None)
            except errors.NotBranchError:
                value = (None, None)
            return True, value

    found = []
    candidates = bzrdir.BzrDir.find_bzrdirs(
        self.bzrdir.root_transport, evaluate=Evaluator())
    for branch, repository in candidates:
        if branch is not None:
            found.append(branch)
        if not using and repository is not None:
            found.extend(repository.find_branches())
    return found

1515

1516

@needs_read_lock
def search_missing_revision_ids(self, other, revision_id=None,
                                find_ghosts=True):
    """Return the revision ids that other has that this does not.

    These are returned in topological order.

    revision_id: only return revision ids included by revision_id.

    The search is delegated to the InterRepository obtained for
    (other, self).
    """
    inter = InterRepository.get(other, self)
    return inter.search_missing_revision_ids(revision_id, find_ghosts)

1526

1527

@staticmethod
def open(base):
    """Open the repository rooted at base.

    For instance, if the repository is at URL/.bzr/repository,
    Repository.open(URL) -> a Repository instance.
    """
    return bzrdir.BzrDir.open(base).open_repository()

1536

1537

def copy_content_into(self, destination, revision_id=None):
    """Make a complete copy of the content in self into destination.

    This is a destructive operation! Do not use it on existing
    repositories.

    The copy is delegated to the InterRepository obtained for
    (self, destination), and its result is returned.
    """
    inter = InterRepository.get(self, destination)
    return inter.copy_content(revision_id)

1544

1545

def commit_write_group(self):
    """Commit the contents accrued within the current write group.

    :seealso: start_write_group.

    :return: it may return an opaque hint that can be passed to 'pack'.
    :raises BzrError: if the recorded write group is not the current
        transaction.
    """
    if self._write_group is not self.get_transaction():
        # has an unlock or relock occurred ?
        message = ('mismatched lock context %r and '
                   'write group %r.' %
                   (self.get_transaction(), self._write_group))
        raise errors.BzrError(message)
    hint = self._commit_write_group()
    self._write_group = None
    return hint

1560

1561

def _commit_write_group(self):

1562

"""Template method for per-repository write group cleanup.

1563

1564

This is called before the write group is considered to be

1565

finished and should ensure that all data handed to the repository

1566

for writing during the write group is safely committed (to the

1567

extent possible considering file system caching etc).

1568

"""

1569

1570

def suspend_write_group(self):
    """Always raise UnsuspendableWriteGroup in this implementation.

    :raises UnsuspendableWriteGroup: unconditionally.
    """
    raise errors.UnsuspendableWriteGroup(self)

1572

1573

def get_missing_parent_inventories(self, check_for_missing_texts=True):
    """Return the keys of missing inventory parents for revisions added in
    this write group.

    A revision is not complete if the inventory delta for that revision
    cannot be calculated. Therefore if the parent inventories of a
    revision are not present, the revision is incomplete, and e.g. cannot
    be streamed by a smart server. This method finds missing inventory
    parents for revisions added in this write group.

    :param check_for_missing_texts: If True (the default), missing parent
        inventories are only reported when some text referenced by the
        referring revisions is also missing. If False, every missing
        parent inventory is reported.
    :return: A set of ('inventories', revision_id) keys; empty when the
        format does not support external lookups or nothing is missing.
    :raises AssertionError: if the format supports external lookups and
        no write group is open.
    """
    if not self._format.supports_external_lookups:
        # This is only an issue for stacked repositories
        return set()
    if not self.is_in_write_group():
        raise AssertionError('not in a write group')

    # XXX: We assume that every added revision already has its
    # corresponding inventory, so we only check for parent inventories that
    # might be missing, rather than all inventories.
    parents = set(self.revisions._index.get_missing_parents())
    # The entries are keys, i.e. 1-tuples of revision id (they are
    # unpacked as ``(rev_id,)`` below), so the null revision must be
    # discarded in key form. The bare id is discarded too, as the original
    # code did, in case an index ever reports it that way.
    parents.discard((_mod_revision.NULL_REVISION,))
    parents.discard(_mod_revision.NULL_REVISION)
    unstacked_inventories = self.inventories._index
    present_inventories = unstacked_inventories.get_parent_map(
        key[-1:] for key in parents)
    parents.difference_update(present_inventories)
    if not parents:
        # No missing parent inventories.
        return set()
    if not check_for_missing_texts:
        return set(('inventories', rev_id) for (rev_id,) in parents)
    # Ok, now we have a list of missing inventories. But these only matter
    # if the inventories that reference them are missing some texts they
    # appear to introduce.
    # XXX: Texts referenced by all added inventories need to be present,
    # but at the moment we're only checking for texts referenced by
    # inventories at the graph's edge.
    key_deps = self.revisions._index._key_dependencies
    key_deps.satisfy_refs_for_keys(present_inventories)
    referrers = frozenset(r[0] for r in key_deps.get_referrers())
    file_ids = self.fileids_altered_by_revision_ids(referrers)
    missing_texts = set()
    for file_id, version_ids in file_ids.iteritems():
        missing_texts.update(
            (file_id, version_id) for version_id in version_ids)
    present_texts = self.texts.get_parent_map(missing_texts)
    missing_texts.difference_update(present_texts)
    if not missing_texts:
        # No texts are missing, so all revisions and their deltas are
        # reconstructable.
        return set()
    # Alternatively the text versions could be returned as the missing
    # keys, but this is likely to be less data.
    missing_keys = set(('inventories', rev_id) for (rev_id,) in parents)
    return missing_keys

1627

1628

def refresh_data(self):
    """Re-read any data needed to synchronise with disk.

    This method is intended to be called after another repository instance
    (such as one used by a smart server) has inserted data into the
    repository. It may not be called during a write group, but may be
    called at any other time.

    :raises InternalBzrError: if called while in a write group.
    """
    in_write_group = self.is_in_write_group()
    if in_write_group:
        raise errors.InternalBzrError(
            "May not refresh_data while in a write group.")
    self._refresh_data()

1640

1641

def resume_write_group(self, tokens):
    """Resume a write group using the given tokens.

    :param tokens: Passed through to _resume_write_group().
    :raises NotWriteLocked: if the repository is not write locked.
    :raises BzrError: if a write group is already open.
    """
    if not self.is_write_locked():
        raise errors.NotWriteLocked(self)
    if self._write_group:
        raise errors.BzrError('already in a write group')
    self._resume_write_group(tokens)
    # Remember the transaction the group was entered under, so that an
    # unlock/relock in between can be detected later.
    self._write_group = self.get_transaction()

1649

1650

def _resume_write_group(self, tokens):
    """Always raise UnsuspendableWriteGroup in this implementation.

    :param tokens: Unused here.
    :raises UnsuspendableWriteGroup: unconditionally.
    """
    raise errors.UnsuspendableWriteGroup(self)

1652

1653

def fetch(self, source, revision_id=None, pb=None, find_ghosts=False,
          fetch_spec=None):
    """Fetch the content required to construct revision_id from source.

    If revision_id is None and fetch_spec is None, then all content is
    copied.

    fetch() may not be used when the repository is in a write group -
    either finish the current write group before using fetch, or use
    fetch before starting the write group.

    :param find_ghosts: Find and copy revisions in the source that are
        ghosts in the target (and not reachable directly by walking out to
        the first-present revision in target from revision_id).
    :param revision_id: If specified, all the content needed for this
        revision ID will be copied to the target. Fetch will determine for
        itself which content needs to be copied.
    :param fetch_spec: If specified, a SearchResult or
        PendingAncestryResult that describes which revisions to copy. This
        allows copying multiple heads at once. Mutually exclusive with
        revision_id.
    :return: (0, []) when source is this same repository with the same
        fallbacks and no fetch_spec is given; otherwise the result of
        the InterRepository fetch.
    """
    if not (fetch_spec is None or revision_id is None):
        raise AssertionError(
            "fetch_spec and revision_id are mutually exclusive.")
    if self.is_in_write_group():
        raise errors.InternalBzrError(
            "May not fetch while in a write group.")
    # fast path same-url fetch operations
    # TODO: lift out to somewhere common with RemoteRepository
    # <https://bugs.edge.launchpad.net/bzr/+bug/401646>
    same_repo = (self.has_same_location(source)
                 and fetch_spec is None
                 and self._has_same_fallbacks(source))
    if same_repo:
        # Nothing to copy; get_revision() is called for a non-null
        # revision_id before returning the no-op result.
        if revision_id is not None:
            if not _mod_revision.is_null(revision_id):
                self.get_revision(revision_id)
        return 0, []
    # if there is no specific appropriate InterRepository, this will get
    # the InterRepository base class, which raises an
    # IncompatibleRepositories when asked to fetch.
    inter = InterRepository.get(source, self)
    return inter.fetch(revision_id=revision_id, pb=pb,
                       find_ghosts=find_ghosts, fetch_spec=fetch_spec)

1699

1700

def create_bundle(self, target, base, fileobj, format=None):
    """Write a bundle via serializer.write_bundle and return its result.

    All arguments are passed straight through, with this repository as
    the first argument.
    """
    return serializer.write_bundle(self, target, base, fileobj, format)

1702

1703

def get_commit_builder(self, branch, parents, config, timestamp=None,
                       timezone=None, committer=None, revprops=None,
                       revision_id=None):
    """Obtain a CommitBuilder for this repository.

    A write group is started after the builder has been constructed.

    :param branch: Branch to commit to.
    :param parents: Revision ids of the parents of the new revision.
    :param config: Configuration to use.
    :param timestamp: Optional timestamp recorded for commit.
    :param timezone: Optional timezone for timestamp.
    :param committer: Optional committer to set for commit.
    :param revprops: Optional dictionary of revision properties.
    :param revision_id: Optional revision id.
    :raises BzrError: if this repository has fallback repositories.
    """
    if self._fallback_repositories:
        raise errors.BzrError("Cannot commit from a lightweight checkout "
            "to a stacked branch. See "
            "https://bugs.launchpad.net/bzr/+bug/375013 for details.")
    builder = self._commit_builder_class(
        self, parents, config, timestamp, timezone, committer, revprops,
        revision_id)
    self.start_write_group()
    return builder

1725

1726

@only_raises(errors.LockNotHeld, errors.LockBroken)
def unlock(self):
    """Release one level of lock on this repository.

    If this would release the last write lock while a write group is
    still open, the write group is aborted, the lock is released and a
    BzrError is raised. When the lock count reaches zero the inventory
    entry cache is cleared and the fallback repositories are unlocked.
    """
    control_files = self.control_files
    releasing_last_write_lock = (control_files._lock_count == 1 and
                                 control_files._lock_mode == 'w')
    if releasing_last_write_lock and self._write_group is not None:
        self.abort_write_group()
        self.control_files.unlock()
        raise errors.BzrError(
            'Must end write groups before releasing write locks.')
    self.control_files.unlock()
    if self.control_files._lock_count == 0:
        self._inventory_entry_cache.clear()
        for fallback in self._fallback_repositories:
            fallback.unlock()

1740

1741

@needs_read_lock
def clone(self, a_bzrdir, revision_id=None):
    """Clone this repository into a_bzrdir using the current format.

    Currently no check is made that the format of this repository and
    the bzrdir format are compatible. FIXME RBC 20060201.

    :return: The newly created destination repository.
    """
    # TODO: deprecate after 0.16; cloning this with all its settings is
    # probably not very useful -- mbp 20070423
    destination = self._create_sprouting_repo(
        a_bzrdir, shared=self.is_shared())
    self.copy_content_into(destination, revision_id)
    return destination

1755

1756

def start_write_group(self):
    """Start a write group in the repository.

    Write groups are used by repositories which do not have a 1:1 mapping
    between file ids and backend store to manage the insertion of data from
    both fetch and commit operations.

    A write lock is required around the start_write_group/commit_write_group
    for the support of lock-requiring repository formats.

    One can only insert data into a repository inside a write group.

    :return: None.
    :raises NotWriteLocked: if the repository is not write locked.
    :raises BzrError: if a write group is already open.
    """
    if not self.is_write_locked():
        raise errors.NotWriteLocked(self)
    if self._write_group:
        raise errors.BzrError('already in a write group')
    self._start_write_group()
    # Remember the transaction the group was entered under, so that an
    # unlock/relock in between can be detected later.
    self._write_group = self.get_transaction()

1777

1778

def _start_write_group(self):

1779

"""Template method for per-repository write group startup.

1780

1781

This is called before the write group is considered to be

1782

entered.

1783

"""

1784

1785

@needs_read_lock
def sprout(self, to_bzrdir, revision_id=None):
    """Create a descendent repository for new development.

    Unlike clone, this does not copy the settings of the repository:
    the new repository is created unshared and then fetches from this one.

    :return: The newly created repository.
    """
    new_repo = self._create_sprouting_repo(to_bzrdir, shared=False)
    new_repo.fetch(self, revision_id=revision_id)
    return new_repo

1794

1795

def _create_sprouting_repo(self, a_bzrdir, shared):

1796

if not isinstance(a_bzrdir._format, self.bzrdir._format.__class__):

1797

# use target default format.

1798

dest_repo = a_bzrdir.create_repository()

1799

else:

1800

# Most control formats need the repository to be specifically

1801

# created, but on some old all-in-one formats it's not needed

1802

try:

1803

dest_repo = self._format.initialize(a_bzrdir, shared=shared)

1804

except errors.UninitializableFormat:

1805

dest_repo = a_bzrdir.open_repository()

1806

return dest_repo

1807

1808

def _get_sink(self):
    """Return a StreamSink for streaming into this repository."""
    sink = StreamSink(self)
    return sink

1811

1812

def _get_source(self, to_format):
    """Return a StreamSource for streaming from this repository.

    :param to_format: Passed to the StreamSource constructor.
    """
    source = StreamSource(self, to_format)
    return source

1815

1816

@needs_read_lock
def has_revision(self, revision_id):
    """True if this repository has a copy of the revision."""
    present = self.has_revisions((revision_id,))
    return revision_id in present

1820

1821

@needs_read_lock
def has_revisions(self, revision_ids):
    """Probe to find out the presence of multiple revisions.

    :param revision_ids: An iterable of revision_ids. It is consumed
        exactly once, so one-shot iterators are accepted.
    :return: A set of the revision_ids that were present. NULL_REVISION
        is reported as present whenever it was asked for.
    """
    # The ids are needed twice (to build the keys, and for the
    # NULL_REVISION membership test), so materialise them first: an
    # iterator would be exhausted before the membership test.
    revision_ids = list(revision_ids)
    parent_map = self.revisions.get_parent_map(
        [(rev_id,) for rev_id in revision_ids])
    result = set()
    if _mod_revision.NULL_REVISION in revision_ids:
        result.add(_mod_revision.NULL_REVISION)
    result.update([key[0] for key in parent_map])
    return result

1835

1836

@needs_read_lock
def get_revision(self, revision_id):
    """Return the Revision object for a named revision."""
    revisions = self.get_revisions([revision_id])
    return revisions[0]

1840

1841

@needs_read_lock
def get_revision_reconcile(self, revision_id):
    """'reconcile' helper routine that allows access to a revision always.

    This variant of get_revision does not cross check the weave graph
    against the revision one as get_revision does: but it should only
    be used by reconcile, or reconcile-alike commands that are correcting
    or testing the revision graph.
    """
    revisions = self._get_revisions([revision_id])
    return revisions[0]

1851

1852

@needs_read_lock
def get_revisions(self, revision_ids):
    """Get many revisions at once.

    Repositories that need to check data on every revision read should
    subclass this method. This implementation returns the result of
    _get_revisions() unchanged.
    """
    revisions = self._get_revisions(revision_ids)
    return revisions

1860

1861

@needs_read_lock
def _get_revisions(self, revision_ids):
    """Core work logic to get many revisions without sanity checks.

    :return: A list of revisions in the same order as revision_ids.
    :raises NoSuchRevision: if any requested revision is absent.
    """
    by_id = {}
    for rev_id, revision in self._iter_revisions(revision_ids):
        if revision is None:
            raise errors.NoSuchRevision(self, rev_id)
        by_id[rev_id] = revision
    # The stream above is unordered, so re-establish the caller's order.
    ordered = []
    for rev_id in revision_ids:
        ordered.append(by_id[rev_id])
    return ordered

1870

1871

def _iter_revisions(self, revision_ids):
    """Iterate over revision objects.

    :param revision_ids: An iterable of revisions to examine. None may be
        passed to request all revisions known to the repository. Note that
        not all repositories can find unreferenced revisions; for those
        repositories only referenced ones will be returned. The iterable
        is consumed exactly once, so one-shot iterators are accepted.
    :return: An iterator of (revid, revision) tuples. Absent revisions (
        those asked for but not available) are returned as (revid, None).
    :raises InvalidRevisionId: if a supplied id is empty or not a string.
    """
    if revision_ids is None:
        keys = [(key,) for key in self.all_revision_ids()]
    else:
        # Validate and build the keys in one pass. Validating in a
        # separate loop first would exhaust a one-shot iterator and
        # leave no keys to request.
        keys = []
        for rev_id in revision_ids:
            if not rev_id or not isinstance(rev_id, basestring):
                raise errors.InvalidRevisionId(
                    revision_id=rev_id, branch=self)
            keys.append((rev_id,))
    stream = self.revisions.get_record_stream(keys, 'unordered', True)
    for record in stream:
        revid = record.key[0]
        if record.storage_kind == 'absent':
            yield (revid, None)
        else:
            text = record.get_bytes_as('fulltext')
            rev = self._serializer.read_revision_from_string(text)
            yield (revid, rev)

1897

1898

@needs_read_lock
def get_revision_xml(self, revision_id):
    """Return the revision serialised by the repository's serializer.

    :param revision_id: The id of the revision to serialise.
    :return: The contents written by the serializer, as a string.
    """
    # TODO: jam 20070210 This shouldn't be necessary since get_revision
    #       would have already do it.
    # TODO: jam 20070210 Just use _serializer.write_revision_to_string()
    # TODO: this can't just be replaced by:
    # return self._serializer.write_revision_to_string(
    #     self.get_revision(revision_id))
    # as cStringIO preserves the encoding unlike write_revision_to_string
    # or some other call down the path.
    revision = self.get_revision(revision_id)
    buf = cStringIO.StringIO()
    # the current serializer..
    self._serializer.write_revision(revision, buf)
    buf.seek(0)
    return buf.getvalue()

1914

1915

def get_deltas_for_revisions(self, revisions, specific_fileids=None):
    """Produce a generator of revision deltas.

    Note that the input is a sequence of REVISIONS, not revision_ids.
    Trees will be held in memory until the generator exits.
    Each delta is relative to the revision's lefthand predecessor.

    :param specific_fileids: if not None, the result is filtered
        so that only those file-ids, their parents and their
        children are included.
    """
    # Collect the ids of every tree needed: each revision itself plus
    # its first parent, when it has one.
    wanted_ids = set()
    for rev in revisions:
        wanted_ids.add(rev.revision_id)
        wanted_ids.update(rev.parent_ids[:1])

    # Get the matching filtered trees. Note that it's more
    # efficient to pass filtered trees to changes_from() rather
    # than doing the filtering afterwards. changes_from() could
    # arguably do the filtering itself but it's path-based, not
    # file-id based, so filtering before or afterwards is
    # currently easier.
    if specific_fileids is None:
        tree_source = self.revision_trees(wanted_ids)
    else:
        tree_source = self._filtered_revision_trees(wanted_ids,
                                                    specific_fileids)
    trees_by_id = dict((tree.get_revision_id(), tree)
                       for tree in tree_source)

    # Calculate the deltas
    for rev in revisions:
        if rev.parent_ids:
            basis_tree = trees_by_id[rev.parent_ids[0]]
        else:
            basis_tree = self.revision_tree(_mod_revision.NULL_REVISION)
        yield trees_by_id[rev.revision_id].changes_from(basis_tree)

1953

1954

@needs_read_lock
def get_revision_delta(self, revision_id, specific_fileids=None):
    """Return the delta for one revision.

    The delta is relative to the left-hand predecessor of the
    revision.

    :param specific_fileids: if not None, the result is filtered
        so that only those file-ids, their parents and their
        children are included.
    """
    revision = self.get_revision(revision_id)
    deltas = list(self.get_deltas_for_revisions(
        [revision], specific_fileids=specific_fileids))
    return deltas[0]

1968

1969

@needs_write_lock
def store_revision_signature(self, gpg_strategy, plaintext, revision_id):
    """Sign plaintext and store the signature for revision_id.

    :param gpg_strategy: Object whose sign() produces the signature.
    :param plaintext: The text handed to gpg_strategy.sign().
    :param revision_id: The revision the signature is stored against.
    """
    signed_text = gpg_strategy.sign(plaintext)
    self.add_signature_text(revision_id, signed_text)

1973

1974

@needs_write_lock
def add_signature_text(self, revision_id, signature):
    """Store signature as the signature text of revision_id.

    The text is split into lines and added to ``self.signatures`` under
    the key ``(revision_id,)`` with no parents.
    """
    signature_lines = osutils.split_lines(signature)
    self.signatures.add_lines((revision_id,), (), signature_lines)

1978

1979

def find_text_key_references(self):
    """Find the text key references within the repository.

    :return: A dictionary mapping text keys ((fileid, revision_id) tuples)
        to whether they were referred to by the inventory of the
        revision_id that they contain. The inventory texts from all present
        revision ids are assessed to generate this report.
    """
    all_revision_keys = self.revisions.keys()
    inventories = self.inventories
    progress = ui.ui_factory.nested_progress_bar()
    try:
        inventory_lines = inventories.iter_lines_added_or_present_in_keys(
            all_revision_keys, pb=progress)
        return self._find_text_key_references_from_xml_inventory_lines(
            inventory_lines)
    finally:
        # Always release the progress bar, even if scanning fails.
        progress.finished()

1995

1996

def _find_text_key_references_from_xml_inventory_lines(self,
    line_iterator):
    """Core routine for extracting references to texts from inventories.

    This performs the translation of xml lines to revision ids.

    :param line_iterator: An iterator of lines, origin_version_id
    :return: A dictionary mapping text keys ((fileid, revision_id) tuples)
        to whether they were referred to by the inventory of the
        revision_id that they contain. Note that if that revision_id was
        not part of the line_iterator's output then False will be given -
        even though it may actually refer to that key.
    :raises AssertionError: if the serializer does not set
        support_altered_by_hack.
    """
    if not self._serializer.support_altered_by_hack:
        raise AssertionError(
            "_find_text_key_references_from_xml_inventory_lines only "
            "supported for branches which store inventory as unnested xml"
            ", not on %r" % self)
    references = {}

    # this code needs to read every new line in every inventory for the
    # inventories [revision_ids]. Seeing a line twice is ok. Seeing a line
    # not present in one of those inventories is unnecessary but not
    # harmful because we are filtering by the revision id marker in the
    # inventory lines : we only select file ids altered in one of those
    # revisions. We don't need to see all lines in the inventory because
    # only those added in an inventory in rev X can contain a revision=X
    # line.
    revid_cache = {}
    fileid_cache = {}

    # jam 20061218 In a big fetch, this handles hundreds of thousands
    # of lines, so it has had a lot of inlining and optimizing done.
    # Sorry that it is a little bit messy.
    # Move several functions to be local variables, since this is a long
    # running loop.
    find_ids = self._file_ids_altered_regex.search
    unescape = _unescape_xml
    note_key = references.setdefault
    for line, line_key in line_iterator:
        found = find_ids(line)
        if found is None:
            continue
        # One call to match.group() returning multiple items is quite a
        # bit faster than 2 calls to match.group() each returning 1
        file_id, revision_id = found.group('file_id', 'revision_id')

        # The cache lookups are deliberately inlined: the same ids recur
        # across a very large number of lines.
        # Using a cache helps in 2 ways:
        #   1) Avoids unnecessary decoding calls
        #   2) Re-uses cached strings, which helps in future set and
        #      equality checks.
        # (2) is enough that removing encoding entirely along with
        # the cache (so we are using plain strings) results in no
        # performance improvement.
        try:
            revision_id = revid_cache[revision_id]
        except KeyError:
            plain = unescape(revision_id)
            revid_cache[revision_id] = plain
            revision_id = plain

        # Note that unconditionally unescaping means that we deserialise
        # every fileid, which for general 'pull' is not great, but we don't
        # really want to have so many fulltexts that this matters anyway.
        # RBC 20071114.
        try:
            file_id = fileid_cache[file_id]
        except KeyError:
            plain = unescape(file_id)
            fileid_cache[file_id] = plain
            file_id = plain

        text_key = (file_id, revision_id)
        note_key(text_key, False)
        if revision_id == line_key[-1]:
            # The line came from the inventory of the revision it names.
            references[text_key] = True
    return references

2075

2076

def _inventory_xml_lines_for_keys(self, keys):
    """Get a line iterator of the sort needed for finding references.

    Not relevant for non-xml inventory repositories.

    Records that the record stream reports as 'absent' (ghosts) are
    skipped.

    :param keys: The revision keys for the inventories to inspect.
    :return: An iterator over (inventory line, revid) for the fulltexts of
        all of the xml inventories specified by keys.
    """
    records = self.inventories.get_record_stream(keys, 'unordered', True)
    for record in records:
        if record.storage_kind == 'absent':
            # Nothing to read for a ghost.
            continue
        fulltext_chunks = record.get_bytes_as('chunked')
        # The last element of the record key is the revision id.
        revision_id = record.key[-1]
        for xml_line in osutils.chunks_to_lines(fulltext_chunks):
            yield xml_line, revision_id

2095

2096

def _find_file_ids_from_xml_inventory_lines(self, line_iterator,

2097

revision_keys):

2098

"""Helper routine for fileids_altered_by_revision_ids.

2099

2100

This performs the translation of xml lines to revision ids.

2101

2102

:param line_iterator: An iterator of lines, origin_version_id

2103

:param revision_keys: The revision ids to filter for. This should be a

2104

set or other type which supports efficient __contains__ lookups, as

2105

the revision key from each parsed line will be looked up in the

2106

revision_keys filter.

2107

:return: a dictionary mapping altered file-ids to an iterable of

2108

revision_ids. Each altered file-ids has the exact revision_ids that

2109

altered it listed explicitly.

2110

"""

2111

seen = set(self._find_text_key_references_from_xml_inventory_lines(

2112

line_iterator).iterkeys())

2113

parent_keys = self._find_parent_keys_of_revisions(revision_keys)

2114

parent_seen = set(self._find_text_key_references_from_xml_inventory_lines(

2115

self._inventory_xml_lines_for_keys(parent_keys)))

2116

new_keys = seen - parent_seen

2117

result = {}

2118

setdefault = result.setdefault

2119

for key in new_keys:

2120

setdefault(key[0], set()).add(key[-1])

2121

return result

2122

2123

def _find_parent_ids_of_revisions(self, revision_ids):
    """Find all parent ids that are mentioned in the revision graph.

    :param revision_ids: The revision ids whose parents are wanted.
    :return: set of revisions that are parents of revision_ids which are
        not part of revision_ids themselves
    """
    parent_map = self.get_parent_map(revision_ids)
    outside_parents = set()
    for parents in parent_map.itervalues():
        outside_parents.update(parents)
    # Only parents from outside the requested revisions are interesting.
    outside_parents.difference_update(revision_ids)
    outside_parents.discard(_mod_revision.NULL_REVISION)
    return outside_parents

2135

2136

def _find_parent_keys_of_revisions(self, revision_keys):
    """Similar to _find_parent_ids_of_revisions, but used with keys.

    :param revision_keys: An iterable of revision_keys.
    :return: The parents of all revision_keys that are not already in
        revision_keys
    """
    parent_map = self.revisions.get_parent_map(revision_keys)
    outside_parents = set()
    for parents in parent_map.itervalues():
        outside_parents.update(parents)
    outside_parents.difference_update(revision_keys)
    # NOTE(review): the bare NULL_REVISION id is discarded here, not a
    # (NULL_REVISION,) key tuple - confirm that is what is intended.
    outside_parents.discard(_mod_revision.NULL_REVISION)
    return outside_parents

2149

2150

def fileids_altered_by_revision_ids(self, revision_ids, _inv_weave=None):
    """Find the file ids and versions affected by revisions.

    :param revision_ids: an iterable containing revision ids.
    :param _inv_weave: The inventory weave from this repository or None.
        If it is None (or otherwise false), self.inventories is used.
    :return: a dictionary mapping altered file-ids to an iterable of
        revision_ids. Each altered file-ids has the exact revision_ids that
        altered it listed explicitly.
    """
    wanted_keys = set([(revision_id,) for revision_id in revision_ids])
    if _inv_weave:
        inventory_vf = _inv_weave
    else:
        inventory_vf = self.inventories
    progress = ui.ui_factory.nested_progress_bar()
    try:
        xml_lines = inventory_vf.iter_lines_added_or_present_in_keys(
            wanted_keys, pb=progress)
        return self._find_file_ids_from_xml_inventory_lines(
            xml_lines, wanted_keys)
    finally:
        # Always release the nested progress bar, even on error.
        progress.finished()

2170

2171

def iter_files_bytes(self, desired_files):
    """Iterate through file versions.

    Files will not necessarily be returned in the order they occur in
    desired_files.  No specific order is guaranteed.

    Yields pairs of identifier, bytes_iterator.  identifier is an opaque
    value supplied by the caller as part of desired_files.  It should
    uniquely identify the file version in the caller's context.  (Examples:
    an index number or a TreeTransform trans_id.)

    bytes_iterator is an iterable of bytestrings for the file.  The
    kind of iterable and length of the bytestrings are unspecified, but for
    this implementation, it is the 'chunked' form of the records produced by
    VersionedFile.get_record_stream().

    :param desired_files: a list of (file_id, revision_id, identifier)
        triples
    :raises RevisionNotPresent: if the stream reports a requested text as
        absent.
    """
    # Map each text key back to the caller's identifier for it.
    identifier_by_key = dict(
        ((file_id, revision_id), identifier)
        for file_id, revision_id, identifier in desired_files)
    stream = self.texts.get_record_stream(
        identifier_by_key, 'unordered', True)
    for record in stream:
        if record.storage_kind == 'absent':
            raise errors.RevisionNotPresent(record.key, self)
        yield identifier_by_key[record.key], record.get_bytes_as('chunked')

2197

2198

def _generate_text_key_index(self, text_key_references=None,
    ancestors=None):
    """Generate a new text key index for the repository.

    This is an expensive function that will take considerable time to run.

    :param text_key_references: Optional precomputed result of
        self.find_text_key_references(); computed here when None.
    :param ancestors: Optional precomputed parent map of all revisions;
        computed from self.get_graph() when None.
    :return: A dict mapping text keys ((file_id, revision_id) tuples) to a
        list of parents, also text keys. When a given key has no parents,
        the parents list will be [NULL_REVISION].
    """
    if ancestors is None:
        # All revisions, to find inventory parents.
        revision_graph = self.get_graph()
        ancestors = revision_graph.get_parent_map(self.all_revision_ids())
    if text_key_references is None:
        text_key_references = self.find_text_key_references()
    progress = ui.ui_factory.nested_progress_bar()
    try:
        return self._do_generate_text_key_index(
            ancestors, text_key_references, progress)
    finally:
        progress.finished()

2220

2221

def _do_generate_text_key_index(self, ancestors, text_key_references, pb):
    """Helper for _generate_text_key_index to avoid deep nesting.

    :param ancestors: A mapping of revision id to parent revision ids. It
        is topologically sorted and also indexed by revision id here.
    :param text_key_references: A dict mapping text keys
        ((file_id, revision_id) tuples) to a flag. Keys whose flag is
        false are given [NULL_REVISION] as their parents.
    :param pb: A progress bar; only its update() method is used.
    :return: A dict mapping each text key to a list of parent text keys,
        or to [NULL_REVISION] when no parents were found.
    """
    revision_order = tsort.topo_sort(ancestors)
    invalid_keys = set()
    # revision id -> set of valid text keys carrying that revision id.
    revision_keys = {}
    for revision_id in revision_order:
        revision_keys[revision_id] = set()
    text_count = len(text_key_references)
    # a cache of the text keys to allow reuse; costs a dict of all the
    # keys, but saves a 2-tuple for every child of a given key.
    text_key_cache = {}
    for text_key, valid in text_key_references.iteritems():
        if not valid:
            invalid_keys.add(text_key)
        else:
            revision_keys[text_key[1]].add(text_key)
        text_key_cache[text_key] = text_key
    del text_key_references
    text_index = {}
    # The text graph reads from text_index, which is filled in as we go.
    text_graph = graph.Graph(graph.DictParentsProvider(text_index))
    NULL_REVISION = _mod_revision.NULL_REVISION
    # Set a cache with a size of 10 - this suffices for bzr.dev but may be
    # too small for large or very branchy trees. However, for 55K path
    # trees, it would be easy to use too much memory trivially. Ideally we
    # could gauge this by looking at available real memory etc, but this is
    # always a tricky proposition.
    inventory_cache = lru_cache.LRUCache(10)
    batch_size = 10 # should be ~150MB on a 55K path tree
    # NOTE(review): xrange() below needs an int, so this relies on '/'
    # being integer division for ints.
    batch_count = len(revision_order) / batch_size + 1
    processed_texts = 0
    pb.update("Calculating text parents", processed_texts, text_count)
    for offset in xrange(batch_count):
        to_query = revision_order[offset * batch_size:(offset + 1) *
            batch_size]
        if not to_query:
            break
        for revision_id in to_query:
            parent_ids = ancestors[revision_id]
            for text_key in revision_keys[revision_id]:
                pb.update("Calculating text parents", processed_texts)
                processed_texts += 1
                candidate_parents = []
                for parent_id in parent_ids:
                    parent_text_key = (text_key[0], parent_id)
                    try:
                        check_parent = parent_text_key not in \
                            revision_keys[parent_id]
                    except KeyError:
                        # the parent parent_id is a ghost:
                        check_parent = False
                        # truncate the derived graph against this ghost.
                        parent_text_key = None
                    if check_parent:
                        # look at the parent commit details inventories to
                        # determine possible candidates in the per file graph.
                        # TODO: cache here.
                        try:
                            inv = inventory_cache[parent_id]
                        except KeyError:
                            inv = self.revision_tree(parent_id).inventory
                            inventory_cache[parent_id] = inv
                        try:
                            parent_entry = inv[text_key[0]]
                        except (KeyError, errors.NoSuchId):
                            # The file is not in the parent inventory.
                            parent_entry = None
                        if parent_entry is not None:
                            parent_text_key = (
                                text_key[0], parent_entry.revision)
                        else:
                            parent_text_key = None
                    if parent_text_key is not None:
                        # Append the cached tuple, not the new one.
                        candidate_parents.append(
                            text_key_cache[parent_text_key])
                parent_heads = text_graph.heads(candidate_parents)
                new_parents = list(parent_heads)
                # Keep the heads in the order the candidates were found.
                new_parents.sort(key=lambda x:candidate_parents.index(x))
                if new_parents == []:
                    new_parents = [NULL_REVISION]
                text_index[text_key] = new_parents

    for text_key in invalid_keys:
        text_index[text_key] = [NULL_REVISION]
    return text_index

2304

2305

def item_keys_introduced_by(self, revision_ids, _files_pb=None):
    """Get an iterable listing the keys of all the data introduced by a set
    of revision IDs.

    The keys will be ordered so that the corresponding items can be safely
    fetched and inserted in that order.

    :param revision_ids: The revision ids to report on.
    :param _files_pb: Optional progress bar handed to the file-key pass.
    :returns: An iterable producing tuples of (knit-kind, file-id,
        versions).  knit-kind is one of 'file', 'inventory', 'signatures',
        'revisions'.  file-id is None unless knit-kind is 'file'.
    """
    # File texts come first, then the non-file items.
    for file_item in self._find_file_keys_to_fetch(revision_ids, _files_pb):
        yield file_item
    # The progress bar is only needed for the file pass; drop our reference.
    del _files_pb
    for other_item in self._find_non_file_keys_to_fetch(revision_ids):
        yield other_item

2321

2322

def _find_file_keys_to_fetch(self, revision_ids, pb):

2323

# XXX: it's a bit weird to control the inventory weave caching in this

2324

# generator. Ideally the caching would be done in fetch.py I think. Or

2325

# maybe this generator should explicitly have the contract that it

2326

# should not be iterated until the previously yielded item has been

2327

# processed?

2328

inv_w = self.inventories

2329

2330

# file ids that changed

2331

file_ids = self.fileids_altered_by_revision_ids(revision_ids, inv_w)

2332

count = 0

2333

num_file_ids = len(file_ids)

2334

for file_id, altered_versions in file_ids.iteritems():

2335

if pb is not None:

2336

pb.update("Fetch texts", count, num_file_ids)

2337

count += 1

2338

yield ("file", file_id, altered_versions)

2339

2340

def _find_non_file_keys_to_fetch(self, revision_ids):

2341

# inventory

2342

yield ("inventory", None, revision_ids)

2343

2344

# signatures

2345

# XXX: Note ATM no callers actually pay attention to this return

2346

# instead they just use the list of revision ids and ignore

2347

# missing sigs. Consider removing this work entirely

2348

revisions_with_signatures = set(self.signatures.get_parent_map(

2349

[(r,) for r in revision_ids]))

2350

revisions_with_signatures = set(

2351

[r for (r,) in revisions_with_signatures])

2352

revisions_with_signatures.intersection_update(revision_ids)

2353

yield ("signatures", None, revisions_with_signatures)

2354

2355

# revisions

2356

yield ("revisions", None, revision_ids)

2357

2358

@needs_read_lock
def get_inventory(self, revision_id):
    """Get Inventory object by revision id.

    :param revision_id: The revision id of the wanted inventory.
    :return: The first inventory produced by iter_inventories.
    """
    inventories = self.iter_inventories([revision_id])
    return inventories.next()

2362

2363

def iter_inventories(self, revision_ids, ordering=None):
    """Get many inventories by revision_ids.

    This will buffer some or all of the texts used in constructing the
    inventories in memory, but will only parse a single inventory at a
    time.

    :param revision_ids: The expected revision ids of the inventories.
    :param ordering: optional ordering, e.g. 'topological'.  If not
        specified, the order of revision_ids will be preserved (by
        buffering if necessary).
    :return: An iterator of inventories.
    :raises ValueError: if revision_ids contains None or NULL_REVISION.
    """
    for null_id in (None, _mod_revision.NULL_REVISION):
        if null_id in revision_ids:
            raise ValueError('cannot get null revision inventory')
    return self._iter_inventories(revision_ids, ordering)

2380

2381

def _iter_inventories(self, revision_ids, ordering):

2382

"""single-document based inventory iteration."""

2383

inv_xmls = self._iter_inventory_xmls(revision_ids, ordering)

2384

for text, revision_id in inv_xmls:

2385

yield self.deserialise_inventory(revision_id, text)

2386

2387

def _iter_inventory_xmls(self, revision_ids, ordering):
    """Yield (inventory text, revision id) pairs for revision_ids.

    :param revision_ids: The revision ids of the wanted inventories.
    :param ordering: The ordering passed to get_record_stream, or None.
        With None the stream is read 'unordered' and the texts are
        buffered so that they are yielded in the order of revision_ids.
    :raises NoSuchRevision: if the stream reports a record as absent.
    """
    if ordering is None:
        order_as_requested = True
        ordering = 'unordered'
    else:
        order_as_requested = False
    keys = [(revision_id,) for revision_id in revision_ids]
    if not keys:
        return
    if order_as_requested:
        # next_key is the key that has to be yielded next.
        key_iter = iter(keys)
        next_key = key_iter.next()
    stream = self.inventories.get_record_stream(keys, ordering, True)
    # Texts that arrived before their turn, keyed by record key.
    text_chunks = {}
    for record in stream:
        if record.storage_kind != 'absent':
            chunks = record.get_bytes_as('chunked')
            if order_as_requested:
                text_chunks[record.key] = chunks
            else:
                yield ''.join(chunks), record.key[-1]
        else:
            raise errors.NoSuchRevision(self, record.key)
        if order_as_requested:
            # Yield as many results as we can while preserving order.
            while next_key in text_chunks:
                chunks = text_chunks.pop(next_key)
                yield ''.join(chunks), next_key[-1]
                try:
                    next_key = key_iter.next()
                except StopIteration:
                    # We still want to fully consume the get_record_stream,
                    # just in case it is not actually finished at this point
                    next_key = None
                    break

2422

2423

def deserialise_inventory(self, revision_id, xml):
    """Transform the xml into an inventory object.

    :param revision_id: The expected revision id of the inventory.
    :param xml: A serialised inventory.
    :return: The inventory read by this repository's serializer.
    :raises AssertionError: if the inventory read does not carry
        revision_id as its revision id.
    """
    inv = self._serializer.read_inventory_from_string(
        xml, revision_id, entry_cache=self._inventory_entry_cache)
    if inv.revision_id != revision_id:
        mismatch = (inv.revision_id, revision_id)
        raise AssertionError('revision id mismatch %s != %s' % mismatch)
    return inv

2435

2436

def serialise_inventory(self, inv):
    """Return inv as written to a string by this repository's serializer."""
    serializer = self._serializer
    return serializer.write_inventory_to_string(inv)

2438

2439

def _serialise_inventory_to_lines(self, inv):

2440

return self._serializer.write_inventory_to_lines(inv)

2441

2442

def get_serializer_format(self):
    """Return the format_num of this repository's serializer."""
    serializer = self._serializer
    return serializer.format_num

2444

2445

@needs_read_lock
def get_inventory_xml(self, revision_id):
    """Get the serialised inventory text for revision_id.

    :return: The first text produced by _iter_inventory_xmls.
    :raises HistoryMissing: if no text at all is produced.
    """
    xml_texts = self._iter_inventory_xmls([revision_id], 'unordered')
    try:
        xml_text, revision_id = xml_texts.next()
    except StopIteration:
        raise errors.HistoryMissing(self, 'inventory', revision_id)
    return xml_text

2454

2455

@needs_read_lock
def get_inventory_sha1(self, revision_id):
    """Return the sha1 hash of the inventory entry.

    The value is read from the inventory_sha1 attribute of the revision.
    """
    revision = self.get_revision(revision_id)
    return revision.inventory_sha1

2460

2461

def get_rev_id_for_revno(self, revno, known_pair):

2462

"""Return the revision id of a revno, given a later (revno, revid)

2463

pair in the same history.

2464

2465

:return: if found (True, revid). If the available history ran out

2466

before reaching the revno, then this returns

2467

(False, (closest_revno, closest_revid)).

2468

"""

2469

known_revno, known_revid = known_pair

2470

partial_history = [known_revid]

2471

distance_from_known = known_revno - revno

2472

if distance_from_known < 0:

2473

raise ValueError(

2474

'requested revno (%d) is later than given known revno (%d)'

2475

% (revno, known_revno))

2476

try:

2477

_iter_for_revno(

2478

self, partial_history, stop_index=distance_from_known)

2479

except errors.RevisionNotPresent, err:

2480

if err.revision_id == known_revid:

2481

# The start revision (known_revid) wasn't found.

2482

raise

2483

# This is a stacked repository with no fallbacks, or a there's a

2484

# left-hand ghost. Either way, even though the revision named in

2485

# the error isn't in this repo, we know it's the next step in this

2486

# left-hand history.

2487

partial_history.append(err.revision_id)

2488

if len(partial_history) <= distance_from_known:

2489

# Didn't find enough history to get a revid for the revno.

2490

earliest_revno = known_revno - len(partial_history) + 1

2491

return (False, (earliest_revno, partial_history[-1]))

2492

if len(partial_history) - 1 > distance_from_known:

2493

raise AssertionError('_iter_for_revno returned too much history')

2494

return (True, partial_history[-1])

2495

2496

def iter_reverse_revision_history(self, revision_id):
    """Iterate backwards through revision ids in the lefthand history

    :param revision_id: The revision id to start with.  All its lefthand
        ancestors will be traversed.
    :raises RevisionNotPresent: if a revision reached during the walk is
        missing from the parent map.
    """
    revision_graph = self.get_graph()
    terminators = (None, _mod_revision.NULL_REVISION)
    current_id = revision_id
    while current_id not in terminators:
        try:
            parents = revision_graph.get_parent_map([current_id])[current_id]
        except KeyError:
            raise errors.RevisionNotPresent(current_id, self)
        yield current_id
        if len(parents) == 0:
            return
        # Follow the first (left-hand) parent only.
        current_id = parents[0]

2516

2517

@needs_read_lock
def get_revision_inventory(self, revision_id):
    """Return inventory of a past revision.

    :raises NotImplementedError: if revision_id is None.
    """
    # TODO: Unify this with get_inventory()
    # bzr 0.0.6 and later imposes the constraint that the inventory_id
    # must be the same as its revision, so this is trivial.
    if revision_id is not None:
        return self.get_inventory(revision_id)
    # This does not make sense: if there is no revision,
    # then it is the current tree inventory surely ?!
    # and thus get_root_id() is something that looks at the last
    # commit on the branch, and the get_root_id is an inventory check.
    raise NotImplementedError
    # return Inventory(self.get_root_id())

2532

2533

def is_shared(self):
    """Return True if this repository is flagged as a shared repository.

    This implementation always raises NotImplementedError.
    """
    unimplemented = self.is_shared
    raise NotImplementedError(unimplemented)

2536

2537

@needs_write_lock
def reconcile(self, other=None, thorough=False):
    """Reconcile this repository.

    :param other: Not used by this implementation.
    :param thorough: Passed through to RepoReconciler.
    :return: The RepoReconciler, after its reconcile() has run.
    """
    from bzrlib.reconcile import RepoReconciler
    repo_reconciler = RepoReconciler(self, thorough=thorough)
    repo_reconciler.reconcile()
    return repo_reconciler

2544

2545

def _refresh_data(self):

2546

"""Helper called from lock_* to ensure coherency with disk.

2547

2548

The default implementation does nothing; it is however possible

2549

for repositories to maintain loaded indices across multiple locks

2550

by checking inside their implementation of this method to see

2551

whether their indices are still valid. This depends of course on

2552

the disk format being validatable in this manner. This method is

2553

also called by the refresh_data() public interface to cause a refresh

2554

to occur while in a write lock so that data inserted by a smart server

2555

push operation is visible on the client's instance of the physical

2556

repository.

2557

"""

2558

2559

@needs_read_lock
def revision_tree(self, revision_id):
    """Return Tree for a revision on this branch.

    `revision_id` may be NULL_REVISION for the empty tree revision.
    """
    revision_id = _mod_revision.ensure_null(revision_id)
    # TODO: refactor this to use an existing revision object
    # so we don't need to read it in twice.
    if revision_id == _mod_revision.NULL_REVISION:
        # The empty tree: an inventory created with root_id=None.
        empty_inventory = Inventory(root_id=None)
        return RevisionTree(self, empty_inventory,
            _mod_revision.NULL_REVISION)
    inv = self.get_revision_inventory(revision_id)
    return RevisionTree(self, inv, revision_id)

2574

2575

def revision_trees(self, revision_ids):
    """Return Trees for revisions in this repository.

    :param revision_ids: a sequence of revision-ids;
      a revision-id may not be None or 'null:'
    :return: A generator of RevisionTree objects, one per inventory
        produced by iter_inventories.
    """
    for inventory in self.iter_inventories(revision_ids):
        yield RevisionTree(self, inventory, inventory.revision_id)

2584

2585

def _filtered_revision_trees(self, revision_ids, file_ids):
    """Return Tree for a revision on this branch with only some files.

    :param revision_ids: a sequence of revision-ids;
      a revision-id may not be None or 'null:'
    :param file_ids: if not None, the result is filtered
      so that only those file-ids, their parents and their
      children are included.
    """
    for inventory in self.iter_inventories(revision_ids):
        # Should we introduce a FilteredRevisionTree class rather
        # than pre-filter the inventory here?
        narrowed = inventory.filter(file_ids)
        yield RevisionTree(self, narrowed, narrowed.revision_id)

2600

2601

@needs_read_lock
def get_ancestry(self, revision_id, topo_sorted=True):
    """Return a list of revision-ids integrated by a revision.

    The first element of the list is always None, indicating the origin
    revision.  This might change when we have history horizons, or
    perhaps we should have a new API.

    :param revision_id: The revision whose ancestry is wanted.
    :param topo_sorted: If true (the default) the result is
        topologically sorted.
    :raises NoSuchRevision: if revision_id is not in this repository.
    """
    if _mod_revision.is_null(revision_id):
        return [None]
    if not self.has_revision(revision_id):
        raise errors.NoSuchRevision(self, revision_id)
    revision_graph = self.get_graph()
    ancestry = set()
    searcher = revision_graph._make_breadth_first_searcher([revision_id])
    while True:
        try:
            found, ghosts = searcher.next_with_ghosts()
        except StopIteration:
            break
        # Ghosts are deliberately left out of the result.
        ancestry.update(found)
    ancestry.discard(_mod_revision.NULL_REVISION)
    if topo_sorted:
        ancestry = tsort.topo_sort(revision_graph.get_parent_map(ancestry))
    return [None] + list(ancestry)

2630

2631

def pack(self, hint=None):
    """Compress the data within the repository.

    Packing only makes sense for some repository types; for the others
    it should be a no-op that just returns, which is what this stub does.

    This stub method does not require a lock, but subclasses should use
    @needs_write_lock: as this is a long running call it is reasonable to
    implicitly lock for the user.

    :param hint: If not supplied, the whole repository is packed.
        If supplied, the repository may use the hint parameter as a
        hint for the parts of the repository to pack. A hint can be
        obtained from the result of commit_write_group(). Out of
        date hints are simply ignored, because concurrent operations
        can obsolete them rapidly.
    """

2648

2649

def get_transaction(self):
    """Return the transaction reported by this repository's control files."""
    control_files = self.control_files
    return control_files.get_transaction()

2651

2652

def get_parent_map(self, revision_ids):
    """See graph.StackedParentsProvider.get_parent_map

    :raises ValueError: if None is among revision_ids.
    """
    # revisions index works in keys; this just works in revisions
    # therefore wrap and unwrap
    null_revision = _mod_revision.NULL_REVISION
    parent_map = {}
    keys_to_query = []
    for revision_id in revision_ids:
        if revision_id == null_revision:
            parent_map[revision_id] = ()
        elif revision_id is None:
            raise ValueError('get_parent_map(None) is not valid')
        else:
            keys_to_query.append((revision_id,))
    key_parents = self.revisions.get_parent_map(keys_to_query)
    for (revision_id,), parent_keys in key_parents.iteritems():
        if parent_keys:
            parent_map[revision_id] = tuple(
                [parent_revid for (parent_revid,) in parent_keys])
        else:
            # A revision without parents is reported as a child of null.
            parent_map[revision_id] = (null_revision,)
    return parent_map

2673

2674

def _make_parents_provider(self):

2675

return self

2676

2677

def get_graph(self, other_repository=None):
    """Return the graph walker for this repository format

    :param other_repository: Optional second repository. When given and
        not at the same location as this one, its parents provider is
        stacked behind this repository's own.
    """
    provider = self._make_parents_provider()
    if other_repository is not None:
        if not self.has_same_location(other_repository):
            provider = graph.StackedParentsProvider(
                [provider, other_repository._make_parents_provider()])
    return graph.Graph(provider)

2685

2686

def _get_versioned_file_checker(self, text_key_references=None,
    ancestors=None):
    """Return an object suitable for checking versioned files.

    :param text_key_references: if non-None, an already built
        dictionary mapping text keys ((fileid, revision_id) tuples)
        to whether they were referred to by the inventory of the
        revision_id that they contain. If None, this will be
        calculated.
    :param ancestors: Optional result from
        self.get_graph().get_parent_map(self.all_revision_ids()) if already
        available.
    """
    checker = _VersionedFileChecker(
        self, text_key_references=text_key_references, ancestors=ancestors)
    return checker

2701

2702

def revision_ids_to_search_result(self, result_set):
    """Convert a set of revision ids to a graph SearchResult.

    :param result_set: A set of revision ids.
    """
    parent_map = self.get_graph().get_parent_map(result_set)
    all_parents = set()
    for parent_ids in parent_map.itervalues():
        all_parents.update(parent_ids)
    # Revisions in the set that are also a parent of something in it.
    interior = result_set.intersection(all_parents)
    heads = result_set.difference(interior)
    # Parents that fall outside the set.
    excluded = all_parents.difference(result_set)
    return graph.SearchResult(heads, excluded, len(result_set), result_set)

2714

2715

@needs_write_lock
def set_make_working_trees(self, new_value):
    """Set the policy flag for making working trees when creating branches.

    This only applies to branches that use this repository.

    The default is 'True'.
    This implementation always raises NotImplementedError.

    :param new_value: True to restore the default, False to disable making
                      working trees.
    """
    unimplemented = self.set_make_working_trees
    raise NotImplementedError(unimplemented)

2726

2727

def make_working_trees(self):
    """Returns the policy for making working trees on new branches.

    This implementation always raises NotImplementedError.
    """
    unimplemented = self.make_working_trees
    raise NotImplementedError(unimplemented)

2730

2731

@needs_write_lock
def sign_revision(self, revision_id, gpg_strategy):
    """Store a signature of the short testament text of revision_id.

    :param revision_id: The revision to sign.
    :param gpg_strategy: Passed through to store_revision_signature.
    """
    testament = Testament.from_revision(self, revision_id)
    plaintext = testament.as_short_text()
    self.store_revision_signature(gpg_strategy, plaintext, revision_id)

2735

2736

@needs_read_lock
def has_signature_for_revision_id(self, revision_id):
    """Query for a revision signature for revision_id in the repository.

    :raises NoSuchRevision: if revision_id is not in this repository.
    """
    if not self.has_revision(revision_id):
        raise errors.NoSuchRevision(self, revision_id)
    signature_map = self.signatures.get_parent_map([(revision_id,)])
    return len(signature_map) == 1

2744

2745

@needs_read_lock
def get_signature_text(self, revision_id):
    """Return the text for a signature.

    :raises NoSuchRevision: if the signature record is absent.
    """
    signature_key = (revision_id,)
    stream = self.signatures.get_record_stream(
        [signature_key], 'unordered', True)
    record = stream.next()
    if record.storage_kind == 'absent':
        raise errors.NoSuchRevision(self, revision_id)
    return record.get_bytes_as('fulltext')

2754

2755

@needs_read_lock
def check(self, revision_ids=None, callback_refs=None, check_repo=True):
    """Check consistency of all history of given revision_ids.

    Different repository implementations should override _check().

    :param revision_ids: A non-empty list of revision_ids whose ancestry
         will be checked.  Typically the last revision_id of a branch.
    :param callback_refs: A dict of check-refs to resolve and callback
        the check/_check method on the items listed as wanting the ref.
        see bzrlib.check.
    :param check_repo: If False do not check the repository contents, just
        calculate the data callback_refs requires and call them back.
    :return: Whatever self._check returns.
    """
    outcome = self._check(
        revision_ids, callback_refs=callback_refs, check_repo=check_repo)
    return outcome

2771

2772

def _check(self, revision_ids, callback_refs, check_repo):
    """Run a check.Check over this repository and return it.

    :param revision_ids: Not used by this implementation.
    :param callback_refs: Passed to the checker's check() method.
    :param check_repo: Passed to the check.Check constructor.
    """
    checker = check.Check(self, check_repo=check_repo)
    checker.check(callback_refs)
    return checker

2776

2777

def _warn_if_deprecated(self):
    """Emit the format deprecation warning, at most once per process.

    The module-level _deprecation_warning_done flag records that the
    warning has been given.
    """
    global _deprecation_warning_done
    if not _deprecation_warning_done:
        _deprecation_warning_done = True
        details = (self._format, self.bzrdir.transport.base)
        warning("Format %s for %s is deprecated - please use "
                "'bzr upgrade' to get better performance" % details)

2784

2785

def supports_rich_root(self):
    """Return the rich_root_data flag of this repository's format."""
    repository_format = self._format
    return repository_format.rich_root_data

2787

2788

def _check_ascii_revisionid(self, revision_id, method):

2789

"""Private helper for ascii-only repositories."""

2790

# weave repositories refuse to store revisionids that are non-ascii.

2791

if revision_id is not None:

2792

# weaves require ascii revision ids.

2793

if isinstance(revision_id, unicode):

2794

try:

2795

revision_id.encode('ascii')

2796

except UnicodeEncodeError:

2797

raise errors.NonAsciiRevisionId(method, self)

2798

else:

2799

try:

2800

revision_id.decode('ascii')

2801

except UnicodeDecodeError:

2802

raise errors.NonAsciiRevisionId(method, self)

2803

2804

def revision_graph_can_have_wrong_parents(self):
    """Is it possible for this repository to have a revision graph with
    incorrect parents?

    If True, then this repository must also implement
    _find_inconsistent_revision_parents so that check and reconcile can
    check for inconsistencies before proceeding with other checks that may
    depend on the revision index being consistent.

    This implementation always raises NotImplementedError.
    """
    unimplemented = self.revision_graph_can_have_wrong_parents
    raise NotImplementedError(unimplemented)

2814

2815

2816

# remove these delegates a while after bzr 0.15

2817

def __make_delegated(name, from_module):
    """Install a deprecated module-level forwarder called name.

    The forwarder is stored in this module's globals under name. Calling
    it warns that name has moved, imports from_module and returns the
    attribute called name from that module.

    :param name: The name to forward.
    :param from_module: Dotted name of the module that now holds name.
    """
    def _deprecated_repository_forwarder():
        moved_message = '%s moved to %s in bzr 0.15' % (name, from_module)
        symbol_versioning.warn(moved_message,
                               DeprecationWarning,
                               stacklevel=2)
        m = __import__(from_module, globals(), locals(), [name])
        try:
            return getattr(m, name)
        except AttributeError:
            raise AttributeError('module %s has no name %s'
                    % (m, name))
    globals()[name] = _deprecated_repository_forwarder

2830

2831

# Install a deprecated forwarder for every name that now lives in
# bzrlib.repofmt.weaverepo.
for _name in [
        'AllInOneRepository',
        'WeaveMetaDirRepository',
        'PreSplitOutRepositoryFormat',
        'RepositoryFormat4',
        'RepositoryFormat5',
        'RepositoryFormat6',
        'RepositoryFormat7',
        ]:
    __make_delegated(_name, 'bzrlib.repofmt.weaverepo')

2841

2842

# Install a deprecated forwarder for every name that now lives in
# bzrlib.repofmt.knitrepo.
for _name in [
        'KnitRepository',
        'RepositoryFormatKnit',
        'RepositoryFormatKnit1',
        ]:
    __make_delegated(_name, 'bzrlib.repofmt.knitrepo')

2848

2849

2850

def install_revision(repository, rev, revision_tree):
    """Install one revision, without a signature, into a repository.

    This forwards to install_revisions with a single
    (revision, tree, None) entry.
    """
    unsigned_entry = (rev, revision_tree, None)
    install_revisions(repository, [unsigned_entry])

2853

2854

2855

def install_revisions(repository, iterable, num_revisions=None, pb=None):
    """Install all revision data into a repository.

    The work happens inside one write group on ``repository``: the group is
    committed when every item was installed and aborted (with the exception
    re-raised) when anything fails.

    :param repository: The repository to install into.
    :param iterable: Yields (revision, tree, signature) tuples.  The
        signature may be None.
    :param num_revisions: Total passed to ``pb.update``; may be None.
    :param pb: Optional progress bar, updated after each installed revision.
    """
    repository.start_write_group()
    try:
        inventory_cache = lru_cache.LRUCache(10)
        installed = 0
        for revision, revision_tree, signature in iterable:
            _install_revision(repository, revision, revision_tree, signature,
                inventory_cache)
            installed += 1
            if pb is not None:
                pb.update('Transferring revisions', installed, num_revisions)
    except:
        # Deliberately catches everything so the write group is never left
        # open; the original exception is propagated unchanged.
        repository.abort_write_group()
        raise
    repository.commit_write_group()

2874

2875

2876

def _install_revision(repository, rev, revision_tree, signature,
    inventory_cache):
    """Install all revision data into a repository.

    Adds the file texts that are not yet present, then the inventory (as a
    delta against the first parent when the format commits inventory deltas
    and that parent's inventory is cached), then the signature if one was
    given, and finally the revision itself.

    :param repository: The repository to install into.
    :param rev: The revision object being installed.
    :param revision_tree: Tree providing the inventory and file contents.
    :param signature: Signature text for the revision, or None.
    :param inventory_cache: Mapping of revision id to inventory; this
        revision's inventory is stored in it when deltas are in use.
    :raises errors.IncompatibleRevision: if the repository has no rich-root
        support and the tree root's revision differs from rev.revision_id.
    """
    present_parents = []
    parent_trees = {}
    for p_id in rev.parent_ids:
        if repository.has_revision(p_id):
            present_parents.append(p_id)
            parent_trees[p_id] = repository.revision_tree(p_id)
        else:
            # Parents that are absent are stood in for by the null tree.
            parent_trees[p_id] = repository.revision_tree(
                _mod_revision.NULL_REVISION)

    inv = revision_tree.inventory
    entries = inv.iter_entries()
    # backwards compatibility hack: skip the root id.
    if not repository.supports_rich_root():
        path, root = entries.next()
        if root.revision != rev.revision_id:
            raise errors.IncompatibleRevision(repr(repository))
    text_keys = {}
    for path, ie in entries:
        text_keys[(ie.file_id, ie.revision)] = ie
    text_parent_map = repository.texts.get_parent_map(text_keys)
    missing_texts = set(text_keys) - set(text_parent_map)
    # Add the texts that are not already present
    for text_key in missing_texts:
        ie = text_keys[text_key]
        text_parents = []
        # FIXME: TODO: The following loop overlaps/duplicates that done by
        # commit to determine parents. There is a latent/real bug here where
        # the parents inserted are not those commit would do - in particular
        # they are not filtered by heads(). RBC, AB
        for tree in parent_trees.itervalues():
            if ie.file_id not in tree:
                continue
            # Compare whole (file_id, revision) keys: text_parents holds
            # tuples, so testing the bare revision id never matched and let
            # the same parent key be appended more than once.
            parent_key = (ie.file_id, tree.inventory[ie.file_id].revision)
            if parent_key in text_parents:
                continue
            text_parents.append(parent_key)
        lines = revision_tree.get_file(ie.file_id).readlines()
        repository.texts.add_lines(text_key, text_parents, lines)
    try:
        # install the inventory
        if repository._format._commit_inv_deltas and len(rev.parent_ids):
            # Cache this inventory
            inventory_cache[rev.revision_id] = inv
            try:
                basis_inv = inventory_cache[rev.parent_ids[0]]
            except KeyError:
                # No cached basis to diff against: store the full inventory.
                repository.add_inventory(rev.revision_id, inv, present_parents)
            else:
                delta = inv._make_delta(basis_inv)
                repository.add_inventory_by_delta(rev.parent_ids[0], delta,
                    rev.revision_id, present_parents)
        else:
            repository.add_inventory(rev.revision_id, inv, present_parents)
    except errors.RevisionAlreadyPresent:
        pass
    if signature is not None:
        repository.add_signature_text(rev.revision_id, signature)
    repository.add_revision(rev.revision_id, rev, inv)

2938

2939

2940

class MetaDirRepository(Repository):
    """Repositories in the new meta-dir layout.

    :ivar _transport: Transport for access to repository control files,
        typically pointing to .bzr/repository.
    """

    def __init__(self, _format, a_bzrdir, control_files):
        """Initialise the base repository and remember the control transport."""
        super(MetaDirRepository, self).__init__(
            _format, a_bzrdir, control_files)
        self._transport = control_files._transport

    def is_shared(self):
        """Return True if this repository is flagged as a shared repository."""
        has_marker = self._transport.has('shared-storage')
        return has_marker

    @needs_write_lock
    def set_make_working_trees(self, new_value):
        """Set the policy flag for making working trees when creating branches.

        This only applies to branches that use this repository.

        The default is 'True'.
        :param new_value: True to restore the default, False to disable making
            working trees.
        """
        if not new_value:
            # The presence of this (empty) file is what disables the policy.
            self._transport.put_bytes('no-working-trees', '',
                mode=self.bzrdir._get_file_mode())
            return
        try:
            self._transport.delete('no-working-trees')
        except errors.NoSuchFile:
            # Already at the default; nothing to remove.
            pass

    def make_working_trees(self):
        """Returns the policy for making working trees on new branches."""
        disabled = self._transport.has('no-working-trees')
        return not disabled

2977

2978

2979

class MetaDirVersionedFileRepository(MetaDirRepository):
    """Meta-dir repositories that work via versioned file objects."""

    def __init__(self, _format, a_bzrdir, control_files):
        """Pass all arguments straight through to the parent constructor."""
        parent = super(MetaDirVersionedFileRepository, self)
        parent.__init__(_format, a_bzrdir, control_files)

2985

2986

2987

network_format_registry = registry.FormatRegistry()
"""Registry of repository formats, keyed by network name.

A repository format's network name is the identifier used to refer to that
format in smart server operations.  See RepositoryFormat.network_name() for
more detail.
"""


format_registry = registry.FormatRegistry(network_format_registry)
"""Registry of repository formats, keyed by BzrDirMetaFormat format string.

Entries may be format instances themselves, or classes/factories that can be
called to obtain one.
"""

3002

3003

3004

#####################################################################

3005

# Repository Formats

3006

3007

class RepositoryFormat(object):
    """A repository format.

    Formats provide four things:
     * An initialization routine to construct repository data on disk.
     * an optional format string which is used when the BzrDir supports
       versioned children.
     * an open routine which returns a Repository instance.
     * A network name for referring to the format in smart server RPC
       methods.

    There is one and only one Format subclass for each on-disk format. But
    there can be one Repository subclass that is used for several different
    formats. The _format attribute on a Repository instance can be used to
    determine the disk format.

    Formats are placed in a registry by their format string for reference
    during opening. These should be subclasses of RepositoryFormat for
    consistency.

    Once a format is deprecated, just deprecate the initialize and open
    methods on the format class. Do not deprecate the object, as the
    object may be created even when a repository instance hasn't been
    created.

    Common instance attributes:
    _matchingbzrdir - the bzrdir format that the repository format was
    originally written to work with. This can be used if manually
    constructing a bzrdir and repository, or more commonly for test suite
    parameterization.
    """

    # Set to True or False in derived classes. True indicates that the format
    # supports ghosts gracefully.
    supports_ghosts = None
    # Can this repository be given external locations to lookup additional
    # data. Set to True or False in derived classes.
    supports_external_lookups = None
    # Does this format support CHK bytestring lookups. Set to True or False in
    # derived classes.
    supports_chks = None
    # Should commit add an inventory, or an inventory delta to the repository.
    _commit_inv_deltas = True
    # What order should fetch operations request streams in?
    # The default is unordered as that is the cheapest for an origin to
    # provide.
    _fetch_order = 'unordered'
    # Does this repository format use deltas that can be fetched as-deltas ?
    # (E.g. knits, where the knit deltas can be transplanted intact.
    # We default to False, which will ensure that enough data to get
    # a full text out of any fetch stream will be grabbed.
    _fetch_uses_deltas = False
    # Should fetch trigger a reconcile after the fetch? Only needed for
    # some repository formats that can suffer internal inconsistencies.
    _fetch_reconcile = False
    # Does this format have < O(tree_size) delta generation. Used to hint what
    # code path for commit, amongst other things.
    fast_deltas = None
    # Does doing a pack operation compress data? Useful for the pack UI command
    # (so if there is one pack, the operation can still proceed because it may
    # help), and for fetching when data won't have come from the same
    # compressor.
    pack_compresses = False
    # Does the repository inventory storage understand references to trees?
    supports_tree_reference = None

    def __str__(self):
        """Return the class name wrapped in angle brackets."""
        return "<%s>" % self.__class__.__name__

    def __eq__(self, other):
        """Formats compare equal when other is an instance of our class."""
        # format objects are generally stateless
        return isinstance(other, self.__class__)

    def __ne__(self, other):
        """Inverse of __eq__."""
        return not self == other

    @classmethod
    def find_format(klass, a_bzrdir):
        """Return the format for the repository object in a_bzrdir.

        This is used by bzr native formats that have a "format" file in
        the repository.  Other methods may be used by different types of
        control directory.

        :raises errors.NoRepositoryPresent: if reading the "format" file
            raises NoSuchFile.
        :raises errors.UnknownFormatError: if the format string read is not
            in format_registry.
        """
        try:
            transport = a_bzrdir.get_repository_transport(None)
            format_string = transport.get("format").read()
            return format_registry.get(format_string)
        except errors.NoSuchFile:
            raise errors.NoRepositoryPresent(a_bzrdir)
        except KeyError:
            raise errors.UnknownFormatError(format=format_string,
                                            kind='repository')

    @classmethod
    def register_format(klass, format):
        """Register format in format_registry under its format string."""
        format_registry.register(format.get_format_string(), format)

    @classmethod
    def unregister_format(klass, format):
        """Remove format's format string from format_registry."""
        format_registry.remove(format.get_format_string())

    @classmethod
    def get_default_format(klass):
        """Return the current default format."""
        from bzrlib import bzrdir
        return bzrdir.format_registry.make_bzrdir('default').repository_format

    def get_format_string(self):
        """Return the ASCII format string that identifies this format.

        Note that in pre format ?? repositories the format string is
        not permitted nor written to disk.
        """
        raise NotImplementedError(self.get_format_string)

    def get_format_description(self):
        """Return the short description for this format."""
        raise NotImplementedError(self.get_format_description)

    # TODO: this shouldn't be in the base class, it's specific to things that
    # use weaves or knits -- mbp 20070207
    def _get_versioned_file_store(self,
                                  name,
                                  transport,
                                  control_files,
                                  prefixed=True,
                                  versionedfile_class=None,
                                  versionedfile_kwargs=None,
                                  escaped=False):
        """Build a VersionedFileStore rooted at name under control_files.

        :param name: Relative path cloned from control_files._transport.
        :param transport: Not used by this implementation.
        :param control_files: Supplies the transport and the dir/file modes.
        :param prefixed: Passed through to VersionedFileStore.
        :param versionedfile_class: Class for the store's files; defaults to
            self._versionedfile_class when None.
        :param versionedfile_kwargs: Extra keyword arguments for the
            versioned file class; None means an empty dict.
        :param escaped: Passed through to VersionedFileStore.
        """
        if versionedfile_class is None:
            versionedfile_class = self._versionedfile_class
        if versionedfile_kwargs is None:
            # A fresh dict per call; a shared {} default would be visible to
            # every caller if anything downstream ever mutated it.
            versionedfile_kwargs = {}
        weave_transport = control_files._transport.clone(name)
        dir_mode = control_files._dir_mode
        file_mode = control_files._file_mode
        return VersionedFileStore(weave_transport, prefixed=prefixed,
                                  dir_mode=dir_mode,
                                  file_mode=file_mode,
                                  versionedfile_class=versionedfile_class,
                                  versionedfile_kwargs=versionedfile_kwargs,
                                  escaped=escaped)

    def initialize(self, a_bzrdir, shared=False):
        """Initialize a repository of this format in a_bzrdir.

        :param a_bzrdir: The bzrdir to put the new repository in it.
        :param shared: The repository should be initialized as a sharable one.
        :returns: The new repository object.

        This may raise UninitializableFormat if shared repository are not
        compatible with the a_bzrdir.
        """
        raise NotImplementedError(self.initialize)

    def is_supported(self):
        """Is this format supported?

        Supported formats must be initializable and openable.
        Unsupported formats may not support initialization or committing or
        some other features depending on the reason for not being supported.
        """
        return True

    def network_name(self):
        """A simple byte string uniquely identifying this format for RPC calls.

        MetaDir repository formats use their disk format string to identify the
        repository over the wire. All in one formats such as bzr < 0.8, and
        foreign formats like svn/git and hg should use some marker which is
        unique and immutable.
        """
        raise NotImplementedError(self.network_name)

    def check_conversion_target(self, target_format):
        """Raise BadConversionTarget if target_format would lose data.

        The target is rejected when this format has rich root data or tree
        reference support and the target does not.
        """
        if self.rich_root_data and not target_format.rich_root_data:
            raise errors.BadConversionTarget(
                'Does not support rich root data.', target_format,
                from_format=self)
        if (self.supports_tree_reference and
            not getattr(target_format, 'supports_tree_reference', False)):
            raise errors.BadConversionTarget(
                'Does not support nested trees', target_format,
                from_format=self)

    def open(self, a_bzrdir, _found=False):
        """Return an instance of this format for the bzrdir a_bzrdir.

        _found is a private parameter, do not use it.
        """
        raise NotImplementedError(self.open)

3197

3198

3199

class MetaDirRepositoryFormat(RepositoryFormat):
    """Common base class for the new repositories using the metadir layout."""

    rich_root_data = False
    supports_tree_reference = False
    supports_external_lookups = False

    @property
    def _matchingbzrdir(self):
        """A new BzrDirMetaFormat1 whose repository_format is this format."""
        matching = bzrdir.BzrDirMetaFormat1()
        matching.repository_format = self
        return matching

    def __init__(self):
        super(MetaDirRepositoryFormat, self).__init__()

    def _create_control_files(self, a_bzrdir):
        """Create the required files and the initial control_files object."""
        # FIXME: RBC 20060125 don't peek under the covers
        # NB: no need to escape relative paths that are url safe.
        repository_transport = a_bzrdir.get_repository_transport(self)
        control_files = lockable_files.LockableFiles(repository_transport,
                                'lock', lockdir.LockDir)
        control_files.create_lock()
        return control_files

    def _upload_blank_content(self, a_bzrdir, dirs, files, utf8_files, shared):
        """Upload the initial blank content.

        :param a_bzrdir: The bzrdir receiving the repository; also supplies
            the directory and file modes.
        :param dirs: Directory names to create on the repository transport.
        :param files: (filename, content_stream) pairs written with put_file.
        :param utf8_files: (filename, content_bytes) pairs written with
            put_bytes_non_atomic.  The caller's sequence is not modified.
        :param shared: When equal to True an empty 'shared-storage' file is
            written as well.
        """
        if shared == True:
            # Build a new list instead of using +=, which would append to
            # the caller's list in place.
            utf8_files = list(utf8_files) + [('shared-storage', '')]
        control_files = self._create_control_files(a_bzrdir)
        control_files.lock_write()
        transport = control_files._transport
        try:
            transport.mkdir_multi(dirs, mode=a_bzrdir._get_dir_mode())
            for (filename, content_stream) in files:
                transport.put_file(filename, content_stream,
                    mode=a_bzrdir._get_file_mode())
            for (filename, content_bytes) in utf8_files:
                transport.put_bytes_non_atomic(filename, content_bytes,
                    mode=a_bzrdir._get_file_mode())
        finally:
            control_files.unlock()

    def network_name(self):
        """Metadir formats have matching disk and network format strings."""
        return self.get_format_string()

3246

3247

3248

# Pre-0.8 formats have no disk format string of their own, because they are
# versioned by the matching control directory.  The control directory's disk
# format string is used as the network_name key instead: it meets the
# constraints (simple string, unique, immutable).
network_format_registry.register_lazy(
    "Bazaar-NG branch, format 5\n",
    'bzrlib.repofmt.weaverepo', 'RepositoryFormat5')
network_format_registry.register_lazy(
    "Bazaar-NG branch, format 6\n",
    'bzrlib.repofmt.weaverepo', 'RepositoryFormat6')

# Formats without a format string are not discoverable or independently
# creatable on disk, so they are not registered in format_registry.  They all
# live in bzrlib.repofmt.weaverepo now.  When an instance of one of these is
# needed, the BzrDir constructs it directly.  Non-native formats where the
# repository is not separately opened are similar.

format_registry.register_lazy(
    'Bazaar-NG Repository format 7',
    'bzrlib.repofmt.weaverepo', 'RepositoryFormat7')

format_registry.register_lazy(
    'Bazaar-NG Knit Repository Format 1',
    'bzrlib.repofmt.knitrepo', 'RepositoryFormatKnit1')

format_registry.register_lazy(
    'Bazaar Knit Repository Format 3 (bzr 0.15)\n',
    'bzrlib.repofmt.knitrepo', 'RepositoryFormatKnit3')

format_registry.register_lazy(
    'Bazaar Knit Repository Format 4 (bzr 1.0)\n',
    'bzrlib.repofmt.knitrepo', 'RepositoryFormatKnit4')

# Pack-based formats.  There is one format for pre-subtrees and one for
# post-subtrees, to allow ease of testing.
# NOTE: These are experimental in 0.92. Stable in 1.0 and above
format_registry.register_lazy(
    'Bazaar pack repository format 1 (needs bzr 0.92)\n',
    'bzrlib.repofmt.pack_repo', 'RepositoryFormatKnitPack1')
format_registry.register_lazy(
    'Bazaar pack repository format 1 with subtree support (needs bzr 0.92)\n',
    'bzrlib.repofmt.pack_repo', 'RepositoryFormatKnitPack3')
format_registry.register_lazy(
    'Bazaar pack repository format 1 with rich root (needs bzr 1.0)\n',
    'bzrlib.repofmt.pack_repo', 'RepositoryFormatKnitPack4')
format_registry.register_lazy(
    'Bazaar RepositoryFormatKnitPack5 (bzr 1.6)\n',
    'bzrlib.repofmt.pack_repo', 'RepositoryFormatKnitPack5')
format_registry.register_lazy(
    'Bazaar RepositoryFormatKnitPack5RichRoot (bzr 1.6.1)\n',
    'bzrlib.repofmt.pack_repo', 'RepositoryFormatKnitPack5RichRoot')
format_registry.register_lazy(
    'Bazaar RepositoryFormatKnitPack5RichRoot (bzr 1.6)\n',
    'bzrlib.repofmt.pack_repo', 'RepositoryFormatKnitPack5RichRootBroken')
format_registry.register_lazy(
    'Bazaar RepositoryFormatKnitPack6 (bzr 1.9)\n',
    'bzrlib.repofmt.pack_repo', 'RepositoryFormatKnitPack6')
format_registry.register_lazy(
    'Bazaar RepositoryFormatKnitPack6RichRoot (bzr 1.9)\n',
    'bzrlib.repofmt.pack_repo', 'RepositoryFormatKnitPack6RichRoot')

# Development formats.
# Obsolete but kept pending a CHK based subtree format.
format_registry.register_lazy(
    ("Bazaar development format 2 with subtree support "
        "(needs bzr.dev from before 1.8)\n"),
    'bzrlib.repofmt.pack_repo', 'RepositoryFormatPackDevelopment2Subtree')

# 1.14->1.16 go below here
format_registry.register_lazy(
    'Bazaar development format - group compression and chk inventory'
        ' (needs bzr.dev from 1.14)\n',
    'bzrlib.repofmt.groupcompress_repo', 'RepositoryFormatCHK1')

format_registry.register_lazy(
    'Bazaar development format - chk repository with bencode revision '
        'serialization (needs bzr.dev from 1.16)\n',
    'bzrlib.repofmt.groupcompress_repo', 'RepositoryFormatCHK2')
format_registry.register_lazy(
    'Bazaar repository format 2a (needs bzr 1.16 or later)\n',
    'bzrlib.repofmt.groupcompress_repo', 'RepositoryFormat2a')

3365

3366

3367

class InterRepository(InterObject):
    """This class represents operations taking place between two repositories.

    Its instances have methods like copy_content and fetch, and contain
    references to the source and target repositories these operations can be
    carried out on.

    Often we will provide convenience methods on 'repository' which carry out
    operations with another repository - they will always forward to
    InterRepository.get(other).method_name(parameters).
    """

    # Number of revisions _walk_to_common_revisions gathers from the source
    # searcher before querying the target graph.
    _walk_to_common_revisions_batch_size = 50
    _optimisers = []
    """The available optimised InterRepository types."""

    @needs_write_lock
    def copy_content(self, revision_id=None):
        """Make a complete copy of the content in self into destination.

        This is a destructive operation! Do not use it on existing
        repositories.

        :param revision_id: Only copy the content needed to construct
                            revision_id and its parents.
        """
        try:
            self.target.set_make_working_trees(self.source.make_working_trees())
        except NotImplementedError:
            # Best effort: the working-tree policy could not be copied.
            pass
        self.target.fetch(self.source, revision_id=revision_id)

    @needs_write_lock
    def fetch(self, revision_id=None, pb=None, find_ghosts=False,
            fetch_spec=None):
        """Fetch the content required to construct revision_id.

        The content is copied from self.source to self.target.

        :param revision_id: if None all content is copied, if NULL_REVISION no
                            content is copied.
        :param pb: optional progress bar to use for progress reports. If not
                   provided a default one will be created.
        :param find_ghosts: passed through to RepoFetcher.
        :param fetch_spec: passed through to RepoFetcher.
        :return: None.
        """
        from bzrlib.fetch import RepoFetcher
        # Only the constructor is invoked here; the instance is not needed
        # afterwards, so it is not bound to a name.
        RepoFetcher(to_repository=self.target,
                    from_repository=self.source,
                    last_revision=revision_id,
                    fetch_spec=fetch_spec,
                    pb=pb, find_ghosts=find_ghosts)

    def _walk_to_common_revisions(self, revision_ids):
        """Walk out from revision_ids in source to revisions target has.

        :param revision_ids: The start point for the search.
        :return: The result of the breadth-first searcher's get_result().
        :raises errors.NoSuchRevision: if one of revision_ids is a ghost in
            the source and is not present in the target either.
        """
        target_graph = self.target.get_graph()
        revision_ids = frozenset(revision_ids)
        source_graph = self.source.get_graph()
        # ensure we don't pay silly lookup costs.
        searcher = source_graph._make_breadth_first_searcher(revision_ids)
        null_set = frozenset([_mod_revision.NULL_REVISION])
        searcher_exhausted = False
        while True:
            next_revs = set()
            ghosts = set()
            # Iterate the searcher until we have enough next_revs
            while len(next_revs) < self._walk_to_common_revisions_batch_size:
                try:
                    next_revs_part, ghosts_part = searcher.next_with_ghosts()
                    next_revs.update(next_revs_part)
                    ghosts.update(ghosts_part)
                except StopIteration:
                    searcher_exhausted = True
                    break
            # If there are ghosts in the source graph, and the caller asked for
            # them, make sure that they are present in the target.
            # We don't care about other ghosts as we can't fetch them and
            # haven't been asked to.
            ghosts_to_check = set(revision_ids.intersection(ghosts))
            revs_to_get = set(next_revs).union(ghosts_to_check)
            if revs_to_get:
                have_revs = set(target_graph.get_parent_map(revs_to_get))
                # we always have NULL_REVISION present.
                have_revs = have_revs.union(null_set)
                # Check if the target is missing any ghosts we need.
                ghosts_to_check.difference_update(have_revs)
                if ghosts_to_check:
                    # One of the caller's revision_ids is a ghost in both the
                    # source and the target.
                    raise errors.NoSuchRevision(
                        self.source, ghosts_to_check.pop())
                # Because we may have walked past the original stop point, make
                # sure everything is stopped
                stop_revs = searcher.find_seen_ancestors(have_revs)
                searcher.stop_searching_any(stop_revs)
            if searcher_exhausted:
                break
        return searcher.get_result()

    @needs_read_lock
    def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):
        """Return the revision ids that source has that target does not.

        :param revision_id: only return revision ids included by this
                            revision_id.
        :param find_ghosts: If True find missing revisions in deep history
            rather than just finding the surface difference.
        :return: A bzrlib.graph.SearchResult.
        """
        # stop searching at found target revisions.
        if not find_ghosts and revision_id is not None:
            return self._walk_to_common_revisions([revision_id])
        # generic, possibly worst case, slow code path.
        target_ids = set(self.target.all_revision_ids())
        if revision_id is not None:
            source_ids = self.source.get_ancestry(revision_id)
            # The first ancestry entry is expected to be None; drop it.
            if source_ids[0] is not None:
                raise AssertionError()
            source_ids.pop(0)
        else:
            source_ids = self.source.all_revision_ids()
        result_set = set(source_ids).difference(target_ids)
        return self.source.revision_ids_to_search_result(result_set)

    @staticmethod
    def _same_model(source, target):
        """True if source and target have the same data representation.

        Note: this is always called on the base class; overriding it in a
        subclass will have no effect.
        """
        try:
            InterRepository._assert_same_model(source, target)
            return True
        except errors.IncompatibleRepositories:
            return False

    @staticmethod
    def _assert_same_model(source, target):
        """Raise an exception if two repositories do not use the same model.

        :raises errors.IncompatibleRepositories: if rich-root support or
            the serializer differs between source and target.
        """
        if source.supports_rich_root() != target.supports_rich_root():
            raise errors.IncompatibleRepositories(source, target,
                "different rich-root support")
        if source._serializer != target._serializer:
            raise errors.IncompatibleRepositories(source, target,
                "different serializers")

3519

3520

3521

class InterSameDataRepository(InterRepository):
    """Conversion between repositories that represent the same data.

    Data format and model must match for this to work.
    """

    @classmethod
    def _get_repo_format_to_test(self):
        """Repository format for testing with.

        InterSameData can pull from subtree to subtree and from non-subtree to
        non-subtree, so we test this with the richest repository format.
        """
        from bzrlib.repofmt.knitrepo import RepositoryFormatKnit3
        return RepositoryFormatKnit3()

    @staticmethod
    def is_compatible(source, target):
        """Compatible exactly when InterRepository._same_model says so."""
        models_match = InterRepository._same_model(source, target)
        return models_match

3540

3541

3542

class InterWeaveRepo(InterSameDataRepository):
    """Optimised code paths between Weave based repositories.

    This should be in bzrlib/repofmt/weaverepo.py but we have not yet
    implemented lazy inter-object optimisation.
    """

    @classmethod
    def _get_repo_format_to_test(self):
        """Return a RepositoryFormat7 instance for testing with."""
        from bzrlib.repofmt import weaverepo
        return weaverepo.RepositoryFormat7()

    @staticmethod
    def is_compatible(source, target):
        """Be compatible with known Weave formats.

        We don't test for the stores being of specific types because that
        could lead to confusing results, and there is no need to be
        overly general.
        """
        from bzrlib.repofmt.weaverepo import (
                RepositoryFormat5,
                RepositoryFormat6,
                RepositoryFormat7,
                )
        weave_formats = (RepositoryFormat5,
                         RepositoryFormat6,
                         RepositoryFormat7)
        try:
            return (isinstance(source._format, weave_formats) and
                    isinstance(target._format, weave_formats))
        except AttributeError:
            # One side has no _format attribute at all.
            return False

    @needs_write_lock
    def copy_content(self, revision_id=None):
        """See InterRepository.copy_content()."""
        # weave specific optimised path:
        try:
            self.target.set_make_working_trees(self.source.make_working_trees())
        except (errors.RepositoryUpgradeRequired, NotImplementedError):
            # NotImplementedError is the exception class; the NotImplemented
            # constant previously listed here is not an exception and could
            # never match.
            pass
        # FIXME do not peek!
        if self.source._transport.listable():
            pb = ui.ui_factory.nested_progress_bar()
            try:
                self.target.texts.insert_record_stream(
                    self.source.texts.get_record_stream(
                        self.source.texts.keys(), 'topological', False))
                pb.update('Copying inventory', 0, 1)
                self.target.inventories.insert_record_stream(
                    self.source.inventories.get_record_stream(
                        self.source.inventories.keys(), 'topological', False))
                self.target.signatures.insert_record_stream(
                    self.source.signatures.get_record_stream(
                        self.source.signatures.keys(),
                        'unordered', True))
                self.target.revisions.insert_record_stream(
                    self.source.revisions.get_record_stream(
                        self.source.revisions.keys(),
                        'topological', True))
            finally:
                pb.finished()
        else:
            self.target.fetch(self.source, revision_id=revision_id)

    @needs_read_lock
    def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):
        """See InterRepository.search_missing_revision_ids()."""
        # we want all revisions to satisfy revision_id in source.
        # but we don't want to stat every file here and there.
        # we want then, all revisions other needs to satisfy revision_id
        # checked, but not those that we have locally.
        # so the first thing is to get a subset of the revisions to
        # satisfy revision_id in source, and then eliminate those that
        # we do already have.
        # this is slow on high latency connection to self, but as this
        # disk format scales terribly for push anyway due to rewriting
        # inventory.weave, this is considered acceptable.
        # - RBC 20060209
        if revision_id is not None:
            source_ids = self.source.get_ancestry(revision_id)
            # The first ancestry entry is expected to be None; drop it.
            if source_ids[0] is not None:
                raise AssertionError()
            source_ids.pop(0)
        else:
            source_ids = self.source._all_possible_ids()
        source_ids_set = set(source_ids)
        # source_ids is the worst possible case we may need to pull.
        # now we want to filter source_ids against what we actually
        # have in target, but don't try to check for existence where we know
        # we do not have a revision as that would be pointless.
        target_ids = set(self.target._all_possible_ids())
        possibly_present_revisions = target_ids.intersection(source_ids_set)
        actually_present_revisions = set(
            self.target._eliminate_revisions_not_present(possibly_present_revisions))
        required_revisions = source_ids_set.difference(actually_present_revisions)
        if revision_id is not None:
            # we used get_ancestry to determine source_ids then we are assured all
            # revisions referenced are present as they are installed in topological order.
            # and the tip revision was validated by get_ancestry.
            result_set = required_revisions
        else:
            # if we just grabbed the possibly available ids, then
            # we only have an estimate of whats available and need to validate
            # that against the revision records.
            result_set = set(
                self.source._eliminate_revisions_not_present(required_revisions))
        return self.source.revision_ids_to_search_result(result_set)

3652

3653

3654

class InterKnitRepo(InterSameDataRepository):
    """Optimised code paths between Knit based repositories."""

    @classmethod
    def _get_repo_format_to_test(cls):
        """Return a RepositoryFormatKnit1 instance."""
        from bzrlib.repofmt import knitrepo
        return knitrepo.RepositoryFormatKnit1()

    @staticmethod
    def is_compatible(source, target):
        """Tell whether both repositories use a known Knit format.

        The stores themselves are deliberately not inspected; only the
        repository formats are compared.

        :return: False when either repository has no ``_format`` attribute
            or is not a RepositoryFormatKnit; otherwise whatever
            InterRepository._same_model(source, target) returns.
        """
        from bzrlib.repofmt.knitrepo import RepositoryFormatKnit
        try:
            both_knit = (isinstance(source._format, RepositoryFormatKnit)
                and isinstance(target._format, RepositoryFormatKnit))
        except AttributeError:
            return False
        if not both_knit:
            return False
        return InterRepository._same_model(source, target)

    @needs_read_lock
    def search_missing_revision_ids(self, revision_id=None, find_ghosts=True):
        """See InterRepository.missing_revision_ids()."""
        have_tip = revision_id is not None
        if have_tip:
            candidates = self.source.get_ancestry(revision_id)
            # get_ancestry is expected to lead with a None placeholder.
            if candidates[0] is not None:
                raise AssertionError()
            del candidates[0]
        else:
            candidates = self.source.all_revision_ids()
        wanted = set(candidates)
        # 'wanted' is the worst case of what may have to be pulled.  Only ask
        # the target to confirm revisions it might plausibly hold; checking
        # for ones it cannot have would be pointless.
        maybe_in_target = set(self.target.all_revision_ids()).intersection(
            wanted)
        in_target = set(
            self.target._eliminate_revisions_not_present(maybe_in_target))
        missing = wanted.difference(in_target)
        if not have_tip:
            # The ids came from a listing of possibly available revisions, so
            # they are only an estimate and must be validated against the
            # revision records.
            missing = set(
                self.source._eliminate_revisions_not_present(missing))
        # Otherwise the ids came from get_ancestry, which validated the tip;
        # revisions are installed in topological order so every referenced
        # revision is present.
        return self.source.revision_ids_to_search_result(missing)

3710

3711

3712

class InterDifferingSerializer(InterRepository):
    """InterRepository that fetches revision by revision.

    For every revision an inventory delta is computed against an already
    converted tree, the texts it introduces are copied, and the delta,
    signature and revision are inserted into the target.
    """

    @classmethod
    def _get_repo_format_to_test(cls):
        return None

    @staticmethod
    def is_compatible(source, target):
        """Return True if this code path may be used for source -> target.

        Refuses when the source has rich roots or tree references that the
        target cannot represent, when the target is stacked and uses CHKs,
        and (unless the 'IDS_always' debug flag is set) when either
        repository is not on a ``file:///`` transport.  The 'IDS_never'
        debug flag disables this code path entirely.
        """
        # This is redundant with format.check_conversion_target(), however that
        # raises an exception, and we just want to say "False" as in we won't
        # support converting between these formats.
        if 'IDS_never' in debug.debug_flags:
            return False
        if source.supports_rich_root() and not target.supports_rich_root():
            return False
        if (source._format.supports_tree_reference
            and not target._format.supports_tree_reference):
            return False
        if target._fallback_repositories and target._format.supports_chks:
            # IDS doesn't know how to copy CHKs for the parent inventories it
            # adds to stacked repos.
            return False
        if 'IDS_always' in debug.debug_flags:
            return True
        # Only use this code path for local source and target.  IDS does far
        # too much IO (both bandwidth and roundtrips) over a network.
        if not source.bzrdir.transport.base.startswith('file:///'):
            return False
        if not target.bzrdir.transport.base.startswith('file:///'):
            return False
        return True

    def _get_trees(self, revision_ids, cache):
        """Return [(revision_id, tree)] for the ids that have a tree.

        Trees are taken from cache when possible; otherwise they are read
        from the source and added to cache.  Ids for which the source raises
        NoSuchRevision (ghosts) are silently left out.
        """
        possible_trees = []
        for rev_id in revision_ids:
            if rev_id in cache:
                possible_trees.append((rev_id, cache[rev_id]))
            else:
                # Not cached, but inventory might be present anyway.
                try:
                    tree = self.source.revision_tree(rev_id)
                except errors.NoSuchRevision:
                    # Nope, parent is ghost.
                    pass
                else:
                    cache[rev_id] = tree
                    possible_trees.append((rev_id, tree))
        return possible_trees

    def _get_delta_for_revision(self, tree, parent_ids, possible_trees):
        """Get the best delta and base for this revision.

        :param tree: The tree of the revision being converted.
        :param parent_ids: Unused; kept for interface compatibility.
        :param possible_trees: Non-empty list of (basis_id, basis_tree)
            candidates to delta against.
        :return: (basis_id, delta)
        """
        deltas = []
        # Generate deltas against each tree, to find the shortest.
        for basis_id, basis_tree in possible_trees:
            delta = tree.inventory._make_delta(basis_tree.inventory)
            deltas.append((len(delta), basis_id, delta))
        deltas.sort()
        return deltas[0][1:]

    def _fetch_parent_invs_for_stacking(self, parent_map, cache):
        """Find all parent revisions that are absent, but for which the
        inventory is present, and copy those inventories.

        This is necessary to preserve correctness when the source is stacked
        without fallbacks configured.  (Note that in cases like upgrade the
        source may be not have _fallback_repositories even though it is
        stacked.)
        """
        parent_revs = set()
        for parents in parent_map.values():
            parent_revs.update(parents)
        present_parents = self.source.get_parent_map(parent_revs)
        absent_parents = set(parent_revs).difference(present_parents)
        parent_invs_keys_for_stacking = self.source.inventories.get_parent_map(
            (rev_id,) for rev_id in absent_parents)
        parent_inv_ids = [key[-1] for key in parent_invs_keys_for_stacking]
        for parent_tree in self.source.revision_trees(parent_inv_ids):
            current_revision_id = parent_tree.get_revision_id()
            parents_parents_keys = parent_invs_keys_for_stacking[
                (current_revision_id,)]
            parents_parents = [key[-1] for key in parents_parents_keys]
            # These inventories are always inserted as a delta against the
            # null revision.
            basis_id = _mod_revision.NULL_REVISION
            basis_tree = self.source.revision_tree(basis_id)
            delta = parent_tree.inventory._make_delta(basis_tree.inventory)
            self.target.add_inventory_by_delta(
                basis_id, delta, current_revision_id, parents_parents)
            cache[current_revision_id] = parent_tree

    def _fetch_batch(self, revision_ids, basis_id, cache):
        """Fetch across a few revisions.

        :param revision_ids: The revisions to copy
        :param basis_id: The revision_id of a tree that must be in cache, used
            as a basis for delta when no other base is available
        :param cache: A cache of RevisionTrees that we can use.
        :return: The revision_id of the last converted tree. The RevisionTree
            for it will be in cache
        """
        # Walk though all revisions; get inventory deltas, copy referenced
        # texts that delta references, insert the delta, revision and
        # signature.
        root_keys_to_create = set()
        text_keys = set()
        pending_deltas = []
        pending_revisions = []
        parent_map = self.source.get_parent_map(revision_ids)
        self._fetch_parent_invs_for_stacking(parent_map, cache)
        for tree in self.source.revision_trees(revision_ids):
            # Find a inventory delta for this revision.
            # Find text entries that need to be copied, too.
            current_revision_id = tree.get_revision_id()
            parent_ids = parent_map.get(current_revision_id, ())
            parent_trees = self._get_trees(parent_ids, cache)
            possible_trees = list(parent_trees)
            if len(possible_trees) == 0:
                # There either aren't any parents, or the parents are ghosts,
                # so just use the last converted tree.
                possible_trees.append((basis_id, cache[basis_id]))
            basis_id, delta = self._get_delta_for_revision(tree, parent_ids,
                                                           possible_trees)
            revision = self.source.get_revision(current_revision_id)
            pending_deltas.append((basis_id, delta,
                current_revision_id, revision.parent_ids))
            if self._converting_to_rich_root:
                self._revision_id_to_root_id[current_revision_id] = \
                    tree.get_root_id()
            # Determine which texts are in present in this revision but not in
            # any of the available parents.
            texts_possibly_new_in_tree = set()
            for old_path, new_path, file_id, entry in delta:
                if new_path is None:
                    # This file_id isn't present in the new rev
                    continue
                if not new_path:
                    # This is the root
                    if not self.target.supports_rich_root():
                        # The target doesn't support rich root, so we don't
                        # copy
                        continue
                    if self._converting_to_rich_root:
                        # This can't be copied normally, we have to insert
                        # it specially
                        root_keys_to_create.add((file_id, entry.revision))
                        continue
                texts_possibly_new_in_tree.add((file_id, entry.revision))
            # Drop every text that one of the candidate bases already holds
            # at the same revision.  The loop variable is deliberately not
            # called basis_id so the chosen basis is not clobbered.
            for unused_id, basis_tree in possible_trees:
                basis_inv = basis_tree.inventory
                for file_key in list(texts_possibly_new_in_tree):
                    file_id, file_revision = file_key
                    try:
                        entry = basis_inv[file_id]
                    except errors.NoSuchId:
                        continue
                    if entry.revision == file_revision:
                        texts_possibly_new_in_tree.remove(file_key)
            text_keys.update(texts_possibly_new_in_tree)
            pending_revisions.append(revision)
            cache[current_revision_id] = tree
            basis_id = current_revision_id
        # Copy file texts
        from_texts = self.source.texts
        to_texts = self.target.texts
        if root_keys_to_create:
            from bzrlib.fetch import _new_root_data_stream
            root_stream = _new_root_data_stream(
                root_keys_to_create, self._revision_id_to_root_id, parent_map,
                self.source)
            to_texts.insert_record_stream(root_stream)
        to_texts.insert_record_stream(from_texts.get_record_stream(
            text_keys, self.target._format._fetch_order,
            not self.target._format._fetch_uses_deltas))
        # insert inventory deltas
        for delta in pending_deltas:
            self.target.add_inventory_by_delta(*delta)
        if self.target._fallback_repositories:
            # Make sure this stacked repository has all the parent inventories
            # for the new revisions that we are about to insert.  We do this
            # before adding the revisions so that no revision is added until
            # all the inventories it may depend on are added.
            # Note that this is overzealous, as we may have fetched these in an
            # earlier batch.
            parent_ids = set()
            revision_ids = set()
            for revision in pending_revisions:
                revision_ids.add(revision.revision_id)
                parent_ids.update(revision.parent_ids)
            parent_ids.difference_update(revision_ids)
            parent_ids.discard(_mod_revision.NULL_REVISION)
            parent_map = self.source.get_parent_map(parent_ids)
            # we iterate over parent_map and not parent_ids because we don't
            # want to try copying any revision which is a ghost
            for parent_tree in self.source.revision_trees(parent_map):
                current_revision_id = parent_tree.get_revision_id()
                parents_parents = parent_map[current_revision_id]
                possible_trees = self._get_trees(parents_parents, cache)
                if len(possible_trees) == 0:
                    # There either aren't any parents, or the parents are
                    # ghosts, so just use the last converted tree.
                    possible_trees.append((basis_id, cache[basis_id]))
                # NOTE(review): this rebinds basis_id, so in the stacked case
                # the value returned below is the basis used for the last
                # parent inventory rather than the last converted revision.
                # Left unchanged; confirm whether that is intended.
                basis_id, delta = self._get_delta_for_revision(parent_tree,
                    parents_parents, possible_trees)
                self.target.add_inventory_by_delta(
                    basis_id, delta, current_revision_id, parents_parents)
        # insert signatures and revisions
        for revision in pending_revisions:
            try:
                signature = self.source.get_signature_text(
                    revision.revision_id)
                self.target.add_signature_text(revision.revision_id,
                    signature)
            except errors.NoSuchRevision:
                # No signature to copy for this revision.
                pass
            self.target.add_revision(revision.revision_id, revision)
        return basis_id

    def _fetch_all_revisions(self, revision_ids, pb):
        """Fetch everything for the list of revisions.

        Revisions are copied in batches, each inside its own write group on
        the target.

        :param revision_ids: The list of revisions to fetch. Must be in
            topological order.
        :param pb: A ProgressTask
        :return: None
        """
        basis_id, basis_tree = self._get_basis(revision_ids[0])
        batch_size = 100
        cache = lru_cache.LRUCache(100)
        cache[basis_id] = basis_tree
        del basis_tree # We don't want to hang on to it here
        hints = []
        for offset in range(0, len(revision_ids), batch_size):
            self.target.start_write_group()
            try:
                pb.update('Transferring revisions', offset,
                          len(revision_ids))
                batch = revision_ids[offset:offset+batch_size]
                basis_id = self._fetch_batch(batch, basis_id, cache)
            except:
                # Suppress errors from the abort itself so that the original
                # failure is the one that propagates.
                self.target.abort_write_group(suppress_errors=True)
                raise
            else:
                hint = self.target.commit_write_group()
                if hint:
                    hints.extend(hint)
        if hints and self.target._format.pack_compresses:
            self.target.pack(hint=hints)
        pb.update('Transferring revisions', len(revision_ids),
                  len(revision_ids))

    @needs_write_lock
    def fetch(self, revision_id=None, pb=None, find_ghosts=False,
            fetch_spec=None):
        """See InterRepository.fetch().

        :return: (number of revisions copied, 0)
        """
        if fetch_spec is not None:
            raise AssertionError("Not implemented yet...")
        if (not self.source.supports_rich_root()
            and self.target.supports_rich_root()):
            self._converting_to_rich_root = True
            self._revision_id_to_root_id = {}
        else:
            self._converting_to_rich_root = False
        revision_ids = self.target.search_missing_revision_ids(self.source,
            revision_id, find_ghosts=find_ghosts).get_keys()
        if not revision_ids:
            return 0, 0
        revision_ids = tsort.topo_sort(
            self.source.get_graph().get_parent_map(revision_ids))
        if not revision_ids:
            return 0, 0
        # Walk though all revisions; get inventory deltas, copy referenced
        # texts that delta references, insert the delta, revision and
        # signature.
        if pb is None:
            my_pb = ui.ui_factory.nested_progress_bar()
            pb = my_pb
        else:
            symbol_versioning.warn(
                symbol_versioning.deprecated_in((1, 14, 0))
                % "pb parameter to fetch()")
            my_pb = None
        try:
            self._fetch_all_revisions(revision_ids, pb)
        finally:
            # Only finish a progress bar that was created here.
            if my_pb is not None:
                my_pb.finished()
        return len(revision_ids), 0

    def _get_basis(self, first_revision_id):
        """Get a revision and tree which exists in the target.

        This assumes that first_revision_id is selected for transmission
        because all other ancestors are already present. If we can't find an
        ancestor we fall back to NULL_REVISION since we know that is safe.

        :return: (basis_id, basis_tree)
        """
        first_rev = self.source.get_revision(first_revision_id)
        try:
            basis_id = first_rev.parent_ids[0]
            # only valid as a basis if the target has it
            self.target.get_revision(basis_id)
            # Try to get a basis tree - if its a ghost it will hit the
            # NoSuchRevision case.
            basis_tree = self.source.revision_tree(basis_id)
        except (IndexError, errors.NoSuchRevision):
            basis_id = _mod_revision.NULL_REVISION
            basis_tree = self.source.revision_tree(basis_id)
        return basis_id, basis_tree

4039

4040

4041

# Register the InterRepository implementations named below as optimisers.
InterRepository.register_optimiser(InterDifferingSerializer)

4042

InterRepository.register_optimiser(InterSameDataRepository)

4043

InterRepository.register_optimiser(InterWeaveRepo)

4044

InterRepository.register_optimiser(InterKnitRepo)

4045

4046

4047

class CopyConverter(object):
    """A repository conversion tool which just performs a copy of the content.

    This is slow but quite reliable.
    """

    def __init__(self, target_format):
        """Create a CopyConverter.

        :param target_format: The format the resulting repository should be.
        """
        self.target_format = target_format

    def convert(self, repo, pb):
        """Perform the conversion of repo, giving feedback via pb.

        The existing repository is moved to 'repository.backup', a new
        repository in the target format is initialised in its place, the
        content is copied across and the backup is then deleted.

        :param repo: The repository to convert.
        :param pb: a progress bar to use for progress information.
        """
        self.pb = pb
        self.count = 0
        self.total = 4
        # this is only useful with metadir layouts - separated repo content.
        # trigger an assertion if not such
        repo._format.get_format_string()
        # Validate the target before anything on disk is touched, so that a
        # rejected conversion does not leave the repository renamed to
        # 'repository.backup'.
        repo._format.check_conversion_target(self.target_format)
        self.repo_dir = repo.bzrdir
        self.step('Moving repository to repository.backup')
        self.repo_dir.transport.move('repository', 'repository.backup')
        backup_transport = self.repo_dir.transport.clone('repository.backup')
        self.source_repo = repo._format.open(self.repo_dir,
            _found=True,
            _override_transport=backup_transport)
        self.step('Creating new repository')
        converted = self.target_format.initialize(self.repo_dir,
                                                  self.source_repo.is_shared())
        converted.lock_write()
        try:
            self.step('Copying content')
            self.source_repo.copy_content_into(converted)
        finally:
            converted.unlock()
        self.step('Deleting old repository content')
        self.repo_dir.transport.delete_tree('repository.backup')
        ui.ui_factory.note('repository converted')

    def step(self, message):
        """Update the pb by a step."""
        self.count += 1
        self.pb.update(message, self.count, self.total)

4097

4098

4099

# The five predefined XML entities, keyed by name without '&' and ';'.
_unescape_map = {
    'apos': "'",
    'quot': '"',
    'amp': '&',
    'lt': '<',
    'gt': '>',
    }


def _unescaper(match, _map=_unescape_map):
    """Return the replacement text for one matched XML reference.

    :param match: A regex match whose group 1 is the text between '&' and
        ';'.
    :param _map: Mapping of entity name to replacement text.
    :return: The mapped text for a predefined entity, or the utf8 encoding
        of the character for a numeric reference ('#NNN' decimal or '#xHH'
        hexadecimal).
    :raises KeyError: If the name is neither predefined nor numeric.
    """
    code = match.group(1)
    try:
        return _map[code]
    except KeyError:
        if not code.startswith('#'):
            raise
    if code[1:2] == 'x':
        # Hexadecimal character reference, e.g. '&#x41;'.
        codepoint = int(code[2:], 16)
    else:
        codepoint = int(code[1:])
    return unichr(codepoint).encode('utf8')


# Compiled lazily by _unescape_xml on first use.
_unescape_re = None


def _unescape_xml(data):
    """Unescape predefined XML entities in a string of data."""
    global _unescape_re
    if _unescape_re is None:
        # Raw string: '&' needs no escaping, and '\&' is an invalid escape
        # sequence in a normal string literal.
        _unescape_re = re.compile(r'&([^;]*);')
    return _unescape_re.sub(_unescaper, data)

4127

4128

4129

class _VersionedFileChecker(object):
    """Compare stored text parents with those implied by the inventories."""

    def __init__(self, repository, text_key_references=None, ancestors=None):
        """Build the text key index for repository.

        :param repository: The repository whose texts will be checked.
        :param text_key_references: Passed through to
            repository._generate_text_key_index.
        :param ancestors: Passed through to
            repository._generate_text_key_index.
        """
        self.repository = repository
        self.text_index = self.repository._generate_text_key_index(
            text_key_references=text_key_references, ancestors=ancestors)

    def calculate_file_version_parents(self, text_key):
        """Calculate the correct parents for a file version according to
        the inventories.

        :return: A tuple of parent keys; empty when the index records only
            NULL_REVISION as the parent.
        """
        parent_keys = self.text_index[text_key]
        if parent_keys == [_mod_revision.NULL_REVISION]:
            return ()
        return tuple(parent_keys)

    def check_file_version_parents(self, texts, progress_bar=None):
        """Check the parents stored in a versioned file are correct.

        It also detects file versions that are not referenced by their
        corresponding revision's inventory.

        :param texts: Passed through to _check_file_version_parents.
        :param progress_bar: Progress bar to report to; a nested one is
            created (and finished) here when None.
        :returns: A tuple of (wrong_parents, dangling_file_versions).
            wrong_parents is a dict mapping {text_key: (stored_parents,
            correct_parents)} for each text key where the stored parents
            are not correct.  dangling_file_versions is a set of (file_id,
            revision_id) tuples for versions that are present in this versioned
            file, but not used by the corresponding inventory.
        """
        local_progress = None
        if progress_bar is None:
            local_progress = ui.ui_factory.nested_progress_bar()
            progress_bar = local_progress
        try:
            return self._check_file_version_parents(texts, progress_bar)
        finally:
            if local_progress:
                local_progress.finished()

    def _check_file_version_parents(self, texts, progress_bar):
        """See check_file_version_parents.

        The texts argument is not used; self.repository.texts is consulted.
        """
        wrong_parents = {}
        self.file_ids = set([file_id for file_id, _ in
            self.text_index.iterkeys()])
        # text keys is now grouped by file_id
        n_versions = len(self.text_index)
        progress_bar.update('loading text store', 0, n_versions)
        parent_map = self.repository.texts.get_parent_map(self.text_index)
        # On unlistable transports this could well be empty/error...
        text_keys = self.repository.texts.keys()
        unused_keys = frozenset(text_keys) - set(self.text_index)
        for num, key in enumerate(self.text_index.iterkeys()):
            progress_bar.update('checking text graph', num, n_versions)
            correct_parents = self.calculate_file_version_parents(key)
            try:
                knit_parents = parent_map[key]
            except KeyError:
                # Missing text!  A plain mapping signals an absent key with
                # KeyError, which used to escape this loop.
                knit_parents = None
            except errors.RevisionNotPresent:
                # Missing text!
                knit_parents = None
            if correct_parents != knit_parents:
                wrong_parents[key] = (knit_parents, correct_parents)
        return wrong_parents, unused_keys

4191

4192

4193

def _old_get_graph(repository, revision_id):
    """DO NOT USE. That is all. I'm serious.

    Builds a {revision_id: parents} dict from the ancestry of revision_id,
    leaving out entries whose parents are None, and passes it through
    _strip_NULL_ghosts.
    """
    ancestry = repository.get_graph().iter_ancestry([revision_id])
    present = {}
    for node, parents in ancestry:
        if parents is not None:
            present[node] = parents
    return _strip_NULL_ghosts(present)

4199

4200

4201

def _strip_NULL_ghosts(revision_graph):
    """Also don't use this. more compatibility code for unmigrated clients.

    Modifies revision_graph in place and returns it: the NULL_REVISION entry
    is removed and every parents value becomes a tuple holding only the
    parents that are themselves keys of the graph.
    """
    null_id = _mod_revision.NULL_REVISION
    # Filter ghosts, and null:
    if null_id in revision_graph:
        del revision_graph[null_id]
    for revision_id, parent_ids in revision_graph.items():
        known_parents = [parent_id for parent_id in parent_ids
                         if parent_id in revision_graph]
        revision_graph[revision_id] = tuple(known_parents)
    return revision_graph

4210

4211

4212

class StreamSink(object):

4213

"""An object that can insert a stream into a repository.

4214

4215

This interface handles the complexity of reserialising inventories and

4216

revisions from different formats, and allows unidirectional insertion into

4217

stacked repositories without looking for the missing basis parents

4218

beforehand.

4219

"""

4220

4221

def __init__(self, target_repo):

4222

self.target_repo = target_repo

4223

4224

def insert_stream(self, stream, src_format, resume_tokens):

4225

"""Insert a stream's content into the target repository.

4226

4227

:param src_format: a bzr repository format.

4228

4229

:return: a list of resume tokens and an iterable of keys additional

4230

items required before the insertion can be completed.

4231

"""

4232

self.target_repo.lock_write()

4233

try:

4234

if resume_tokens:

4235

self.target_repo.resume_write_group(resume_tokens)

4236

is_resume = True

4237

else:

4238

self.target_repo.start_write_group()

4239

is_resume = False

4240

try:

4241

# locked_insert_stream performs a commit|suspend.

4242

return self._locked_insert_stream(stream, src_format, is_resume)

4243

except:

4244

self.target_repo.abort_write_group(suppress_errors=True)

4245

raise

4246

finally:

4247

self.target_repo.unlock()

4248

4249

def _locked_insert_stream(self, stream, src_format, is_resume):

4250

to_serializer = self.target_repo._format._serializer

4251

src_serializer = src_format._serializer

4252

new_pack = None

4253

if to_serializer == src_serializer:

4254

# If serializers match and the target is a pack repository, set the

4255

# write cache size on the new pack. This avoids poor performance

4256

# on transports where append is unbuffered (such as

4257

# RemoteTransport). This is safe to do because nothing should read

4258

# back from the target repository while a stream with matching

4259

# serialization is being inserted.

4260

# The exception is that a delta record from the source that should

4261

# be a fulltext may need to be expanded by the target (see

4262

# test_fetch_revisions_with_deltas_into_pack); but we take care to

4263

# explicitly flush any buffered writes first in that rare case.

4264

try:

4265

new_pack = self.target_repo._pack_collection._new_pack

4266

except AttributeError:

4267

# Not a pack repository

4268

pass

4269

else:

4270

new_pack.set_write_cache_size(1024*1024)

4271

for substream_type, substream in stream:

4272

if 'stream' in debug.debug_flags:

4273

mutter('inserting substream: %s', substream_type)

4274

if substream_type == 'texts':

4275

self.target_repo.texts.insert_record_stream(substream)

4276

elif substream_type == 'inventories':

4277

if src_serializer == to_serializer:

4278

self.target_repo.inventories.insert_record_stream(

4279

substream)

4280

else:

4281

self._extract_and_insert_inventories(

4282

substream, src_serializer)

4283

elif substream_type == 'inventory-deltas':

4284

self._extract_and_insert_inventory_deltas(

4285

substream, src_serializer)

4286

elif substream_type == 'chk_bytes':

4287

# XXX: This doesn't support conversions, as it assumes the

4288

# conversion was done in the fetch code.

4289

self.target_repo.chk_bytes.insert_record_stream(substream)

4290

elif substream_type == 'revisions':

4291

# This may fallback to extract-and-insert more often than

4292

# required if the serializers are different only in terms of

4293

# the inventory.

4294

if src_serializer == to_serializer:

4295

self.target_repo.revisions.insert_record_stream(

4296

substream)

4297

else:

4298

self._extract_and_insert_revisions(substream,

4299

src_serializer)

4300

elif substream_type == 'signatures':

4301

self.target_repo.signatures.insert_record_stream(substream)

4302

else:

4303

raise AssertionError('kaboom! %s' % (substream_type,))

4304

# Done inserting data, and the missing_keys calculations will try to

4305

# read back from the inserted data, so flush the writes to the new pack

4306

# (if this is pack format).

4307

if new_pack is not None:

4308

new_pack._write_data('', flush=True)

4309

# Find all the new revisions (including ones from resume_tokens)

4310

missing_keys = self.target_repo.get_missing_parent_inventories(

4311

check_for_missing_texts=is_resume)

4312

try:

4313

for prefix, versioned_file in (

4314

('texts', self.target_repo.texts),

4315

('inventories', self.target_repo.inventories),

4316

('revisions', self.target_repo.revisions),

4317

('signatures', self.target_repo.signatures),

4318

('chk_bytes', self.target_repo.chk_bytes),

4319

4320

if versioned_file is None:

4321

continue

4322

missing_keys.update((prefix,) + key for key in

4323

versioned_file.get_missing_compression_parent_keys())

4324

except NotImplementedError:

4325

# cannot even attempt suspending, and missing would have failed

4326

# during stream insertion.

4327

missing_keys = set()

4328

else:

4329

if missing_keys:

4330

# suspend the write group and tell the caller what we is

4331

# missing. We know we can suspend or else we would not have

4332

# entered this code path. (All repositories that can handle

4333

# missing keys can handle suspending a write group).

4334

write_group_tokens = self.target_repo.suspend_write_group()

4335

return write_group_tokens, missing_keys

4336

hint = self.target_repo.commit_write_group()

4337

if (to_serializer != src_serializer and

4338

self.target_repo._format.pack_compresses):

4339

self.target_repo.pack(hint=hint)

4340

return [], set()

4341

4342

def _extract_and_insert_inventory_deltas(self, substream, serializer):

4343

target_rich_root = self.target_repo._format.rich_root_data

4344

target_tree_refs = self.target_repo._format.supports_tree_reference

4345

for record in substream:

4346

# Insert the delta directly

4347

inventory_delta_bytes = record.get_bytes_as('fulltext')

4348

deserialiser = inventory_delta.InventoryDeltaDeserializer()

4349

try:

4350

parse_result = deserialiser.parse_text_bytes(

4351

inventory_delta_bytes)

4352

except inventory_delta.IncompatibleInventoryDelta, err:

4353

trace.mutter("Incompatible delta: %s", err.msg)

4354

raise errors.IncompatibleRevision(self.target_repo._format)

4355

basis_id, new_id, rich_root, tree_refs, inv_delta = parse_result

4356

revision_id = new_id

4357

parents = [key[0] for key in record.parents]

4358

self.target_repo.add_inventory_by_delta(

4359

basis_id, inv_delta, revision_id, parents)

4360

4361

def _extract_and_insert_inventories(self, substream, serializer,

4362

parse_delta=None):

4363

"""Generate a new inventory versionedfile in target, converting data.

4364

4365

The inventory is retrieved from the source, (deserializing it), and

4366

stored in the target (reserializing it in a different format).

4367

"""

4368

target_rich_root = self.target_repo._format.rich_root_data

4369

target_tree_refs = self.target_repo._format.supports_tree_reference

4370

for record in substream:

4371

# It's not a delta, so it must be a fulltext in the source

4372

# serializer's format.

4373

bytes = record.get_bytes_as('fulltext')

4374

revision_id = record.key[0]

4375

inv = serializer.read_inventory_from_string(bytes, revision_id)

4376

parents = [key[0] for key in record.parents]

4377

self.target_repo.add_inventory(revision_id, inv, parents)

4378

# No need to keep holding this full inv in memory when the rest of

4379

# the substream is likely to be all deltas.

4380

del inv

4381

4382

def _extract_and_insert_revisions(self, substream, serializer):

4383

for record in substream:

4384

bytes = record.get_bytes_as('fulltext')

4385

revision_id = record.key[0]

4386

rev = serializer.read_revision_from_string(bytes)

4387

if rev.revision_id != revision_id:

4388

raise AssertionError('wtf: %s != %s' % (rev, revision_id))

4389

self.target_repo.add_revision(revision_id, rev)

4390

4391

def finished(self):

4392

if self.target_repo._format._fetch_reconcile:

4393

self.target_repo.reconcile()

4394

4395

4396

class StreamSource(object):

4397

"""A source of a stream for fetching between repositories."""

4398

4399

def __init__(self, from_repository, to_format):
    """Remember the repository to stream from and the format to stream to.

    :param from_repository: The repository the stream is read from.
    :param to_format: The format the stream is destined for.
    """
    self.to_format = to_format
    self.from_repository = from_repository

4403

4404

def delta_on_metadata(self):
    """Return True if delta's are permitted on metadata streams.

    That is on revisions and signatures.  Deltas are permitted only when
    the destination format fetches with deltas and both ends use the same
    serializer.
    """
    source_serializer = self.from_repository._format._serializer
    wanted_format = self.to_format
    sink_serializer = wanted_format._serializer
    deltas_allowed = wanted_format._fetch_uses_deltas
    if not deltas_allowed:
        return deltas_allowed
    return source_serializer == sink_serializer

4413

4414

def _fetch_revision_texts(self, revs):

4415

# fetch signatures first and then the revision texts

4416

# may need to be a InterRevisionStore call here.

4417

from_sf = self.from_repository.signatures

4418

# A missing signature is just skipped.

4419

keys = [(rev_id,) for rev_id in revs]

4420

signatures = versionedfile.filter_absent(from_sf.get_record_stream(

4421

keys,

4422

self.to_format._fetch_order,

4423

not self.to_format._fetch_uses_deltas))

4424

# If a revision has a delta, this is actually expanded inside the

4425

# insert_record_stream code now, which is an alternate fix for

4426

# bug #261339

4427

from_rf = self.from_repository.revisions

4428

revisions = from_rf.get_record_stream(

4429

keys,

4430

self.to_format._fetch_order,

4431

not self.delta_on_metadata())

4432

return [('signatures', signatures), ('revisions', revisions)]

4433

4434

def _generate_root_texts(self, revs):

4435

"""This will be called by get_stream between fetching weave texts and

4436

fetching the inventory weave.

4437

"""

4438

if self._rich_root_upgrade():

4439

import bzrlib.fetch

4440

return bzrlib.fetch.Inter1and2Helper(

4441

self.from_repository).generate_root_texts(revs)

4442

else:

4443

return []

4444

4445

def get_stream(self, search):

4446

phase = 'file'

4447

revs = search.get_keys()

4448

graph = self.from_repository.get_graph()

4449

revs = tsort.topo_sort(graph.get_parent_map(revs))

4450

data_to_fetch = self.from_repository.item_keys_introduced_by(revs)

4451

text_keys = []

4452

for knit_kind, file_id, revisions in data_to_fetch:

4453

if knit_kind != phase:

4454

phase = knit_kind

4455

# Make a new progress bar for this phase

4456

if knit_kind == "file":

4457

# Accumulate file texts

4458

text_keys.extend([(file_id, revision) for revision in

4459

revisions])

4460

elif knit_kind == "inventory":

4461

# Now copy the file texts.

4462

from_texts = self.from_repository.texts

4463

yield ('texts', from_texts.get_record_stream(

4464

text_keys, self.to_format._fetch_order,

4465

not self.to_format._fetch_uses_deltas))

4466

# Cause an error if a text occurs after we have done the

4467

# copy.

4468

text_keys = None

4469

# Before we process the inventory we generate the root

4470

# texts (if necessary) so that the inventories references

4471

# will be valid.

4472

for _ in self._generate_root_texts(revs):

4473

yield _

4474

# we fetch only the referenced inventories because we do not

4475

# know for unselected inventories whether all their required

4476

# texts are present in the other repository - it could be

4477

# corrupt.

4478

for info in self._get_inventory_stream(revs):

4479

yield info

4480

elif knit_kind == "signatures":

4481

# Nothing to do here; this will be taken care of when

4482

# _fetch_revision_texts happens.

4483

pass

4484

elif knit_kind == "revisions":

4485

for record in self._fetch_revision_texts(revs):

4486

yield record

4487

else:

4488

raise AssertionError("Unknown knit kind %r" % knit_kind)

4489

4490

def get_stream_for_missing_keys(self, missing_keys):

4491

# missing keys can only occur when we are byte copying and not

4492

# translating (because translation means we don't send

4493

# unreconstructable deltas ever).

4494

keys = {}

4495

keys['texts'] = set()

4496

keys['revisions'] = set()

4497

keys['inventories'] = set()

4498

keys['chk_bytes'] = set()

4499

keys['signatures'] = set()

4500

for key in missing_keys:

4501

keys[key[0]].add(key[1:])

4502

if len(keys['revisions']):

4503

# If we allowed copying revisions at this point, we could end up

4504

# copying a revision without copying its required texts: a

4505

# violation of the requirements for repository integrity.

4506

raise AssertionError(

4507

'cannot copy revisions to fill in missing deltas %s' % (

4508

keys['revisions'],))

4509

for substream_kind, keys in keys.iteritems():

4510

vf = getattr(self.from_repository, substream_kind)

4511

if vf is None and keys:

4512

raise AssertionError(

4513

"cannot fill in keys for a versioned file we don't"

4514

" have: %s needs %s" % (substream_kind, keys))

4515

if not keys:

4516

# No need to stream something we don't have

4517

continue

4518

if substream_kind == 'inventories':

4519

# Some missing keys are genuinely ghosts, filter those out.

4520

present = self.from_repository.inventories.get_parent_map(keys)

4521

revs = [key[0] for key in present]

4522

# Get the inventory stream more-or-less as we do for the

4523

# original stream; there's no reason to assume that records

4524

# direct from the source will be suitable for the sink. (Think

4525

# e.g. 2a -> 1.9-rich-root).

4526

for info in self._get_inventory_stream(revs, missing=True):

4527

yield info

4528

continue

4529

4530

# Ask for full texts always so that we don't need more round trips

4531

# after this stream.

4532

# Some of the missing keys are genuinely ghosts, so filter absent

4533

# records. The Sink is responsible for doing another check to

4534

# ensure that ghosts don't introduce missing data for future

4535

# fetches.

4536

stream = versionedfile.filter_absent(vf.get_record_stream(keys,

4537

self.to_format._fetch_order, True))

4538

yield substream_kind, stream

4539

4540

def inventory_fetch_order(self):

4541

if self._rich_root_upgrade():

4542

return 'topological'

4543

else:

4544

return self.to_format._fetch_order

4545

4546

def _rich_root_upgrade(self):

4547

return (not self.from_repository._format.rich_root_data and

4548

self.to_format.rich_root_data)

4549

4550

def _get_inventory_stream(self, revision_ids, missing=False):

4551

from_format = self.from_repository._format

4552

if (from_format.supports_chks and self.to_format.supports_chks and

4553

from_format.network_name() == self.to_format.network_name()):

4554

raise AssertionError(

4555

"this case should be handled by GroupCHKStreamSource")

4556

elif 'forceinvdeltas' in debug.debug_flags:

4557

return self._get_convertable_inventory_stream(revision_ids,

4558

delta_versus_null=missing)

4559

elif from_format.network_name() == self.to_format.network_name():

4560

# Same format.

4561

return self._get_simple_inventory_stream(revision_ids,

4562

missing=missing)

4563

elif (not from_format.supports_chks and not self.to_format.supports_chks

4564

and from_format._serializer == self.to_format._serializer):

4565

# Essentially the same format.

4566

return self._get_simple_inventory_stream(revision_ids,

4567

missing=missing)

4568

else:

4569

# Any time we switch serializations, we want to use an

4570

# inventory-delta based approach.

4571

return self._get_convertable_inventory_stream(revision_ids,

4572

delta_versus_null=missing)

4573

4574

def _get_simple_inventory_stream(self, revision_ids, missing=False):

4575

# NB: This currently reopens the inventory weave in source;

4576

# using a single stream interface instead would avoid this.

4577

from_weave = self.from_repository.inventories

4578

if missing:

4579

delta_closure = True

4580

else:

4581

delta_closure = not self.delta_on_metadata()

4582

yield ('inventories', from_weave.get_record_stream(

4583

[(rev_id,) for rev_id in revision_ids],

4584

self.inventory_fetch_order(), delta_closure))

4585

4586

def _get_convertable_inventory_stream(self, revision_ids,

4587

delta_versus_null=False):

4588

# The source is using CHKs, but the target either doesn't or it has a

4589

# different serializer. The StreamSink code expects to be able to

4590

# convert on the target, so we need to put bytes-on-the-wire that can

4591

# be converted. That means inventory deltas (if the remote is <1.19,

4592

# RemoteStreamSink will fallback to VFS to insert the deltas).

4593

yield ('inventory-deltas',

4594

self._stream_invs_as_deltas(revision_ids,

4595

delta_versus_null=delta_versus_null))

4596

4597

def _stream_invs_as_deltas(self, revision_ids, delta_versus_null=False):

4598

"""Return a stream of inventory-deltas for the given rev ids.

4599

4600

:param revision_ids: The list of inventories to transmit

4601

:param delta_versus_null: Don't try to find a minimal delta for this

4602

entry, instead compute the delta versus the NULL_REVISION. This

4603

effectively streams a complete inventory. Used for stuff like

4604

filling in missing parents, etc.

4605

"""

4606

from_repo = self.from_repository

4607

revision_keys = [(rev_id,) for rev_id in revision_ids]

4608

parent_map = from_repo.inventories.get_parent_map(revision_keys)

4609

# XXX: possibly repos could implement a more efficient iter_inv_deltas

4610

# method...

4611

inventories = self.from_repository.iter_inventories(

4612

revision_ids, 'topological')

4613

format = from_repo._format

4614

invs_sent_so_far = set([_mod_revision.NULL_REVISION])

4615

inventory_cache = lru_cache.LRUCache(50)

4616

null_inventory = from_repo.revision_tree(

4617

_mod_revision.NULL_REVISION).inventory

4618

# XXX: ideally the rich-root/tree-refs flags would be per-revision, not

4619

# per-repo (e.g. streaming a non-rich-root revision out of a rich-root

4620

# repo back into a non-rich-root repo ought to be allowed)

4621

serializer = inventory_delta.InventoryDeltaSerializer(

4622

versioned_root=format.rich_root_data,

4623

tree_references=format.supports_tree_reference)

4624

for inv in inventories:

4625

key = (inv.revision_id,)

4626

parent_keys = parent_map.get(key, ())

4627

delta = None

4628

if not delta_versus_null and parent_keys:

4629

# The caller did not ask for complete inventories and we have

4630

# some parents that we can delta against. Make a delta against

4631

# each parent so that we can find the smallest.

4632

parent_ids = [parent_key[0] for parent_key in parent_keys]

4633

for parent_id in parent_ids:

4634

if parent_id not in invs_sent_so_far:

4635

# We don't know that the remote side has this basis, so

4636

# we can't use it.

4637

continue

4638

if parent_id == _mod_revision.NULL_REVISION:

4639

parent_inv = null_inventory

4640

else:

4641

parent_inv = inventory_cache.get(parent_id, None)

4642

if parent_inv is None:

4643

parent_inv = from_repo.get_inventory(parent_id)

4644

candidate_delta = inv._make_delta(parent_inv)

4645

if (delta is None or

4646

len(delta) > len(candidate_delta)):

4647

delta = candidate_delta

4648

basis_id = parent_id

4649

if delta is None:

4650

# Either none of the parents ended up being suitable, or we

4651

# were asked to delta against NULL

4652

basis_id = _mod_revision.NULL_REVISION

4653

delta = inv._make_delta(null_inventory)

4654

invs_sent_so_far.add(inv.revision_id)

4655

inventory_cache[inv.revision_id] = inv

4656

delta_serialized = ''.join(

4657

serializer.delta_to_lines(basis_id, key[-1], delta))

4658

yield versionedfile.FulltextContentFactory(

4659

key, parent_keys, None, delta_serialized)

4660

4661

4662

def _iter_for_revno(repo, partial_history_cache, stop_index=None,

4663

stop_revision=None):

4664

"""Extend the partial history to include a given index

4665

4666

If a stop_index is supplied, stop when that index has been reached.

4667

If a stop_revision is supplied, stop when that revision is

4668

encountered. Otherwise, stop when the beginning of history is

4669

reached.

4670

4671

:param stop_index: The index which should be present. When it is

4672

present, history extension will stop.

4673

:param stop_revision: The revision id which should be present. When

4674

it is encountered, history extension will stop.

4675

"""

4676

start_revision = partial_history_cache[-1]

4677

iterator = repo.iter_reverse_revision_history(start_revision)

4678

try:

4679

#skip the last revision in the list

4680

iterator.next()

4681

while True:

4682

if (stop_index is not None and

4683

len(partial_history_cache) > stop_index):

4684

break

4685

if partial_history_cache[-1] == stop_revision:

4686

break

4687

revision_id = iterator.next()

4688

partial_history_cache.append(revision_id)

4689

except StopIteration:

4690

# No more history

4691

return

4692

Older »