~bzr-pqm/bzr/bzr.dev

Committer: v.ladeuil+lp at free
Date: 2007-05-15 17:40:32 UTC
mto: (2485.8.44 bzr.connection.sharing)
mto: This revision was merged to the branch mainline in revision 2646.
Revision ID: v.ladeuil+lp@free.fr-20070515174032-qzdkangpv29l9e7g

Add a test that checks that init connects only once. It fails.

* __init__.py:
(test_suite): Register the new test class.

* test_init.py:
(InstrumentedTransport): A transport that can track connections.
(TransportHooks): Transport specific hooks.
(TestInit): Init command behavior tests.

* ftp.py:
(FtpTransport.__init__): Mark places that need fixing regarding
transport connection sharing.

* builtins.py:
(cmd_init.run): Mark places that need fixing regarding transport
connection sharing.

files added:
bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/graph.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_graph.py

bzrlib/textui.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/weave_commands.py

bzrlib/xml6.py

contrib/add-bzr-to-baz

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/zsh/_bzr

doc/README.1st

doc/bazaar-vcs.org.kid

doc/index.txt

tools/biobench.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/trace-revisions

tools/weavebench.py

files removed:
.testr.conf

MANIFEST.in

NEWS

README_BDIST_RPM

apport

apport/README

apport/bzr-crashdb.conf

apport/source_bzr.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/api.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/btree_index.py

bzrlib/bundle/serializer/v4.py

bzrlib/cethread.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cleanup.py

bzrlib/cmd_test_script.py

bzrlib/cmdline.py

bzrlib/controldir.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/doc_generate/builders

bzrlib/doc_generate/builders/__init__.py

bzrlib/doc_generate/builders/texinfo.py

bzrlib/doc_generate/conf.py

bzrlib/doc_generate/writers

bzrlib/doc_generate/writers/__init__.py

bzrlib/doc_generate/writers/texinfo.py

bzrlib/email_message.py

bzrlib/export_pot.py

bzrlib/fifo_cache.py

bzrlib/filter_tree.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/conflict-types.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/location-alias.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/help_topics/en/url-special-chars.txt

bzrlib/help_topics/es

bzrlib/help_topics/es/conflict-types.txt

bzrlib/i18n.py

bzrlib/index.py

bzrlib/inventory_delta.py

bzrlib/library_state.py

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/mergetools.py

bzrlib/multiparent.py

bzrlib/pack.py

bzrlib/patiencediff.py

bzrlib/plugins/bash_completion

bzrlib/plugins/bash_completion/README.txt

bzrlib/plugins/bash_completion/__init__.py

bzrlib/plugins/bash_completion/bashcomp.py

bzrlib/plugins/bash_completion/tests

bzrlib/plugins/bash_completion/tests/__init__.py

bzrlib/plugins/bash_completion/tests/test_bashcomp.py

bzrlib/plugins/changelog_merge

bzrlib/plugins/changelog_merge/__init__.py

bzrlib/plugins/changelog_merge/changelog_merge.py

bzrlib/plugins/changelog_merge/tests

bzrlib/plugins/changelog_merge/tests/__init__.py

bzrlib/plugins/changelog_merge/tests/test_changelog_merge.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_api_lite.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/launchpad/test_lp_api_lite.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/plugins/news_merge

bzrlib/plugins/news_merge/README

bzrlib/plugins/news_merge/__init__.py

bzrlib/plugins/news_merge/news_merge.py

bzrlib/plugins/news_merge/parser.py

bzrlib/plugins/news_merge/tests

bzrlib/plugins/news_merge/tests/__init__.py

bzrlib/plugins/news_merge/tests/test_news_merge.py

bzrlib/plugins/weave_fmt

bzrlib/plugins/weave_fmt/__init__.py

bzrlib/plugins/weave_fmt/branch.py

bzrlib/plugins/weave_fmt/bzrdir.py

bzrlib/plugins/weave_fmt/test_bzrdir.py

bzrlib/plugins/weave_fmt/test_repository.py

bzrlib/plugins/weave_fmt/test_workingtree.py

bzrlib/plugins/weave_fmt/tests

bzrlib/plugins/weave_fmt/workingtree.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/pyutils.py

bzrlib/readdir.h

bzrlib/reconfigure.py

bzrlib/recordcounter.py

bzrlib/rename_map.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitpack_repo.py

bzrlib/repofmt/pack_repo.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smtp_connection.py

bzrlib/static_tuple.py

bzrlib/switch.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_config.py

bzrlib/tests/blackbox/test_deleted.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_lookup_revision.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remember_option.py

bzrlib/tests/blackbox/test_repair_workingtree.py

bzrlib/tests/blackbox/test_resolve.py

bzrlib/tests/blackbox/test_rmbranch.py

bzrlib/tests/blackbox/test_script.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_revert.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/doc_generate

bzrlib/tests/doc_generate/__init__.py

bzrlib/tests/doc_generate/builders

bzrlib/tests/doc_generate/builders/__init__.py

bzrlib/tests/doc_generate/builders/test_texinfo.py

bzrlib/tests/doc_generate/writers

bzrlib/tests/doc_generate/writers/__init__.py

bzrlib/tests/doc_generate/writers/test_texinfo.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/fixtures.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/https_server.py

bzrlib/tests/matchers.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_config.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_controldir/test_format.py

bzrlib/tests/per_controldir/test_push.py

bzrlib/tests/per_controldir_colo

bzrlib/tests/per_controldir_colo/__init__.py

bzrlib/tests/per_controldir_colo/test_supported.py

bzrlib/tests/per_controldir_colo/test_unsupported.py

bzrlib/tests/per_foreign_vcs

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_foreign_vcs/test_repository.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_copy_content_into.py

bzrlib/tests/per_interbranch/test_fetch.py

bzrlib/tests/per_interbranch/test_get.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_intertree/test_file_content_matches.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_file_graph.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_locking.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test__make_parents_provider.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_commit_with_stacking.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_graph.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_repository_vf

bzrlib/tests/per_repository_vf/__init__.py

bzrlib/tests/per_repository_vf/helpers.py

bzrlib/tests/per_repository_vf/test__generate_text_key_index.py

bzrlib/tests/per_repository_vf/test_add_inventory_by_delta.py

bzrlib/tests/per_repository_vf/test_check.py

bzrlib/tests/per_repository_vf/test_check_reconcile.py

bzrlib/tests/per_repository_vf/test_fetch.py

bzrlib/tests/per_repository_vf/test_find_text_key_references.py

bzrlib/tests/per_repository_vf/test_reconcile.py

bzrlib/tests/per_repository_vf/test_refresh_data.py

bzrlib/tests/per_repository_vf/test_repository.py

bzrlib/tests/per_repository_vf/test_write_group.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_export.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_is_executable.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_locking.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_check_state.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_symlinks.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/scenarios.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/test__annotator.py

bzrlib/tests/test__bencode.py

bzrlib/tests/test__btree_serializer.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_cethread.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_cleanup.py

bzrlib/tests/test_cmdline.py

bzrlib/tests/test_controldir.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_export.py

bzrlib/tests/test_export_pot.py

bzrlib/tests/test_features.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filter_tree.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_fixtures.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_i18n.py

bzrlib/tests/test_import_tariff.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_library_state.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_matchers.py

bzrlib/tests/test_mergetools.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patches_data/binary-after-normal.patch

bzrlib/tests/test_patches_data/binary.patch

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_pyutils.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_scenarios.py

bzrlib/tests/test_script.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_server.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_test_server.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_treeshape.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_utextwrap.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/testui.py

bzrlib/tests/transport_util.py

bzrlib/transport/brokenrename.py

bzrlib/transport/ftp

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/gio_transport.py

bzrlib/transport/log.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/utextwrap.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/vf_repository.py

bzrlib/views.py

bzrlib/workingtree_3.py

bzrlib/xml5.py

bzrlib/xml6.py

contrib/bash/bzr

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/debian

contrib/debian/default

contrib/debian/init.d

contrib/zsh/README

doc/Bazaar-Logo-For-Manuals.png

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr-doc.css

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/code-review.txt

doc/developers/code-style.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/conf.py

doc/developers/configuration.txt

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/contribution-quickstart.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/documenting-changes.txt

doc/developers/ec2.txt

doc/developers/fetch.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/index-plain.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/miscellaneous-notes.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/principles.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/transports.txt

doc/developers/ui.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/developers/win32_build_setup.txt

doc/developers/xdg_config_spec.txt

doc/en

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/advanced.txt

doc/en/admin-guide/backup.txt

doc/en/admin-guide/code-browsing.txt

doc/en/admin-guide/hooks-plugins.txt

doc/en/admin-guide/index-plain.txt

doc/en/admin-guide/index.txt

doc/en/admin-guide/integration.txt

doc/en/admin-guide/introduction.txt

doc/en/admin-guide/licence.txt

doc/en/admin-guide/migration.txt

doc/en/admin-guide/other-setups.txt

doc/en/admin-guide/security.txt

doc/en/admin-guide/simple-setups.txt

doc/en/admin-guide/upgrade.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/release-notes/bzr-0.1.txt

doc/en/release-notes/bzr-0.10.txt

doc/en/release-notes/bzr-0.11.txt

doc/en/release-notes/bzr-0.12.txt

doc/en/release-notes/bzr-0.13.txt

doc/en/release-notes/bzr-0.14.txt

doc/en/release-notes/bzr-0.15.txt

doc/en/release-notes/bzr-0.16.txt

doc/en/release-notes/bzr-0.17.txt

doc/en/release-notes/bzr-0.18.txt

doc/en/release-notes/bzr-0.6.txt

doc/en/release-notes/bzr-0.7.txt

doc/en/release-notes/bzr-0.8.txt

doc/en/release-notes/bzr-0.9.txt

doc/en/release-notes/bzr-0.90.txt

doc/en/release-notes/bzr-0.91.txt

doc/en/release-notes/bzr-0.92.txt

doc/en/release-notes/bzr-1.0.txt

doc/en/release-notes/bzr-1.1.txt

doc/en/release-notes/bzr-1.10.txt

doc/en/release-notes/bzr-1.11.txt

doc/en/release-notes/bzr-1.12.txt

doc/en/release-notes/bzr-1.13.txt

doc/en/release-notes/bzr-1.14.txt

doc/en/release-notes/bzr-1.15.txt

doc/en/release-notes/bzr-1.16.txt

doc/en/release-notes/bzr-1.17.txt

doc/en/release-notes/bzr-1.18.txt

doc/en/release-notes/bzr-1.2.txt

doc/en/release-notes/bzr-1.3.txt

doc/en/release-notes/bzr-1.4.txt

doc/en/release-notes/bzr-1.5.txt

doc/en/release-notes/bzr-1.6.txt

doc/en/release-notes/bzr-1.7.txt

doc/en/release-notes/bzr-1.8.txt

doc/en/release-notes/bzr-1.9.txt

doc/en/release-notes/bzr-2.0.txt

doc/en/release-notes/bzr-2.1.txt

doc/en/release-notes/bzr-2.2.txt

doc/en/release-notes/bzr-2.4.txt

doc/en/release-notes/bzr-2.5.txt

doc/en/release-notes/release-template.txt

doc/en/release-notes/series-template.txt

doc/en/tutorials

doc/en/tutorials/index.txt

doc/en/tutorials/licence.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/licence.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/gpg_signatures.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/licence.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/en/whats-new

doc/en/whats-new/template.txt

doc/en/whats-new/whats-new-in-2.1.txt

doc/en/whats-new/whats-new-in-2.2.txt

doc/en/whats-new/whats-new-in-2.3.txt

doc/en/whats-new/whats-new-in-2.4.txt

doc/en/whats-new/whats-new-in-2.5.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ja.txt

doc/index.ru.txt

doc/index.txt

doc/ja

doc/ja/_static

doc/ja/_static/bzr icon 16.png

doc/ja/_static/bzr.ico

doc/ja/_templates

doc/ja/conf.py

doc/ja/index.txt

doc/ja/mini-tutorial

doc/ja/mini-tutorial/index.txt

doc/ja/tutorials

doc/ja/tutorials/centralized_workflow.txt

doc/ja/tutorials/index.txt

doc/ja/tutorials/licence.txt

doc/ja/tutorials/tutorial.txt

doc/ja/tutorials/using_bazaar_with_launchpad.txt

doc/ja/upgrade-guide

doc/ja/upgrade-guide/data_migration.txt

doc/ja/upgrade-guide/index.txt

doc/ja/upgrade-guide/overview.txt

doc/ja/upgrade-guide/tips_and_tricks.txt

doc/ja/user-guide

doc/ja/user-guide/adv_merging.txt

doc/ja/user-guide/annotating_changes.txt

doc/ja/user-guide/bazaar_workflows.txt

doc/ja/user-guide/branching_a_project.txt

doc/ja/user-guide/browsing_history.txt

doc/ja/user-guide/bug_trackers.txt

doc/ja/user-guide/bzrtools_plugin.txt

doc/ja/user-guide/central_intro.txt

doc/ja/user-guide/configuring_bazaar.txt

doc/ja/user-guide/controlling_registration.txt

doc/ja/user-guide/core_concepts.txt

doc/ja/user-guide/distributed_intro.txt

doc/ja/user-guide/entering_commands.txt

doc/ja/user-guide/filtered_views.txt

doc/ja/user-guide/getting_help.txt

doc/ja/user-guide/hooks.txt

doc/ja/user-guide/http_smart_server.txt

doc/ja/user-guide/images

doc/ja/user-guide/images/workflows_centralized.png

doc/ja/user-guide/images/workflows_centralized.svg

doc/ja/user-guide/images/workflows_gatekeeper.png

doc/ja/user-guide/images/workflows_gatekeeper.svg

doc/ja/user-guide/images/workflows_localcommit.png

doc/ja/user-guide/images/workflows_localcommit.svg

doc/ja/user-guide/images/workflows_peer.png

doc/ja/user-guide/images/workflows_peer.svg

doc/ja/user-guide/images/workflows_pqm.png

doc/ja/user-guide/images/workflows_pqm.svg

doc/ja/user-guide/images/workflows_shared.png

doc/ja/user-guide/images/workflows_shared.svg

doc/ja/user-guide/images/workflows_single.png

doc/ja/user-guide/images/workflows_single.svg

doc/ja/user-guide/index-plain.txt

doc/ja/user-guide/index.txt

doc/ja/user-guide/installing_bazaar.txt

doc/ja/user-guide/introducing_bazaar.txt

doc/ja/user-guide/licence.txt

doc/ja/user-guide/merging_changes.txt

doc/ja/user-guide/organizing_branches.txt

doc/ja/user-guide/organizing_your_workspace.txt

doc/ja/user-guide/part2_intro.txt

doc/ja/user-guide/partner_intro.txt

doc/ja/user-guide/plugins.txt

doc/ja/user-guide/publishing_a_branch.txt

doc/ja/user-guide/recording_changes.txt

doc/ja/user-guide/releasing_a_project.txt

doc/ja/user-guide/resolving_conflicts.txt

doc/ja/user-guide/reusing_a_checkout.txt

doc/ja/user-guide/reviewing_changes.txt

doc/ja/user-guide/sending_changes.txt

doc/ja/user-guide/server.txt

doc/ja/user-guide/setting_up_email.txt

doc/ja/user-guide/shared_repository_layouts.txt

doc/ja/user-guide/shelving_changes.txt

doc/ja/user-guide/solo_intro.txt

doc/ja/user-guide/specifying_revisions.txt

doc/ja/user-guide/stacked.txt

doc/ja/user-guide/starting_a_project.txt

doc/ja/user-guide/svn_plugin.txt

doc/ja/user-guide/undoing_mistakes.txt

doc/ja/user-guide/using_aliases.txt

doc/ja/user-guide/using_checkouts.txt

doc/ja/user-guide/using_gatekeepers.txt

doc/ja/user-guide/version_info.txt

doc/ja/user-guide/web_browsing.txt

doc/ja/user-guide/working_offline_central.txt

doc/ja/user-guide/writing_a_plugin.txt

doc/ja/user-guide/zen.txt

doc/ja/user-reference

doc/ja/user-reference/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

tools/build_mo.py

tools/check-newsbugs.py

tools/fixed-in.py

tools/generate_release_notes.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-control.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/rst2pdf.py

tools/subunit-sum

tools/time_graph.py

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/py2exe_boot_common.py

tools/win32/run_script.py

files renamed:
doc/en/release-notes/bzr-2.3.txt => NEWS

bzrlib/help_topics/__init__.py => bzrlib/help_topics.py

bzrlib/_patiencediff_py.py => bzrlib/patiencediff.py

bzrlib/plugins/launchpad/lp_directory.py => bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/test_lp_directory.py => bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/plugins/weave_fmt/repository.py => bzrlib/repofmt/weaverepo.py

bzrlib/commit_signature_commands.py => bzrlib/sign_my_commits.py

bzrlib/tests/http_utils.py => bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/http_server.py => bzrlib/tests/HttpServer.py

bzrlib/tests/blackbox/test_send.py => bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/per_branch/ => bzrlib/tests/branch_implementations/

bzrlib/tests/per_controldir/ => bzrlib/tests/bzrdir_implementations/

bzrlib/tests/per_controldir/test_controldir.py => bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/per_interrepository/ => bzrlib/tests/interrepository_implementations/

bzrlib/tests/per_intertree/ => bzrlib/tests/intertree_implementations/

bzrlib/tests/per_repository/ => bzrlib/tests/repository_implementations/

bzrlib/tests/commands/test_init.py => bzrlib/tests/test_init.py

bzrlib/tests/test_revisionspec.py => bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/per_transport.py => bzrlib/tests/test_transport_implementations.py

bzrlib/tests/per_versionedfile.py => bzrlib/tests/test_versionedfile.py

bzrlib/tests/per_tree/ => bzrlib/tests/tree_implementations/

bzrlib/tests/per_workingtree/ => bzrlib/tests/workingtree_implementations/

bzrlib/transport/ftp/__init__.py => bzrlib/transport/ftp.py

bzrlib/util/_bencode_py.py => bzrlib/util/bencode.py

bzrlib/plugins/weave_fmt/xml4.py => bzrlib/xml4.py

bzrlib/xml8.py => bzrlib/xml5.py

doc/en/tutorials/centralized_workflow.txt => doc/centralized_workflow.txt

bzrlib/help_topics/en/configuration.txt => doc/configuration.txt

doc/developers/HACKING.txt => doc/developers/HACKING

doc/en/user-guide/http_smart_server.txt => doc/http_smart_server.txt

doc/en/user-guide/plugins.txt => doc/plugins.txt

doc/en/user-guide/server.txt => doc/server.txt

doc/en/user-guide/setting_up_email.txt => doc/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt => doc/shared_repository_layouts.txt

doc/en/user-guide/specifying_revisions.txt => doc/specifying_revisions.txt

doc/en/tutorials/tutorial.txt => doc/tutorial.txt

doc/en/user-guide/using_aliases.txt => doc/using_aliases.txt

doc/en/user-guide/version_info.txt => doc/version_info.txt

tools/generate_docs.py => generate_docs.py

bzrlib/doc_generate/ => tools/doc_generate/

files modified:
.bzrignore

INSTALL

Makefile

README

bzr.ico

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml7.py

bzrlib/xml_serializer.py

doc/default.css

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

profile_imports.py

setup.py

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

Show diffs side-by-side

added added

removed removed

bzrlib/chk_map.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Persistent maps from tuple_of_strings->string using CHK stores.

Overview and current status:

The CHKMap class implements a dict from tuple_of_strings->string by using a trie

with internal nodes of 8-bit fan out; The key tuples are mapped to strings by

joining them by \x00, and \x00 padding shorter keys out to the length of the

longest key. Leaf nodes are packed as densely as possible, and internal nodes

are all an additional 8-bits wide leading to a sparse upper tree.

Updates to a CHKMap are done preferentially via the apply_delta method, to

allow optimisation of the update operation; but individual map/unmap calls are

possible and supported. Individual changes via map/unmap are buffered in memory

until the _save method is called to force serialisation of the tree.

apply_delta records its changes immediately by performing an implicit _save.

TODO:

-----

Densely packed upper nodes.

"""

import heapq

import threading

from bzrlib import lazy_import

lazy_import.lazy_import(globals(), """

from bzrlib import (

errors,

)

""")

from bzrlib import (

errors,

lru_cache,

osutils,

registry,

static_tuple,

trace,

)

from bzrlib.static_tuple import StaticTuple

# Size budget handed to each thread's page cache: approx 4MB.
# Sizing rationale: if each line is 50 bytes, and you have 255 internal pages,
# with 255-way fan out, it takes 3.1MB to cache the layer.
_PAGE_CACHE_SIZE = 4*1024*1024

# Per thread caches for 2 reasons:
# - in the server we may be serving very different content, so we get less
#   cache thrashing.
# - we avoid locking on every cache lookup.
_thread_caches = threading.local()

# The page cache. Being an attribute of a threading.local, this assignment
# only initialises the slot for the thread that runs it; _get_cache() copes
# with threads where the attribute is missing and builds the cache lazily.
_thread_caches.page_cache = None

def _get_cache():
    """Get the per-thread page cache.

    We need a function to do this because in a new thread the _thread_caches
    threading.local object does not have the cache initialized yet.

    :return: The calling thread's page cache. When the thread has none yet
        (attribute missing or None), an lru_cache.LRUSizeCache limited to
        _PAGE_CACHE_SIZE is created, remembered on _thread_caches and
        returned.
    """
    page_cache = getattr(_thread_caches, 'page_cache', None)
    if page_cache is None:
        # We are caching bytes so len(value) is perfectly accurate
        page_cache = lru_cache.LRUSizeCache(_PAGE_CACHE_SIZE)
        _thread_caches.page_cache = page_cache
    return page_cache

def clear_cache():
    """Empty the calling thread's page cache.

    Only the cache returned by _get_cache() for the current thread is
    cleared; a cache is created first if this thread did not have one.
    """
    _get_cache().clear()

# Thresholds used to decide whether a node that got smaller deserves a remap
# check.

# If a ChildNode falls below this many bytes, we check for a remap
_INTERESTING_NEW_SIZE = 50

# If a ChildNode shrinks by more than this amount, we check for a remap
# (presumably also counted in bytes -- TODO confirm where it is used).
_INTERESTING_SHRINKAGE_LIMIT = 20

def _search_key_plain(key):
    """Map the key tuple into a search string that just uses the key bytes.

    :param key: A tuple (any iterable works) of strings.
    :return: The elements of key joined by a single NUL character; an empty
        key gives the empty string.
    """
    return '\x00'.join(key)

100

# Registry of the available search key functions, looked up by name.
search_key_registry = registry.Registry()
# 'plain' uses the key elements as they are, joined by NUL characters.
search_key_registry.register('plain', _search_key_plain)

102

103

104

class CHKMap(object):

105

"""A persistent map from string to string backed by a CHK store."""

106

107

__slots__ = ('_store', '_root_node', '_search_key_func')

108

109

def __init__(self, store, root_key, search_key_func=None):
    """Create a CHKMap object.

    :param store: The store the CHKMap is stored in.
    :param root_key: The root key of the map. None to create an empty
        CHKMap.
    :param search_key_func: A function mapping a key => bytes. These bytes
        are then used by the internal nodes to split up leaf nodes into
        multiple pages. When None, _search_key_plain is used.
    """
    self._store = store
    if search_key_func is None:
        search_key_func = _search_key_plain
    self._search_key_func = search_key_func
    if root_key is None:
        # Nothing stored yet: start from an empty in-memory leaf.
        self._root_node = LeafNode(search_key_func=search_key_func)
    else:
        # Keep what _node_key() makes of root_key rather than reading the
        # node now; _ensure_root() demand-loads it when the stored value is
        # a StaticTuple key.
        self._root_node = self._node_key(root_key)

127

128

def apply_delta(self, delta):
    """Apply a delta to the map.

    :param delta: An iterable of old_key, new_key, new_value tuples.
        If new_key is not None, then new_key->new_value is inserted
        into the map; if old_key is not None, then the old mapping
        of old_key is removed (an entry whose old_key equals its new_key
        is not unmapped first, it is just mapped again).
    :return: The result of self._save() once every change is applied.
    :raises errors.InconsistentDeltaDelta: If a key the delta adds (its
        old_key is None) is already present in the map.
    """
    # The delta is walked three times below. Materialise it so that a
    # one-shot iterator is not exhausted by the precondition check, which
    # would otherwise make both apply loops silently do nothing.
    delta = list(delta)
    has_deletes = False
    # Check preconditions first.
    as_st = StaticTuple.from_sequence
    new_items = set([as_st(key) for (old, key, value) in delta
                     if key is not None and old is None])
    existing_new = list(self.iteritems(key_filter=new_items))
    if existing_new:
        raise errors.InconsistentDeltaDelta(delta,
            "New items are already in the map %r." % existing_new)
    # Now apply changes.
    # All removals go first, with the per-call remap check switched off; a
    # single _check_remap() is run after the additions instead.
    for old, new, value in delta:
        if old is not None and old != new:
            self.unmap(old, check_remap=False)
            has_deletes = True
    for old, new, value in delta:
        if new is not None:
            self.map(new, value)
    if has_deletes:
        self._check_remap()
    return self._save()

156

157

def _ensure_root(self):
    """Ensure that the root node is an object not a key.

    When self._root_node is still a StaticTuple key, it is replaced in
    place by the node object that _get_node() returns for it; otherwise
    nothing happens.
    """
    if type(self._root_node) is StaticTuple:
        # Demand-load the root
        self._root_node = self._get_node(self._root_node)

162

163

def _get_node(self, node):
    """Get a node.

    Note that this does not update the _items dict in objects containing a
    reference to this node. As such it does not prevent subsequent IO being
    performed.

    :param node: A tuple key or node object.
    :return: A node object.
    """
    if type(node) is not StaticTuple:
        # Already a node object, hand it straight back.
        return node
    # node is a key: read its serialised form and rebuild the node from it.
    node_bytes = self._read_bytes(node)
    return _deserialise(node_bytes, node,
        search_key_func=self._search_key_func)

179

180

def _read_bytes(self, key):
    """Return the serialised bytes recorded under key.

    The calling thread's page cache is tried first. On a miss the record
    is requested from self._store as a fulltext, stored in the cache and
    returned.

    :param key: The key of the record to read.
    :return: The fulltext of the record.
    """
    page_cache = _get_cache()
    try:
        return page_cache[key]
    except KeyError:
        stream = self._store.get_record_stream([key], 'unordered', True)
        node_bytes = stream.next().get_bytes_as('fulltext')
        page_cache[key] = node_bytes
        return node_bytes

188

189

def _dump_tree(self, include_keys=False):
    """Return the tree in a string representation.

    :param include_keys: Passed on to _dump_tree_node.
    :return: The lines _dump_tree_node produces for the root node, joined
        by newlines and terminated by a final newline.
    """
    self._ensure_root()
    res = self._dump_tree_node(self._root_node, prefix='', indent='',
                               include_keys=include_keys)
    res.append('') # Give a trailing '\n'
    return '\n'.join(res)

196

197

def _dump_tree_node(self, node, prefix, indent, include_keys=True):
    """For this node and all children, generate a string representation.

    :param node: The node object to describe.
    :param prefix: The prefix this node is filed under; shown with %r on
        the node's header line.
    :param indent: Text put in front of this node's header line.
    :param include_keys: If true, the header line also carries the first
        element of node.key(), or 'None' when the node has no key.
    :return: A list of lines, without line terminators.
    """
    result = []
    if not include_keys:
        key_str = ''
    else:
        node_key = node.key()
        if node_key is not None:
            key_str = ' %s' % (node_key[0],)
        else:
            key_str = ' None'
    result.append('%s%r %s%s' % (indent, prefix, node.__class__.__name__,
                                 key_str))
    if type(node) is InternalNode:
        # Trigger all child nodes to get loaded
        list(node._iter_nodes(self._store))
        # Children are emitted in sorted prefix order, one level deeper.
        for child_prefix, sub in sorted(node._items.iteritems()):
            result.extend(self._dump_tree_node(sub, child_prefix,
                                               indent + ' ',
                                               include_keys=include_keys))
    else:
        for key, value in sorted(node._items.iteritems()):
            # Don't use prefix nor indent here to line up when used in
            # tests in conjunction with assertEqualDiff
            result.append(' %r %r' % (tuple(key), value))
    return result

222

223

@classmethod
def from_dict(klass, store, initial_value, maximum_size=0, key_width=1,
              search_key_func=None):
    """Create a CHKMap in store with initial_value as the content.

    :param store: The store to record initial_value in, a VersionedFiles
        object with 1-tuple keys supporting CHK key generation.
    :param initial_value: A dict to store in store. Its keys and values
        must be bytestrings.
    :param maximum_size: The maximum_size rule to apply to nodes. This
        determines the size at which no new data is added to a single node.
    :param key_width: The number of elements in each key_tuple being stored
        in this map.
    :param search_key_func: A function mapping a key => bytes. These bytes
        are then used by the internal nodes to split up leaf nodes into
        multiple pages.
    :return: The root chk of the resulting CHKMap.
    :raises AssertionError: If _create_directly hands back something that
        is not a StaticTuple.
    """
    root_key = klass._create_directly(store, initial_value,
        maximum_size=maximum_size, key_width=key_width,
        search_key_func=search_key_func)
    if type(root_key) is not StaticTuple:
        raise AssertionError('we got a %s instead of a StaticTuple'
                             % (type(root_key),))
    return root_key

248

249

@classmethod
def _create_via_map(klass, store, initial_value, maximum_size=0,
                    key_width=1, search_key_func=None):
    """Create a map in store by pushing initial_value through apply_delta.

    An empty map is created, its root node is given maximum_size and
    key_width, and every item of initial_value is then added as an
    insertion (old_key None) in a single apply_delta call.

    :param store: The store to record the map in.
    :param initial_value: A dict of key -> value to put in the map.
    :param maximum_size: The maximum_size set on the root node.
    :param key_width: The key width set on the root node.
    :param search_key_func: Passed to the map constructor.
    :return: What apply_delta returns for the populated map.
    """
    result = klass(store, None, search_key_func=search_key_func)
    result._root_node.set_maximum_size(maximum_size)
    result._root_node._key_width = key_width
    delta = [(None, key, value) for key, value in initial_value.items()]
    root_key = result.apply_delta(delta)
    return root_key

260

261

@classmethod
def _create_directly(klass, store, initial_value, maximum_size=0,
                     key_width=1, search_key_func=None):
    """Create a map in store by filling a LeafNode by hand.

    The items of initial_value are placed straight into a new LeafNode,
    whose size, length and prefixes are then computed. If the leaf holds
    more than one item and is larger than a non-zero maximum_size, it is
    split and the pieces are attached to a new InternalNode. The final
    node is serialised into store.

    :param store: The store to serialise the nodes into.
    :param initial_value: A dict of key -> value to put in the map.
    :param maximum_size: The maximum_size set on the nodes; 0 disables the
        split.
    :param key_width: The key width set on the nodes.
    :param search_key_func: Passed to the node constructors.
    :return: The last key yielded by node.serialise(store).
    :raises AssertionError: If the split yields a single piece.
    """
    node = LeafNode(search_key_func=search_key_func)
    node.set_maximum_size(maximum_size)
    node._key_width = key_width
    as_st = StaticTuple.from_sequence
    node._items = dict([(as_st(key), val) for key, val
                        in initial_value.iteritems()])
    # The bookkeeping fields are set by hand because the items were
    # assigned directly above.
    node._raw_size = sum([node._key_value_len(key, value)
                          for key,value in node._items.iteritems()])
    node._len = len(node._items)
    node._compute_search_prefix()
    node._compute_serialised_prefix()
    if (node._len > 1
        and maximum_size
        and node._current_size() > maximum_size):
        prefix, node_details = node._split(store)
        if len(node_details) == 1:
            raise AssertionError('Failed to split using node._split')
        # Replace the oversized leaf with an internal node that holds the
        # pieces produced by the split.
        node = InternalNode(prefix, search_key_func=search_key_func)
        node.set_maximum_size(maximum_size)
        node._key_width = key_width
        for split, subnode in node_details:
            node.add_node(split, subnode)
    keys = list(node.serialise(store))
    return keys[-1]

288

289

def iter_changes(self, basis):
    """Iterate over the changes between basis and self.

    :param basis: The map to compare self against. This method uses
        basis._root_node, basis._ensure_root(), basis._get_node(),
        basis._search_key_func and basis._store, so basis must provide
        the same private interface as self.
    :return: An iterator of tuples: (key, old_value, new_value). Old_value
        is None for keys only in self; new_value is None for keys only in
        basis.
    """
    # Overview:
    # Read both trees in lexicographic, highest-first order.
    # Any identical nodes we skip
    # Any unique prefixes we output immediately.
    # values in a leaf node are treated as single-value nodes in the tree
    # which allows them to be not-special-cased. We know to output them
    # because their value is a string, not a key(tuple) or node.
    #
    # corner cases to beware of when considering this function:
    # *) common references are at different heights.
    #    consider two trees:
    #    {'a': LeafNode={'aaa':'foo', 'aab':'bar'}, 'b': LeafNode={'b'}}
    #    {'a': InternalNode={'aa':LeafNode={'aaa':'foo', 'aab':'bar'},
    #                        'ab':LeafNode={'ab':'bar'}}
    #     'b': LeafNode={'b'}}
    #    the node with aaa/aab will only be encountered in the second tree
    #    after reading the 'a' subtree, but it is encountered in the first
    #    tree immediately. Variations on this may have read internal nodes
    #    like this.  we want to cut the entire pending subtree when we
    #    realise we have a common node.  For this we use a list of keys -
    #    the path to a node - and check the entire path is clean as we
    #    process each item.
    if self._node_key(self._root_node) == self._node_key(basis._root_node):
        # Identical roots: the maps have identical content, nothing to do.
        return
    self._ensure_root()
    basis._ensure_root()
    # Keys of nodes whose whole subtree should be skipped. Nothing in this
    # method currently adds to this set, so check_excluded() always answers
    # False; the hook is kept so the traversal logic stays unchanged.
    excluded_keys = set()
    # Two heaps, each element is (prefix, key, node_or_value, key_path):
    #   prefix   - the search key (leaf items) or search prefix (children)
    #   key      - the item key for a leaf value, None for a child node
    #   node     - a value (when key is not None) or a tuple/Node object
    #   key_path - nested tuples (node_key, parent_path), tail-sharing
    #              down the tree; None terminates the chain.
    self_pending = []
    basis_pending = []

    def process_node(node, path, a_map, pending):
        # take a node and expand it: push each of its entries onto pending
        node = a_map._get_node(node)
        if type(node) == LeafNode:
            path = (node._key, path)
            for key, value in node._items.items():
                # For a LeafNode, the key is a serialized_key, rather than
                # a search_key, but the heap is using search_keys
                search_key = node._search_key_func(key)
                heapq.heappush(pending, (search_key, key, value, path))
        else:
            # type(node) == InternalNode
            path = (node._key, path)
            for prefix, child in node._items.items():
                heapq.heappush(pending, (prefix, None, child, path))

    def process_common_internal_nodes(self_node, basis_node):
        # Only queue the children that differ between the two nodes.
        self_items = set(self_node._items.items())
        basis_items = set(basis_node._items.items())
        path = (self_node._key, None)
        for prefix, child in self_items - basis_items:
            heapq.heappush(self_pending, (prefix, None, child, path))
        path = (basis_node._key, None)
        for prefix, child in basis_items - self_items:
            heapq.heappush(basis_pending, (prefix, None, child, path))

    def process_common_leaf_nodes(self_node, basis_node):
        # Only queue the key/value pairs that differ between the leaves.
        self_items = set(self_node._items.items())
        basis_items = set(basis_node._items.items())
        path = (self_node._key, None)
        for key, value in self_items - basis_items:
            prefix = self._search_key_func(key)
            heapq.heappush(self_pending, (prefix, key, value, path))
        path = (basis_node._key, None)
        for key, value in basis_items - self_items:
            prefix = basis._search_key_func(key)
            heapq.heappush(basis_pending, (prefix, key, value, path))

    def process_common_prefix_nodes(self_node, self_path,
                                    basis_node, basis_path):
        # Would it be more efficient if we could request both at the same
        # time?
        self_node = self._get_node(self_node)
        basis_node = basis._get_node(basis_node)
        if (type(self_node) == InternalNode
            and type(basis_node) == InternalNode):
            # Matching internal nodes
            process_common_internal_nodes(self_node, basis_node)
        elif (type(self_node) == LeafNode
              and type(basis_node) == LeafNode):
            process_common_leaf_nodes(self_node, basis_node)
        else:
            # Mixed node types: expand each side independently.
            process_node(self_node, self_path, self, self_pending)
            process_node(basis_node, basis_path, basis, basis_pending)

    process_common_prefix_nodes(self._root_node, None,
                                basis._root_node, None)

    def check_excluded(key_path):
        # Note that this is N^2, it depends on us trimming trees
        # aggressively to not become slow.
        # A better implementation would probably have a reverse map
        # back to the children of a node, and jump straight to it when
        # a common node is detected, the proceed to remove the already
        # pending children. bzrlib.graph has a searcher module with a
        # similar problem.
        while key_path is not None:
            key, key_path = key_path
            if key in excluded_keys:
                return True
        return False

    while self_pending or basis_pending:
        if not self_pending:
            # self is exhausted: output remainder of basis
            for prefix, key, node, path in basis_pending:
                if check_excluded(path):
                    continue
                node = basis._get_node(node)
                if key is not None:
                    # a value
                    yield (key, node, None)
                else:
                    # subtree - fastpath the entire thing.
                    for key, value in node.iteritems(basis._store):
                        yield (key, value, None)
            return
        elif not basis_pending:
            # basis is exhausted: output remainder of self.
            for prefix, key, node, path in self_pending:
                if check_excluded(path):
                    continue
                node = self._get_node(node)
                if key is not None:
                    # a value
                    yield (key, None, node)
                else:
                    # subtree - fastpath the entire thing.
                    for key, value in node.iteritems(self._store):
                        yield (key, None, value)
            return
        else:
            # XXX: future optimisation - yield the smaller items
            # immediately rather than pushing everything on/off the
            # heaps. Applies to both internal nodes and leafnodes.
            if self_pending[0][0] < basis_pending[0][0]:
                # expand self
                prefix, key, node, path = heapq.heappop(self_pending)
                if check_excluded(path):
                    continue
                if key is not None:
                    # a value
                    yield (key, None, node)
                else:
                    process_node(node, path, self, self_pending)
                    continue
            elif self_pending[0][0] > basis_pending[0][0]:
                # expand basis
                prefix, key, node, path = heapq.heappop(basis_pending)
                if check_excluded(path):
                    continue
                if key is not None:
                    # a value
                    yield (key, node, None)
                else:
                    process_node(node, path, basis, basis_pending)
                    continue
            else:
                # common prefix: possibly expand both.
                # A None key marks a child node (needs reading); a real key
                # marks a leaf value.
                read_self = self_pending[0][1] is None
                read_basis = basis_pending[0][1] is None
                if not read_self and not read_basis:
                    # compare a common value
                    self_details = heapq.heappop(self_pending)
                    basis_details = heapq.heappop(basis_pending)
                    if self_details[2] != basis_details[2]:
                        yield (self_details[1],
                               basis_details[2], self_details[2])
                    continue
                # At least one side wasn't a simple value
                # NOTE(review): when exactly one side is a value, _node_key
                # is handed that value here - confirm this cannot happen or
                # that values are handled by _node_key.
                if (self._node_key(self_pending[0][2]) ==
                    self._node_key(basis_pending[0][2])):
                    # Identical pointers, skip (and don't bother adding to
                    # excluded, it won't turn up again.
                    heapq.heappop(self_pending)
                    heapq.heappop(basis_pending)
                    continue
                # Now we need to expand this node before we can continue
                if read_self and read_basis:
                    # Both sides start with the same prefix, so process
                    # them in parallel
                    self_prefix, _, self_node, self_path = heapq.heappop(
                        self_pending)
                    basis_prefix, _, basis_node, basis_path = heapq.heappop(
                        basis_pending)
                    if self_prefix != basis_prefix:
                        raise AssertionError(
                            '%r != %r' % (self_prefix, basis_prefix))
                    process_common_prefix_nodes(
                        self_node, self_path,
                        basis_node, basis_path)
                    continue
                if read_self:
                    prefix, key, node, path = heapq.heappop(self_pending)
                    if check_excluded(path):
                        continue
                    process_node(node, path, self, self_pending)
                if read_basis:
                    prefix, key, node, path = heapq.heappop(basis_pending)
                    if check_excluded(path):
                        continue
                    process_node(node, path, basis, basis_pending)

509

510

def iteritems(self, key_filter=None):
    """Iterate over the entire CHKMap's contents.

    :param key_filter: Optional iterable of keys restricting what is
        returned. Each entry is converted with StaticTuple.from_sequence
        before being handed to the root node.
    :return: Whatever the root node's iteritems() returns for this map's
        store and the (converted) filter.
    """
    self._ensure_root()
    if key_filter is not None:
        to_static = StaticTuple.from_sequence
        key_filter = [to_static(wanted) for wanted in key_filter]
    root = self._root_node
    return root.iteritems(self._store, key_filter=key_filter)

517

518

def key(self):
    """Return the key for this map.

    When the root is still an unloaded StaticTuple reference that
    reference is the key; otherwise the loaded root node's _key is used.
    """
    root = self._root_node
    if type(root) is not StaticTuple:
        return root._key
    return root

524

525

def __len__(self):
    """Return len() of the root node, loading the root first if needed."""
    self._ensure_root()
    root = self._root_node
    return len(root)

528

529

def map(self, key, value):
    """Map a key tuple to value.

    The root node performs the mapping and reports back a prefix plus a
    list of (split_prefix, node) pairs. A single pair means its node is
    the new root; several pairs mean the root split, so a fresh
    InternalNode is created to hold them.

    :param key: A key to map.
    :param value: The value to assign to key.
    """
    key = StaticTuple.from_sequence(key)
    # Need a root object.
    self._ensure_root()
    prefix, node_details = self._root_node.map(self._store, key, value)
    if len(node_details) == 1:
        self._root_node = node_details[0][1]
        return
    # The root overflowed: build a parent that inherits the size limit and
    # key width of the first returned node.
    template = node_details[0][1]
    new_root = InternalNode(prefix, search_key_func=self._search_key_func)
    self._root_node = new_root
    new_root.set_maximum_size(template.maximum_size)
    new_root._key_width = template._key_width
    for split, child in node_details:
        new_root.add_node(split, child)

548

549

def _node_key(self, node):
    """Get the key for a node whether it's a tuple or node.

    Plain tuples are first converted with StaticTuple.from_sequence. A
    StaticTuple is returned as-is; anything else is assumed to be a node
    object and its _key attribute is returned.
    """
    if type(node) is tuple:
        node = StaticTuple.from_sequence(node)
    if type(node) is not StaticTuple:
        return node._key
    return node

557

558

def unmap(self, key, check_remap=True):
    """Remove key from the map.

    :param key: The key to remove; converted with
        StaticTuple.from_sequence.
    :param check_remap: Forwarded to the root's unmap() only when the root
        is an InternalNode.
    """
    key = StaticTuple.from_sequence(key)
    self._ensure_root()
    root = self._root_node
    if type(root) is InternalNode:
        replacement = root.unmap(self._store, key,
                                 check_remap=check_remap)
    else:
        replacement = root.unmap(self._store, key)
    # unmap() hands back the node that should now act as the root.
    self._root_node = replacement

568

569

def _check_remap(self):
    """Check if nodes can be collapsed.

    Only an InternalNode root is checked; the root is replaced by
    whatever its _check_remap() returns.
    """
    self._ensure_root()
    root = self._root_node
    if type(root) is not InternalNode:
        return
    self._root_node = root._check_remap(self._store)

574

575

def _save(self):
    """Save the map completely.

    :return: The key of the root node.
    """
    root = self._root_node
    if type(root) is StaticTuple:
        # Already saved.
        return root
    # serialise() reports every key it wrote; the last one is returned as
    # the root's key.
    written = list(root.serialise(self._store))
    return written[-1]

585

586

587

class Node(object):
    """Base class defining the protocol for CHK Map nodes.

    :ivar _raw_size: The total size of the serialized key:value data, before
        adding the header bytes, and without prefix compression.
    """

    __slots__ = ('_key', '_len', '_maximum_size', '_key_width',
                 '_raw_size', '_items', '_search_prefix', '_search_key_func'
                )

    def __init__(self, key_width=1):
        """Create a node.

        :param key_width: The width of keys for this node.
        """
        # The pointers/values this node has - meaning defined by child
        # classes.
        self._items = {}
        # Current number of elements
        self._len = 0
        # current size in bytes
        self._raw_size = 0
        self._maximum_size = 0
        self._key_width = key_width
        self._key = None
        # The common search prefix
        self._search_prefix = None

    def __repr__(self):
        """Return a one-line summary with the item keys abbreviated."""
        shown = str(sorted(self._items))
        if len(shown) > 20:
            # Keep the first 16 characters and mark the truncation.
            shown = shown[:16] + '...]'
        fields = (self.__class__.__name__, self._key, self._len,
                  self._raw_size, self._maximum_size, self._search_prefix,
                  shown)
        return '%s(key:%s len:%s size:%s max:%s prefix:%s items:%s)' % fields

    def key(self):
        """Return this node's _key attribute."""
        return self._key

    def __len__(self):
        """Return the number of elements recorded in _len."""
        return self._len

    @property
    def maximum_size(self):
        """What is the upper limit for adding references to a node."""
        return self._maximum_size

    def set_maximum_size(self, new_size):
        """Set the size threshold for nodes.

        :param new_size: The size at which no data is added to a node. 0 for
            unlimited.
        """
        self._maximum_size = new_size

    @classmethod
    def common_prefix(cls, prefix, key):
        """Given 2 strings, return the longest prefix common to both.

        :param prefix: This has been the common prefix for other keys, so it is
            more likely to be the common prefix in this case as well.
        :param key: Another string to compare to
        """
        if key.startswith(prefix):
            # Fast path: the existing prefix still applies unchanged.
            return prefix
        # Count how many leading characters agree.
        matched = 0
        for left, right in zip(prefix, key):
            if left != right:
                break
            matched += 1
        return prefix[:matched]

    @classmethod
    def common_prefix_for_keys(cls, keys):
        """Given a list of keys, find their common prefix.

        :param keys: An iterable of strings.
        :return: The longest common prefix of all keys, or None when keys
            is empty.
        """
        shared = None
        for key in keys:
            if shared is None:
                # First key seen: it is trivially the common prefix so far.
                shared = key
            else:
                shared = cls.common_prefix(shared, key)
                if not shared:
                    # if the common prefix is the empty string, then we
                    # know it won't change further
                    return ''
        return shared

679

680

681

# Singleton indicating we have not computed _search_prefix yet

682

_unknown = object()

683

684

class LeafNode(Node):
    """A node containing actual key:value pairs.

    :ivar _items: A dict of key->value items. The key is in tuple form.
    :ivar _raw_size: (inherited from Node) The number of bytes that would
        be used by serializing all of the key/value pairs, without prefix
        compression and without the header.
    :ivar _common_serialised_prefix: The longest prefix shared by the
        serialised form of every key in this node; None while the node has
        no items.
    """

    __slots__ = ('_common_serialised_prefix',)

    def __init__(self, search_key_func=None):
        """Create an empty leaf.

        :param search_key_func: Callable turning a key into its search
            key. Defaults to _search_key_plain.
        """
        Node.__init__(self)
        # All of the keys in this leaf node share this common prefix
        self._common_serialised_prefix = None
        if search_key_func is None:
            self._search_key_func = _search_key_plain
        else:
            self._search_key_func = search_key_func

    def __repr__(self):
        """Return a one-line summary with the item keys abbreviated."""
        items_str = str(sorted(self._items))
        if len(items_str) > 20:
            items_str = items_str[:16] + '...]'
        return \
            '%s(key:%s len:%s size:%s max:%s prefix:%s keywidth:%s items:%s)' \
            % (self.__class__.__name__, self._key, self._len, self._raw_size,
               self._maximum_size, self._search_prefix, self._key_width, items_str)

    def _current_size(self):
        """Answer the current serialised size of this node.

        This differs from self._raw_size in that it includes the bytes used for
        the header.
        """
        if self._common_serialised_prefix is None:
            bytes_for_items = 0
            prefix_len = 0
        else:
            # We will store a single string with the common prefix
            # And then that common prefix will not be stored in any of the
            # entry lines
            prefix_len = len(self._common_serialised_prefix)
            bytes_for_items = (self._raw_size - (prefix_len * self._len))
        return (9 # 'chkleaf:\n'
            + len(str(self._maximum_size)) + 1
            + len(str(self._key_width)) + 1
            + len(str(self._len)) + 1
            + prefix_len + 1
            + bytes_for_items)

    @classmethod
    def deserialise(klass, bytes, key, search_key_func=None):
        """Deserialise bytes, with key key, into a LeafNode.

        :param bytes: The bytes of the node.
        :param key: The key that the serialised node has.
        :param search_key_func: Passed through to _deserialise_leaf_node.
        """
        key = static_tuple.expect_static_tuple(key)
        return _deserialise_leaf_node(bytes, key,
                                      search_key_func=search_key_func)

    def iteritems(self, store, key_filter=None):
        """Iterate over items in the node.

        :param store: Not used by a leaf; accepted so leaves and internal
            nodes share one signature.
        :param key_filter: A filter to apply to the node. It should be a
            list/set/dict or similar repeatedly iterable container.
        :return: A generator of (key, value) pairs.
        """
        if key_filter is not None:
            # Adjust the filter - short elements go to a prefix filter. All
            # other items are looked up directly.
            # XXX: perhaps defaultdict? Profiling<rinse and repeat>
            filters = {}
            for key in key_filter:
                if len(key) == self._key_width:
                    # This filter is meant to match exactly one key, yield it
                    # if we have it.
                    try:
                        yield key, self._items[key]
                    except KeyError:
                        # This key is not present in this map, continue
                        pass
                else:
                    # Short items, we need to match based on a prefix
                    length_filter = filters.setdefault(len(key), set())
                    length_filter.add(key)
            if filters:
                filters = filters.items()
                for item in self._items.iteritems():
                    for length, length_filter in filters:
                        if item[0][:length] in length_filter:
                            yield item
                            # One match is enough; don't yield an item twice.
                            break
        else:
            for item in self._items.iteritems():
                yield item

    def _key_value_len(self, key, value):
        """Return the serialised size in bytes of one key/value entry.

        The entry is written by serialise() as the serialised key, a NUL,
        the number of value lines, a newline, and then the value followed
        by a newline.
        """
        # TODO: Should probably be done without actually joining the key, but
        #       then that can be done via the C extension
        # serialise() writes len(chunks_to_lines([value + '\n'])), i.e. one
        # more than the number of newlines inside value, so the width of the
        # line-count field must be measured on count + 1. Measuring it on
        # the bare count is one byte short for values with 9, 99, ...
        # newlines and trips the 'Invalid _current_size' check.
        return (len(self._serialise_key(key)) + 1
                + len(str(value.count('\n') + 1)) + 1
                + len(value) + 1)

    def _search_key(self, key):
        """Return the search key for key using this node's function."""
        return self._search_key_func(key)

    def _map_no_split(self, key, value):
        """Map a key to a value.

        This assumes either the key does not already exist, or you have already
        removed its size and length from self.

        :return: True if adding this key should cause us to split.
        """
        self._items[key] = value
        self._raw_size += self._key_value_len(key, value)
        self._len += 1
        serialised_key = self._serialise_key(key)
        if self._common_serialised_prefix is None:
            self._common_serialised_prefix = serialised_key
        else:
            self._common_serialised_prefix = self.common_prefix(
                self._common_serialised_prefix, serialised_key)
        search_key = self._search_key(key)
        if self._search_prefix is _unknown:
            # Not computed yet: derive it from every key now in the node
            # (which already includes the one just added).
            self._compute_search_prefix()
        if self._search_prefix is None:
            self._search_prefix = search_key
        else:
            self._search_prefix = self.common_prefix(
                self._search_prefix, search_key)
        if (self._len > 1
            and self._maximum_size
            and self._current_size() > self._maximum_size):
            # Check to see if all of the search_keys for this node are
            # identical. We allow the node to grow under that circumstance
            # (we could track this as common state, but it is infrequent)
            if (search_key != self._search_prefix
                or not self._are_search_keys_identical()):
                return True
        return False

    def _split(self, store):
        """We have overflowed.

        Split this node into multiple LeafNodes, return it up the stack so that
        the next layer creates a new InternalNode and references the new nodes.

        :return: (common_search_prefix, [(node_search_prefix, node)])
        :raises AssertionError: If the search prefix has not been computed.
        """
        if self._search_prefix is _unknown:
            raise AssertionError('Search prefix must be known')
        common_prefix = self._search_prefix
        # Children are keyed on one more character than the shared prefix.
        split_at = len(common_prefix) + 1
        result = {}
        for key, value in self._items.iteritems():
            search_key = self._search_key(key)
            prefix = search_key[:split_at]
            # TODO: Generally only 1 key can be exactly the right length,
            #       which means we can only have 1 key in the node pointed
            #       at by the 'prefix\0' key. We might want to consider
            #       folding it into the containing InternalNode rather than
            #       having a fixed length-1 node.
            #       Note this is probably not true for hash keys, as they
            #       may get a '\00' node anywhere, but won't have keys of
            #       different lengths.
            if len(prefix) < split_at:
                # Pad short search keys with NULs up to the split width.
                prefix += '\x00'*(split_at - len(prefix))
            if prefix not in result:
                node = LeafNode(search_key_func=self._search_key_func)
                node.set_maximum_size(self._maximum_size)
                node._key_width = self._key_width
                result[prefix] = node
            else:
                node = result[prefix]
            sub_prefix, node_details = node.map(store, key, value)
            if len(node_details) > 1:
                if prefix != sub_prefix:
                    # This node has been split and is now found via a different
                    # path
                    result.pop(prefix)
                new_node = InternalNode(sub_prefix,
                    search_key_func=self._search_key_func)
                new_node.set_maximum_size(self._maximum_size)
                new_node._key_width = self._key_width
                for split, node in node_details:
                    new_node.add_node(split, node)
                result[prefix] = new_node
        return common_prefix, result.items()

    def map(self, store, key, value):
        """Map key to value.

        :return: The result of _split() if the node overflowed, otherwise
            (search_prefix, [("", self)]).
        """
        if key in self._items:
            # Replacing a value: back out the old entry's accounting first.
            self._raw_size -= self._key_value_len(key, self._items[key])
            self._len -= 1
        # The content is changing, so any previously assigned key is stale.
        self._key = None
        if self._map_no_split(key, value):
            return self._split(store)
        else:
            if self._search_prefix is _unknown:
                raise AssertionError('%r must be known' % self._search_prefix)
            return self._search_prefix, [("", self)]

    # Serialise a key tuple by joining its elements with NUL bytes.
    _serialise_key = '\x00'.join

    def serialise(self, store):
        """Serialise the LeafNode to store.

        :param store: A VersionedFiles honouring the CHK extensions.
        :return: An iterable of the keys inserted by this operation.
        :raises AssertionError: If the tracked prefix or size disagrees
            with what was actually serialised.
        """
        lines = ["chkleaf:\n"]
        lines.append("%d\n" % self._maximum_size)
        lines.append("%d\n" % self._key_width)
        lines.append("%d\n" % self._len)
        if self._common_serialised_prefix is None:
            lines.append('\n')
            if len(self._items) != 0:
                raise AssertionError('If _common_serialised_prefix is None'
                    ' we should have no items')
        else:
            lines.append('%s\n' % (self._common_serialised_prefix,))
            prefix_len = len(self._common_serialised_prefix)
        for key, value in sorted(self._items.items()):
            # Always add a final newline
            value_lines = osutils.chunks_to_lines([value + '\n'])
            serialized = "%s\x00%s\n" % (self._serialise_key(key),
                                         len(value_lines))
            if not serialized.startswith(self._common_serialised_prefix):
                raise AssertionError('We thought the common prefix was %r'
                    ' but entry %r does not have it in common'
                    % (self._common_serialised_prefix, serialized))
            # The shared prefix was written once above; strip it here.
            lines.append(serialized[prefix_len:])
            lines.extend(value_lines)
        sha1, _, _ = store.add_lines((None,), (), lines)
        self._key = StaticTuple("sha1:" + sha1,).intern()
        bytes = ''.join(lines)
        if len(bytes) != self._current_size():
            raise AssertionError('Invalid _current_size')
        _get_cache().add(self._key, bytes)
        return [self._key]

    def refs(self):
        """Return the references to other CHK's held by this node."""
        return []

    def _compute_search_prefix(self):
        """Determine the common search prefix for all keys in this node.

        :return: A bytestring of the longest search key prefix that is
            common to every key in this node (None if there are no keys).
        """
        search_keys = [self._search_key_func(key) for key in self._items]
        self._search_prefix = self.common_prefix_for_keys(search_keys)
        return self._search_prefix

    def _are_search_keys_identical(self):
        """Check to see if the search keys for all entries are the same.

        When using a hash as the search_key it is possible for non-identical
        keys to collide. If that happens enough, we may try overflow a
        LeafNode, but as all are collisions, we must not split.
        """
        common_search_key = None
        for key in self._items:
            search_key = self._search_key(key)
            if common_search_key is None:
                common_search_key = search_key
            elif search_key != common_search_key:
                return False
        return True

    def _compute_serialised_prefix(self):
        """Determine the common prefix for serialised keys in this node.

        :return: A bytestring of the longest serialised key prefix that is
            common to every key in this node (None if there are no keys).
        """
        serialised_keys = [self._serialise_key(key) for key in self._items]
        self._common_serialised_prefix = self.common_prefix_for_keys(
            serialised_keys)
        return self._common_serialised_prefix

    def unmap(self, store, key):
        """Unmap key from the node.

        :return: self, after the key has been removed.
        :raises KeyError: If key is not in this node.
        """
        try:
            self._raw_size -= self._key_value_len(key, self._items[key])
        except KeyError:
            trace.mutter("key %s not found in %r", key, self._items)
            raise
        self._len -= 1
        del self._items[key]
        self._key = None
        # Recompute from scratch
        self._compute_search_prefix()
        self._compute_serialised_prefix()
        return self

981

982

983

class InternalNode(Node):

984

"""A node that contains references to other nodes.

985

986

An InternalNode is responsible for mapping search key prefixes to child

987

nodes.

988

989

:ivar _items: serialised_key => node dictionary. node may be a tuple,

990

LeafNode or InternalNode.

991

"""

992

993

__slots__ = ('_node_width',)

994

995

def __init__(self, prefix='', search_key_func=None):
    """Create an InternalNode with no children.

    :param prefix: The search prefix for this node.
    :param search_key_func: Callable turning a key into its search key.
        Defaults to _search_key_plain.
    """
    Node.__init__(self)
    # How many octets key prefixes within this node are.
    self._node_width = 0
    self._search_prefix = prefix
    if search_key_func is None:
        search_key_func = _search_key_plain
    self._search_key_func = search_key_func

1005

1006

def add_node(self, prefix, node):
    """Add a child node with prefix prefix, and node node.

    :param prefix: The search key prefix for node. It must extend this
        node's _search_prefix by exactly one character.
    :param node: The node being added.
    :raises AssertionError: If this node has no search prefix or prefix
        does not have the required form.
    """
    parent_prefix = self._search_prefix
    if parent_prefix is None:
        raise AssertionError("_search_prefix should not be None")
    if not prefix.startswith(parent_prefix):
        raise AssertionError("prefixes mismatch: %s must start with %s"
            % (prefix, parent_prefix))
    expected_width = len(parent_prefix) + 1
    if len(prefix) != expected_width:
        raise AssertionError("prefix wrong length: len(%s) is not %d" %
            (prefix, expected_width))
    self._len += len(node)
    if len(self._items) == 0:
        # First child: it fixes the width of every prefix in this node.
        self._node_width = len(prefix)
        if self._node_width != expected_width:
            raise AssertionError("node width mismatch: %d is not %d" %
                (self._node_width, expected_width))
    self._items[prefix] = node
    # The content changed, so any previously assigned key is stale.
    self._key = None

1028

1029

def _current_size(self):
    """Answer the current serialised size of this node.

    This is _raw_size plus the number of characters needed to print the
    _len, _key_width and _maximum_size fields.
    """
    size = self._raw_size
    for field in (self._len, self._key_width, self._maximum_size):
        size += len(str(field))
    return size

1033

1034

@classmethod
def deserialise(klass, bytes, key, search_key_func=None):
    """Deserialise bytes to an InternalNode, with key key.

    :param bytes: The bytes of the node.
    :param key: The key that the serialised node has. It is passed
        through static_tuple.expect_static_tuple first.
    :param search_key_func: Passed through to _deserialise_internal_node.
    :return: An InternalNode instance.
    """
    checked_key = static_tuple.expect_static_tuple(key)
    return _deserialise_internal_node(
        bytes, checked_key, search_key_func=search_key_func)

1045

1046

def iteritems(self, store, key_filter=None):
    """Iterate over the items of every matching child node.

    :param store: The store handed to _iter_nodes() and to each child.
    :param key_filter: Optional key filter; _iter_nodes() narrows it to a
        per-child filter that is passed on to that child's iteritems().
    :return: A generator of the items yielded by the children, in the
        order _iter_nodes() produces the children.
    """
    matching_children = self._iter_nodes(store, key_filter=key_filter)
    for child, child_filter in matching_children:
        for entry in child.iteritems(store, key_filter=child_filter):
            yield entry

1050

1051

def _iter_nodes(self, store, key_filter=None, batch_size=None):
    """Iterate over node objects which match key_filter.

    Children that are already loaded are yielded first, then children
    found in the page cache, and finally children read from store. Every
    child that gets loaded replaces its StaticTuple reference in
    self._items.

    :param store: A store to use for accessing content.
    :param key_filter: A key filter to filter nodes. Only nodes that might
        contain a key in key_filter will be returned.
    :param batch_size: If not None, then we will return the nodes that had
        to be read using get_record_stream in batches, rather than reading
        them all at once.
    :return: An iterable of (node, node_key_filter) pairs. This function
        does not have to be fully consumed. (There will be no pending I/O
        when items are being returned.)
    """
    # Map from chk key ('sha1:...',) to (prefix, key_filter)
    # prefix is the key in self._items to use, key_filter is the key_filter
    # entries that would match this node
    unloaded = {}
    shortcut = False
    if key_filter is None:
        # yielding all nodes, yield whatever we have, and queue up a read
        # for whatever we are missing
        shortcut = True
        for prefix, node in self._items.iteritems():
            if node.__class__ is StaticTuple:
                unloaded[node] = (prefix, None)
            else:
                yield node, None
    elif len(key_filter) == 1:
        # Technically, this path could also be handled by the first check
        # in 'self._node_width' in length_filters. However, we can handle
        # this case without spending any time building up the
        # prefix_to_keys, etc state.

        # Grab the single element with a for/break: per the original
        # author's timeit measurements this was the fastest way to do so
        # (about 0.105us, versus 0.626us for list(key_filter)[0]).
        for key in key_filter:
            break
        search_prefix = self._search_prefix_filter(key)
        if len(search_prefix) == self._node_width:
            # This item will match exactly, so just do a dict lookup, and
            # see what we can return
            shortcut = True
            try:
                node = self._items[search_prefix]
            except KeyError:
                # A given key can only match 1 child node, if it isn't
                # there, then we can just return nothing
                return
            if node.__class__ is StaticTuple:
                unloaded[node] = (search_prefix, [key])
            else:
                # This is loaded, and the only thing that can match,
                # return
                yield node, [key]
                return
    if not shortcut:
        # First, convert all keys into a list of search prefixes
        # Aggregate common prefixes, and track the keys they come from
        prefix_to_keys = {}
        length_filters = {}
        for key in key_filter:
            search_prefix = self._search_prefix_filter(key)
            same_length = length_filters.setdefault(
                len(search_prefix), set())
            same_length.add(search_prefix)
            prefix_to_keys.setdefault(search_prefix, []).append(key)

        if (self._node_width in length_filters
            and len(length_filters) == 1):
            # all of the search prefixes match exactly _node_width. This
            # means that everything is an exact match, and we can do a
            # lookup into self._items, rather than iterating over the items
            # dict.
            for search_prefix in length_filters[self._node_width]:
                try:
                    node = self._items[search_prefix]
                except KeyError:
                    # We can ignore this one
                    continue
                node_key_filter = prefix_to_keys[search_prefix]
                if node.__class__ is StaticTuple:
                    unloaded[node] = (search_prefix, node_key_filter)
                else:
                    yield node, node_key_filter
        else:
            # The slow way. We walk every item in self._items, and check to
            # see if there are any matches
            length_filters = length_filters.items()
            for prefix, node in self._items.iteritems():
                node_key_filter = []
                for length, length_filter in length_filters:
                    sub_prefix = prefix[:length]
                    if sub_prefix in length_filter:
                        node_key_filter.extend(prefix_to_keys[sub_prefix])
                if node_key_filter: # this key matched something, yield it
                    if node.__class__ is StaticTuple:
                        unloaded[node] = (prefix, node_key_filter)
                    else:
                        yield node, node_key_filter
    if unloaded:
        # Look in the page cache for some more bytes
        served_from_cache = set()
        for key in unloaded:
            try:
                node_bytes = _get_cache()[key]
            except KeyError:
                continue
            else:
                node = _deserialise(node_bytes, key,
                    search_key_func=self._search_key_func)
                prefix, node_key_filter = unloaded[key]
                self._items[prefix] = node
                served_from_cache.add(key)
                yield node, node_key_filter
        # Drop the cache hits only after the loop, so the dict is not
        # modified while it is being iterated.
        for key in served_from_cache:
            del unloaded[key]
    if unloaded:
        # demand load some pages.
        if batch_size is None:
            # Read all the keys in
            batch_size = len(unloaded)
        key_order = list(unloaded)
        for batch_start in range(0, len(key_order), batch_size):
            batch = key_order[batch_start:batch_start + batch_size]
            # We have to fully consume the stream so there is no pending
            # I/O, so we buffer the nodes for now.
            stream = store.get_record_stream(batch, 'unordered', True)
            node_and_filters = []
            for record in stream:
                node_bytes = record.get_bytes_as('fulltext')
                node = _deserialise(node_bytes, record.key,
                    search_key_func=self._search_key_func)
                prefix, node_key_filter = unloaded[record.key]
                node_and_filters.append((node, node_key_filter))
                self._items[prefix] = node
                _get_cache().add(record.key, node_bytes)
            for info in node_and_filters:
                yield info

1199

1200

def map(self, store, key, value):
    """Map key to value.

    :param store: Passed through to self._iter_nodes(), the child's map()
        and self._check_remap().
    :param key: The key to map.
    :param value: The value to store for key.
    :return: A tuple (search_prefix, [(split, node)]). The list holds a
        single ('', node) entry, where node is self, the result of
        self._check_remap(), or whatever a newly created parent's map()
        returned.
    :raises AssertionError: If this node has no items, if _node_width is
        not len(_search_prefix) + 1, or if the resulting node has no
        search prefix.
    """
    if not len(self._items):
        raise AssertionError("can't map in an empty InternalNode.")
    search_key = self._search_key(key)
    if self._node_width != len(self._search_prefix) + 1:
        raise AssertionError("node width mismatch: %d is not %d" %
            (self._node_width, len(self._search_prefix) + 1))
    if not search_key.startswith(self._search_prefix):
        # This key doesn't fit in this index, so we need to split at the
        # point where it would fit, insert self into that internal node,
        # and then map this key into that node.
        new_prefix = self.common_prefix(self._search_prefix,
                                        search_key)
        new_parent = InternalNode(new_prefix,
            search_key_func=self._search_key_func)
        new_parent.set_maximum_size(self._maximum_size)
        new_parent._key_width = self._key_width
        new_parent.add_node(self._search_prefix[:len(new_prefix)+1],
                            self)
        return new_parent.map(store, key, value)
    children = [node for node, _
                      in self._iter_nodes(store, key_filter=[key])]
    if children:
        child = children[0]
    else:
        # new child needed:
        child = self._new_child(search_key, LeafNode)
    # Remember the child's length (and size, for leaves) before mapping so
    # that our own _len can be adjusted and shrinkage detected afterwards.
    old_len = len(child)
    if type(child) is LeafNode:
        old_size = child._current_size()
    else:
        old_size = None
    prefix, node_details = child.map(store, key, value)
    if len(node_details) == 1:
        # child may have shrunk, or might be a new node
        child = node_details[0][1]
        self._len = self._len - old_len + len(child)
        self._items[search_key] = child
        # Our content changed, so any previously computed key is stale.
        self._key = None
        new_node = self
        if type(child) is LeafNode:
            if old_size is None:
                # The old node was an InternalNode which means it has now
                # collapsed, so we need to check if it will chain to a
                # collapse at this level.
                trace.mutter("checking remap as InternalNode -> LeafNode")
                new_node = self._check_remap(store)
            else:
                # If the LeafNode has shrunk in size, we may want to run
                # a remap check. Checking for a remap is expensive though
                # and the frequency of a successful remap is very low.
                # Shrinkage by small amounts is common, so we only do the
                # remap check if the new_size is low or the shrinkage
                # amount is over a configurable limit.
                new_size = child._current_size()
                shrinkage = old_size - new_size
                if (shrinkage > 0 and new_size < _INTERESTING_NEW_SIZE
                    or shrinkage > _INTERESTING_SHRINKAGE_LIMIT):
                    trace.mutter(
                        "checking remap as size shrunk by %d to be %d",
                        shrinkage, new_size)
                    new_node = self._check_remap(store)
        if new_node._search_prefix is None:
            raise AssertionError("_search_prefix should not be None")
        return new_node._search_prefix, [('', new_node)]
    # child has overflown - create a new intermediate node.
    # XXX: This is where we might want to try and expand our depth
    # to refer to more bytes of every child (which would give us
    # multiple pointers to child nodes, but less intermediate nodes)
    child = self._new_child(search_key, InternalNode)
    child._search_prefix = prefix
    for split, node in node_details:
        child.add_node(split, node)
    self._len = self._len - old_len + len(child)
    self._key = None
    return self._search_prefix, [("", self)]

1277

1278

def _new_child(self, search_key, klass):
    """Create a child of type klass and register it under search_key.

    The new node inherits this node's maximum size, key width and search
    key function, and is stored in self._items before being returned.

    :param search_key: The key under which the child is stored in
        self._items.
    :param klass: A zero-argument callable producing the new node.
    :return: The newly created node.
    """
    node = klass()
    node.set_maximum_size(self._maximum_size)
    node._key_width = self._key_width
    node._search_key_func = self._search_key_func
    self._items[search_key] = node
    return node

1286

1287

def serialise(self, store):
    """Serialise this node, and any altered children, to store.

    Children that are still bare keys, or that still carry a key of their
    own, are skipped; every other child is serialised first and its keys
    are yielded before this node's own key.

    :param store: A VersionedFiles honouring the CHK extensions.
    :return: An iterable of the keys inserted by this operation.
    :raises AssertionError: If this node has no search prefix, or an item
        prefix does not start with it.
    """
    for child in self._items.itervalues():
        if type(child) is StaticTuple or child._key is not None:
            # A StaticTuple was never deserialised; a node that still has
            # a key was never altered. Neither needs writing.
            continue
        for child_key in child.serialise(store):
            yield child_key
    out = [
        "chknode:\n",
        "%d\n" % self._maximum_size,
        "%d\n" % self._key_width,
        "%d\n" % self._len,
        ]
    search_prefix = self._search_prefix
    if search_prefix is None:
        raise AssertionError("_search_prefix should not be None")
    out.append('%s\n' % (search_prefix,))
    # Each item line is written without the shared search prefix.
    skip = len(search_prefix)
    for item_prefix, child in sorted(self._items.items()):
        if type(child) is StaticTuple:
            ref = child[0]
        else:
            ref = child._key[0]
        entry = "%s\x00%s\n" % (item_prefix, ref)
        if not entry.startswith(search_prefix):
            raise AssertionError("prefixes mismatch: %s must start with %s"
                % (entry, search_prefix))
        out.append(entry[skip:])
    sha1, _, _ = store.add_lines((None,), (), out)
    self._key = StaticTuple("sha1:" + sha1,).intern()
    _get_cache().add(self._key, ''.join(out))
    yield self._key

1324

1325

def _search_key(self, key):
    """Return the serialised key for key in this node.

    Search keys are fixed width: the output of self._search_key_func is
    padded with NUL bytes and then cut to exactly self._node_width.
    """
    raw = self._search_key_func(key)
    width = self._node_width
    padded = raw + '\x00' * width
    return padded[:width]

1330

1331

def _search_prefix_filter(self, key):
    """Serialise key for use as a prefix filter in iteritems.

    Unlike _search_key, the result is only truncated to self._node_width;
    it is never padded.
    """
    serialised = self._search_key_func(key)
    return serialised[:self._node_width]

1334

1335

def _split(self, offset):
    """Split this node into smaller nodes starting at offset.

    :param offset: The offset to start the new child nodes at.
    :return: An iterable of (prefix, node) tuples. prefix is a byte
        prefix for reaching node.
    """
    if offset < self._node_width:
        # Nothing is produced for offsets inside this node's own width;
        # the walk over the items is a no-op.
        for _prefix, _child in self._items.items():
            pass
        return
    # At or beyond our width: hand the split down to every child.
    for child in self._items.values():
        for piece in child._split(offset):
            yield piece

1349

1350

def refs(self):
    """Return the references to other CHK's held by this node.

    :return: A list with one entry per item: the item itself when it is a
        StaticTuple, otherwise the result of its key() method.
    :raises AssertionError: If this node has no key.
    """
    if self._key is None:
        raise AssertionError("unserialised nodes have no refs.")
    found = []
    for child in self._items.itervalues():
        if type(child) is not StaticTuple:
            child = child.key()
        found.append(child)
    return found

1361

1362

def _compute_search_prefix(self, extra_key=None):
    """Recompute, store and return the unique key prefix for this node.

    :param extra_key: Accepted but not used.
    :return: A bytestring of the longest search key prefix that is
        unique within this node.
    """
    prefix = self.common_prefix_for_keys(self._items)
    self._search_prefix = prefix
    return prefix

1370

1371

def unmap(self, store, key, check_remap=True):
    """Remove key from this node and its children.

    :param store: Passed through to self._iter_nodes(), the child's
        unmap() and self._check_remap().
    :param key: The key to remove.
    :param check_remap: When True (the default), finish by returning
        self._check_remap(store), unless an earlier return applies.
    :return: The node that should take this node's place: the single
        remaining item when only one is left, otherwise self or the
        result of self._check_remap(store).
    :raises AssertionError: If this node has no items.
    :raises KeyError: If no child matches key. Any exception raised by the
        child's unmap() also propagates, and in that case this node's
        cached length and key are left untouched.
    """
    if not len(self._items):
        raise AssertionError("can't unmap in an empty InternalNode.")
    children = [node for node, _
                      in self._iter_nodes(store, key_filter=[key])]
    if children:
        child = children[0]
    else:
        raise KeyError(key)
    # Let the child remove the key before touching our own bookkeeping: if
    # it raises (for example because the key is not actually present),
    # self._len must not have been decremented already.
    unmapped = child.unmap(store, key)
    self._len -= 1
    # Our content changed, so any previously computed key is stale.
    self._key = None
    search_key = self._search_key(key)
    if len(unmapped) == 0:
        # All child nodes are gone, remove the child:
        del self._items[search_key]
        unmapped = None
    else:
        # Stash the returned node
        self._items[search_key] = unmapped
    if len(self._items) == 1:
        # this node is no longer needed:
        return self._items.values()[0]
    if type(unmapped) is InternalNode:
        return self
    if check_remap:
        return self._check_remap(store)
    else:
        return self

1401

1402

def _check_remap(self, store):
    """Check if all keys contained by children fit in a single LeafNode.

    :param store: A store to use for reading more nodes
    :return: Either self, or a new LeafNode which should replace self.
    """
    # When a rebuild is worth attempting:
    # 1) A key is being removed, so the child nodes are shrinking by some
    #    extent.
    # 2) If every child is a LeafNode they might combine into one
    #    LeafNode, which can then replace this internal node entirely.
    # 3) If even one child is an InternalNode, we assume it has already
    #    established that its own children cannot collapse, so those
    #    nodes plus ours cannot collapse either and we can stop early.
    #
    # TODO: Another alternative is to check the total size of all known
    #       LeafNodes. A formula giving the final size without reading
    #       more children would be nice, but nodes pull out the common
    #       prefix of each key, so adding one key can change the size by
    #       more than the length of that key. For now everything is added
    #       to a fresh leaf until it would split, which is known to give
    #       the right answer.
    candidate = LeafNode(search_key_func=self._search_key_func)
    candidate.set_maximum_size(self._maximum_size)
    candidate._key_width = self._key_width
    # Why a batch_size of 16:
    # a) In testing, a 4k page held 14 times, so with more than 16 leaf
    #    nodes a single new leaf is unlikely to hold them; this still
    #    allows for 1 round trip.
    # b) With 16-way fan out, a single round trip is still enough.
    # c) With 255-way fan out, reading all 255 would destroy the page
    #    cache just to learn that the remap is not needed.
    for child, _ in self._iter_nodes(store, batch_size=16):
        if type(child) is InternalNode:
            # Without looking at any leaf nodes, we are sure
            return self
        for item_key, item_value in child._items.iteritems():
            if candidate._map_no_split(item_key, item_value):
                # A true result stops the attempt; self stays in place.
                return self
    trace.mutter("remap generated a new LeafNode")
    return candidate

1449

1450

1451

def _deserialise(bytes, key, search_key_func):
    """Helper for repositorydetails - convert bytes to a node.

    :param bytes: The serialised node; its leading line selects the type.
    :param key: The key the bytes were stored under.
    :param search_key_func: Passed on to the node's deserialise().
    :return: A LeafNode for "chkleaf:" content, an InternalNode for
        "chknode:" content.
    :raises AssertionError: If the content starts with neither marker.
    """
    if bytes.startswith("chkleaf:\n"):
        return LeafNode.deserialise(bytes, key,
                                    search_key_func=search_key_func)
    if bytes.startswith("chknode:\n"):
        return InternalNode.deserialise(bytes, key,
                                        search_key_func=search_key_func)
    raise AssertionError("Unknown node type.")

1461

1462

1463

class CHKMapDifference(object):
    """Iterate the stored pages and key,value pairs for (new - old).

    This class provides a generator over the stored CHK pages and the
    (key, value) pairs that are in any of the new maps and not in any of the
    old maps.

    Note that it may yield chk pages that are common (especially root nodes),
    but it won't yield (key,value) pairs that are common.
    """

    def __init__(self, store, new_root_keys, old_root_keys,
                 search_key_func, pb=None):
        """Record the inputs and set up empty bookkeeping.

        :param store: Object whose get_record_stream() is used to read
            pages.
        :param new_root_keys: Root keys of the "new" maps.
        :param old_root_keys: Root keys of the "old" maps.
        :param search_key_func: Passed to _deserialise() and used to turn
            item keys into prefixes.
        :param pb: Optional object whose tick() is called once per record
            read.
        """
        # TODO: Should we add a StaticTuple barrier here? It would be nice to
        #       force callers to use StaticTuple, because there will often be
        #       lots of keys passed in here. And even if we cast it locally,
        #       that just means that we will have *both* a StaticTuple and a
        #       tuple() in memory, referring to the same object. (so a net
        #       increase in memory, not a decrease.)
        self._store = store
        self._new_root_keys = new_root_keys
        self._old_root_keys = old_root_keys
        self._pb = pb
        # All uninteresting chks that we have seen. By the time they are added
        # here, they should be either fully ignored, or queued up for
        # processing
        # TODO: This might grow to a large size if there are lots of merge
        #       parents, etc. However, it probably doesn't scale to O(history)
        #       like _processed_new_refs does.
        self._all_old_chks = set(self._old_root_keys)
        # All items that we have seen from the old_root_keys
        self._all_old_items = set()
        # These are interesting items which were either read, or already in the
        # interesting queue (so we don't need to walk them again)
        # TODO: processed_new_refs becomes O(all_chks), consider switching to
        #       SimpleSet here.
        self._processed_new_refs = set()
        self._search_key_func = search_key_func

        # The uninteresting and interesting nodes to be searched
        self._old_queue = []
        self._new_queue = []
        # Holds the (key, value) items found when processing the root nodes,
        # waiting for the uninteresting nodes to be walked
        self._new_item_queue = []
        self._state = None

    def _read_nodes_from_store(self, keys):
        """Read and deserialise the pages for keys.

        :param keys: Keys to request from the store.
        :return: A generator of (record, node, prefix_refs, items). For an
            InternalNode, prefix_refs is the node's items and items is
            empty; for any other node it is the other way around.
        :raises errors.NoSuchRevision: If a record is absent.
        """
        # We chose not to use _get_cache(), because we think in
        # terms of records to be yielded. Also, we expect to touch each page
        # only 1 time during this code. (We may want to evaluate saving the
        # raw bytes into the page cache, which would allow a working tree
        # update after the fetch to not have to read the bytes again.)
        as_st = StaticTuple.from_sequence
        stream = self._store.get_record_stream(keys, 'unordered', True)
        for record in stream:
            if self._pb is not None:
                self._pb.tick()
            if record.storage_kind == 'absent':
                raise errors.NoSuchRevision(self._store, record.key)
            bytes = record.get_bytes_as('fulltext')
            node = _deserialise(bytes, record.key,
                                search_key_func=self._search_key_func)
            if type(node) is InternalNode:
                # Note we don't have to do node.refs() because we know that
                # there are no children that have been pushed into this node
                # Note: Using as_st() here seemed to save 1.2MB, which would
                #       indicate that we keep 100k prefix_refs around while
                #       processing. They *should* be shorter lived than that...
                #       It does cost us ~10s of processing time
                #prefix_refs = [as_st(item) for item in node._items.iteritems()]
                prefix_refs = node._items.items()
                items = []
            else:
                prefix_refs = []
                # Note: We don't use a StaticTuple here. Profiling showed a
                #       minor memory improvement (0.8MB out of 335MB peak 0.2%)
                #       But a significant slowdown (15s / 145s, or 10%)
                items = node._items.items()
            yield record, node, prefix_refs, items

    def _read_old_roots(self):
        """Read the old root pages and note what they reference.

        Child references not seen before are added to self._all_old_chks
        and every item found is added to self._all_old_items.

        :return: The list of (prefix, ref) pairs that were not already
            known, for later use by _enqueue_old().
        """
        old_chks_to_enqueue = []
        all_old_chks = self._all_old_chks
        for record, node, prefix_refs, items in \
                self._read_nodes_from_store(self._old_root_keys):
            # Uninteresting node
            prefix_refs = [p_r for p_r in prefix_refs
                                if p_r[1] not in all_old_chks]
            new_refs = [p_r[1] for p_r in prefix_refs]
            all_old_chks.update(new_refs)
            # TODO: This might be a good time to turn items into StaticTuple
            #       instances and possibly intern them. However, this does not
            #       impact 'initial branch' performance, so I'm not worrying
            #       about this yet
            self._all_old_items.update(items)
            # Queue up the uninteresting references
            # Don't actually put them in the 'to-read' queue until we have
            # finished checking the interesting references
            old_chks_to_enqueue.extend(prefix_refs)
        return old_chks_to_enqueue

    def _enqueue_old(self, new_prefixes, old_chks_to_enqueue):
        """Queue the old references that overlap the new prefixes.

        :param new_prefixes: Container of prefixes seen on the new side.
        :param old_chks_to_enqueue: Iterable of (prefix, ref) pairs. ref is
            appended to self._old_queue when some leading slice of prefix
            is in new_prefixes.
        """
        # At this point, we have read all the uninteresting and interesting
        # items, so we can queue up the uninteresting stuff, knowing that we've
        # handled the interesting ones
        for prefix, ref in old_chks_to_enqueue:
            not_interesting = True
            # Try the full prefix first, then progressively shorter ones.
            for i in xrange(len(prefix), 0, -1):
                if prefix[:i] in new_prefixes:
                    not_interesting = False
                    break
            if not_interesting:
                # This prefix is not part of the remaining 'interesting set'
                continue
            self._old_queue.append(ref)

    def _read_all_roots(self):
        """Read the root pages.

        This is structured as a generator, so that the root records can be
        yielded up to whoever needs them without any buffering.
        """
        # This is the bootstrap phase
        if not self._old_root_keys:
            # With no old_root_keys we can just shortcut and be ready
            # for _flush_new_queue
            self._new_queue = list(self._new_root_keys)
            return
        old_chks_to_enqueue = self._read_old_roots()
        # filter out any root keys that are already known to be uninteresting
        new_keys = set(self._new_root_keys).difference(self._all_old_chks)
        # These are prefixes that are present in new_keys that we are
        # thinking to yield
        new_prefixes = set()
        # We are about to yield all of these, so we don't want them getting
        # added a second time
        processed_new_refs = self._processed_new_refs
        processed_new_refs.update(new_keys)
        for record, node, prefix_refs, items in \
                self._read_nodes_from_store(new_keys):
            # At this level, we now know all the uninteresting references
            # So we filter and queue up whatever is remaining
            prefix_refs = [p_r for p_r in prefix_refs
                           if p_r[1] not in self._all_old_chks
                              and p_r[1] not in processed_new_refs]
            refs = [p_r[1] for p_r in prefix_refs]
            new_prefixes.update([p_r[0] for p_r in prefix_refs])
            self._new_queue.extend(refs)
            # TODO: We can potentially get multiple items here, however the
            #       current design allows for this, as callers will do the work
            #       to make the results unique. We might profile whether we
            #       gain anything by ensuring unique return values for items
            # TODO: This might be a good time to cast to StaticTuple, as
            #       self._new_item_queue will hold the contents of multiple
            #       records for an extended lifetime
            new_items = [item for item in items
                               if item not in self._all_old_items]
            self._new_item_queue.extend(new_items)
            new_prefixes.update([self._search_key_func(item[0])
                                 for item in new_items])
            processed_new_refs.update(refs)
            yield record
        # For new_prefixes we have the full length prefixes queued up.
        # However, we also need possible prefixes. (If we have a known ref to
        # 'ab', then we also need to include 'a'.) So expand the
        # new_prefixes to include all shorter prefixes
        for prefix in list(new_prefixes):
            new_prefixes.update([prefix[:i] for i in xrange(1, len(prefix))])
        self._enqueue_old(new_prefixes, old_chks_to_enqueue)

    def _flush_new_queue(self):
        """Walk everything queued on the new side.

        :return: A generator. It first yields (None, new_items) when queued
            items remain after filtering against the old items, then
            (record, items) for each page read while following references
            that are neither old nor already processed.
        """
        # No need to maintain the heap invariant anymore, just pull things out
        # and process them
        refs = set(self._new_queue)
        self._new_queue = []
        # First pass, flush all interesting items and convert to using direct refs
        all_old_chks = self._all_old_chks
        processed_new_refs = self._processed_new_refs
        all_old_items = self._all_old_items
        new_items = [item for item in self._new_item_queue
                           if item not in all_old_items]
        self._new_item_queue = []
        if new_items:
            yield None, new_items
        refs = refs.difference(all_old_chks)
        processed_new_refs.update(refs)
        while refs:
            # TODO: Using a SimpleSet for self._processed_new_refs and
            #       saved as much as 10MB of peak memory. However, it requires
            #       implementing a non-pyrex version.
            next_refs = set()
            next_refs_update = next_refs.update
            # Inlining _read_nodes_from_store improves 'bzr branch bzr.dev'
            # from 1m54s to 1m51s. Consider it.
            for record, _, p_refs, items in self._read_nodes_from_store(refs):
                if all_old_items:
                    # using the 'if' check saves about 145s => 141s, when
                    # streaming initial branch of Launchpad data.
                    items = [item for item in items
                             if item not in all_old_items]
                yield record, items
                next_refs_update([p_r[1] for p_r in p_refs])
                del p_refs
            # set1.difference(set/dict) walks all of set1, and checks if it
            # exists in 'other'.
            # set1.difference(iterable) walks all of iterable, and does a
            # 'difference_update' on a clone of set1. Pick wisely based on the
            # expected sizes of objects.
            # in our case it is expected that 'new_refs' will always be quite
            # small.
            next_refs = next_refs.difference(all_old_chks)
            next_refs = next_refs.difference(processed_new_refs)
            processed_new_refs.update(next_refs)
            refs = next_refs

    def _process_next_old(self):
        """Read every page in the old queue and queue their unseen children.

        Items found are added to self._all_old_items; child references not
        yet in self._all_old_chks are appended to self._old_queue and
        recorded as seen.
        """
        # Since we don't filter uninteresting any further than during
        # _read_all_roots, process the whole queue in a single pass.
        refs = self._old_queue
        self._old_queue = []
        all_old_chks = self._all_old_chks
        # Rebinding 'refs' in the loop body does not change what is being
        # read: the original list was already handed to the generator.
        for record, _, prefix_refs, items in self._read_nodes_from_store(refs):
            # TODO: Use StaticTuple here?
            self._all_old_items.update(items)
            refs = [r for _,r in prefix_refs if r not in all_old_chks]
            self._old_queue.extend(refs)
            all_old_chks.update(refs)

    def _process_queues(self):
        """Drain the old queue, then return the _flush_new_queue() generator."""
        while self._old_queue:
            self._process_next_old()
        return self._flush_new_queue()

    def process(self):
        """Yield (record, items) pairs for the whole difference.

        Root records come first, each paired with an empty list; the pairs
        produced by _process_queues() follow.
        """
        for record in self._read_all_roots():
            yield record, []
        for record, items in self._process_queues():
            yield record, items

1702

1703

1704

def iter_interesting_nodes(store, interesting_root_keys,
                           uninteresting_root_keys, pb=None):
    """Given root keys, find interesting nodes.

    Nodes referenced by interesting_root_keys are evaluated; those also
    referenced from uninteresting_root_keys are not considered
    interesting. The search key function is taken from
    store._search_key_func.

    :param interesting_root_keys: keys which should be part of the
        "interesting" nodes (which will be yielded)
    :param uninteresting_root_keys: keys which should be filtered out of the
        result set.
    :param pb: Optional object handed on to CHKMapDifference.
    :return: Yield
        (interesting record, {interesting key:values})
    """
    differ = CHKMapDifference(
        store,
        interesting_root_keys,
        uninteresting_root_keys,
        search_key_func=store._search_key_func,
        pb=pb)
    return differ.process()

1723

1724

1725

# Prefer the compiled extension; if it cannot be imported, report the
# failure and fall back to the pure Python module exposing the same names.
try:
    from bzrlib._chk_map_pyx import (
        _bytes_to_text_key,
        _search_key_16,
        _search_key_255,
        _deserialise_leaf_node,
        _deserialise_internal_node,
        )
except ImportError, e:
    osutils.failed_to_load_extension(e)
    from bzrlib._chk_map_py import (
        _bytes_to_text_key,
        _search_key_16,
        _search_key_255,
        _deserialise_leaf_node,
        _deserialise_internal_node,
        )
# Register whichever implementation was loaded under its public name.
search_key_registry.register('hash-16-way', _search_key_16)
search_key_registry.register('hash-255-way', _search_key_255)

1744

1745

1746

def _check_key(key):
    """Helper function to assert that a key is properly formatted.

    This generally shouldn't be used in production code, but it can be helpful
    to debug problems.

    :param key: The object to check.
    :raises TypeError: If key is not a StaticTuple, or its only element is
        not a str.
    :raises ValueError: If key does not hold exactly one element, or that
        element does not start with 'sha1:'.
    """
    key_type = type(key)
    if key_type is not StaticTuple:
        raise TypeError('key %r is not StaticTuple but %s' % (key, key_type))
    width = len(key)
    if width != 1:
        raise ValueError('key %r should have length 1, not %d' % (key, width,))
    first = key[0]
    first_type = type(first)
    if first_type is not str:
        raise TypeError('key %r should hold a str, not %r'
                        % (key, first_type))
    if not first.startswith('sha1:'):
        raise ValueError('key %r should point to a sha1:' % (key,))

1761

1762

Older »