~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/btree_index.py

Committer: Robert Collins
Date: 2010-05-06 23:54:05 UTC
mto: This revision was merged to the branch mainline in revision 5223.
Revision ID: robertc@robertcollins.net-20100506235405-wii4elupfhzl3jvy

Add __str__ to the new helper classes.

files added:
.testr.conf

MANIFEST.in

NEWS-template.txt

README_BDIST_RPM

apport

apport/README

apport/bzr-crashdb.conf

apport/source_bzr.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/benchmarks/bench_tags.py

bzrlib/bencode.py

bzrlib/btree_index.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cleanup.py

bzrlib/cmdline.py

bzrlib/crash.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/location-alias.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/help_topics/es

bzrlib/help_topics/es/conflict-types.txt

bzrlib/inventory_delta.py

bzrlib/lru_cache.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/plugins/news_merge

bzrlib/plugins/news_merge/README

bzrlib/plugins/news_merge/__init__.py

bzrlib/plugins/news_merge/news_merge.py

bzrlib/plugins/news_merge/parser.py

bzrlib/plugins/news_merge/tests

bzrlib/plugins/news_merge/tests/__init__.py

bzrlib/plugins/news_merge/tests/test_news_merge.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/rename_map.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/static_tuple.py

bzrlib/switch.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_rmbranch.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/commands/test_revert.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/https_server.py

bzrlib/tests/matchers.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_bzrdir_colo

bzrlib/tests/per_bzrdir_colo/__init__.py

bzrlib/tests/per_bzrdir_colo/test_supported.py

bzrlib/tests/per_bzrdir_colo/test_unsupported.py

bzrlib/tests/per_foreign_vcs

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_foreign_vcs/test_repository.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_locking.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/test__annotator.py

bzrlib/tests/test__bencode.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_cleanup.py

bzrlib/tests/test_cmdline.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_export.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_import_tariff.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_matchers.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_patches_data/binary-after-normal.patch

bzrlib/tests/test_patches_data/binary.patch

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_script.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_server.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/transport/ftp

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/log.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/util/bencode.py

bzrlib/version_info_formats/format_custom.py

bzrlib/views.py

bzrlib/xml5.py

bzrlib/xml6.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/debian

contrib/debian/default

contrib/debian/init.d

doc/Bazaar-Logo-For-Manuals.png

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr-doc.css

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/apport.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/conf.py

doc/developers/content-filtering.txt

doc/developers/contribution-quickstart.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/ec2.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/index-plain.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/miscellaneous-notes.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/principles.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/specifications.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/win32_build_setup.txt

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/advanced.txt

doc/en/admin-guide/backup.txt

doc/en/admin-guide/code-browsing.txt

doc/en/admin-guide/hooks-plugins.txt

doc/en/admin-guide/index-plain.txt

doc/en/admin-guide/index.txt

doc/en/admin-guide/integration.txt

doc/en/admin-guide/introduction.txt

doc/en/admin-guide/migration.txt

doc/en/admin-guide/other-setups.txt

doc/en/admin-guide/security.txt

doc/en/admin-guide/simple-setups.txt

doc/en/admin-guide/upgrade.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/quick-reference/index.txt

doc/en/tutorials

doc/en/tutorials/index.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference/readme.txt

doc/en/whats-new

doc/en/whats-new/whats-new-in-2.1.txt

doc/en/whats-new/whats-new-in-2.2.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ja.txt

doc/index.ru.txt

doc/ja

doc/ja/_static

doc/ja/_static/bzr icon 16.png

doc/ja/_static/bzr.ico

doc/ja/_templates

doc/ja/conf.py

doc/ja/index.txt

doc/ja/mini-tutorial

doc/ja/mini-tutorial/index.txt

doc/ja/tutorials

doc/ja/tutorials/centralized_workflow.txt

doc/ja/tutorials/index.txt

doc/ja/tutorials/tutorial.txt

doc/ja/tutorials/using_bazaar_with_launchpad.txt

doc/ja/upgrade-guide

doc/ja/upgrade-guide/data_migration.txt

doc/ja/upgrade-guide/index.txt

doc/ja/upgrade-guide/overview.txt

doc/ja/upgrade-guide/tips_and_tricks.txt

doc/ja/user-guide

doc/ja/user-guide/adv_merging.txt

doc/ja/user-guide/annotating_changes.txt

doc/ja/user-guide/bazaar_workflows.txt

doc/ja/user-guide/branching_a_project.txt

doc/ja/user-guide/browsing_history.txt

doc/ja/user-guide/bug_trackers.txt

doc/ja/user-guide/bzrtools_plugin.txt

doc/ja/user-guide/central_intro.txt

doc/ja/user-guide/configuring_bazaar.txt

doc/ja/user-guide/controlling_registration.txt

doc/ja/user-guide/core_concepts.txt

doc/ja/user-guide/distributed_intro.txt

doc/ja/user-guide/entering_commands.txt

doc/ja/user-guide/filtered_views.txt

doc/ja/user-guide/getting_help.txt

doc/ja/user-guide/hooks.txt

doc/ja/user-guide/http_smart_server.txt

doc/ja/user-guide/images

doc/ja/user-guide/images/workflows_centralized.png

doc/ja/user-guide/images/workflows_centralized.svg

doc/ja/user-guide/images/workflows_gatekeeper.png

doc/ja/user-guide/images/workflows_gatekeeper.svg

doc/ja/user-guide/images/workflows_localcommit.png

doc/ja/user-guide/images/workflows_localcommit.svg

doc/ja/user-guide/images/workflows_peer.png

doc/ja/user-guide/images/workflows_peer.svg

doc/ja/user-guide/images/workflows_pqm.png

doc/ja/user-guide/images/workflows_pqm.svg

doc/ja/user-guide/images/workflows_shared.png

doc/ja/user-guide/images/workflows_shared.svg

doc/ja/user-guide/images/workflows_single.png

doc/ja/user-guide/images/workflows_single.svg

doc/ja/user-guide/index.txt

doc/ja/user-guide/installing_bazaar.txt

doc/ja/user-guide/introducing_bazaar.txt

doc/ja/user-guide/merging_changes.txt

doc/ja/user-guide/organizing_branches.txt

doc/ja/user-guide/organizing_your_workspace.txt

doc/ja/user-guide/part2_intro.txt

doc/ja/user-guide/partner_intro.txt

doc/ja/user-guide/plugins.txt

doc/ja/user-guide/publishing_a_branch.txt

doc/ja/user-guide/recording_changes.txt

doc/ja/user-guide/releasing_a_project.txt

doc/ja/user-guide/resolving_conflicts.txt

doc/ja/user-guide/reusing_a_checkout.txt

doc/ja/user-guide/reviewing_changes.txt

doc/ja/user-guide/sending_changes.txt

doc/ja/user-guide/server.txt

doc/ja/user-guide/setting_up_email.txt

doc/ja/user-guide/shared_repository_layouts.txt

doc/ja/user-guide/shelving_changes.txt

doc/ja/user-guide/solo_intro.txt

doc/ja/user-guide/specifying_revisions.txt

doc/ja/user-guide/stacked.txt

doc/ja/user-guide/starting_a_project.txt

doc/ja/user-guide/svn_plugin.txt

doc/ja/user-guide/undoing_mistakes.txt

doc/ja/user-guide/using_aliases.txt

doc/ja/user-guide/using_checkouts.txt

doc/ja/user-guide/using_gatekeepers.txt

doc/ja/user-guide/version_info.txt

doc/ja/user-guide/web_browsing.txt

doc/ja/user-guide/working_offline_central.txt

doc/ja/user-guide/writing_a_plugin.txt

doc/ja/user-guide/zen.txt

doc/ja/user-reference

doc/ja/user-reference/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

tools/check-newsbugs.py

tools/generate_release_notes.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-control.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/rst2pdf.py

tools/time_graph.py

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/run_script.py

files removed:
bzrlib/plugins/multiparent.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_escaped_store.py

bzrlib/textui.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/tests/test_bencode.py

bzrlib/weave_commands.py

bzrlib/xml6.py

contrib/fortune

doc/bazaar-vcs.org.kid

doc/developers/performance-contributing.txt

doc/en/developer-guide

doc/en/user-guide/index.txt

doc/en/user-reference/hooks.txt

doc/en/user-reference/index.txt

tools/biobench.py

tools/history2revfiles.py

tools/win32/survey.txt

files renamed:
bzrlib/_dirstate_helpers_c.h => bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_c.pyx => bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_knit_load_data_c.pyx => bzrlib/_knit_load_data_pyx.pyx

tools/doc_generate/ => bzrlib/doc_generate/

bzrlib/help_topics.py => bzrlib/help_topics/__init__.py

doc/en/user-guide/configuration.txt => bzrlib/help_topics/en/configuration.txt

doc/en/user-guide/conflicts.txt => bzrlib/help_topics/en/conflict-types.txt

bzrlib/plugins/launchpad/lp_indirect.py => bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/test_lp_indirect.py => bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/tests/HttpServer.py => bzrlib/tests/http_server.py

bzrlib/tests/HTTPTestUtil.py => bzrlib/tests/http_utils.py

bzrlib/tests/branch_implementations/ => bzrlib/tests/per_branch/

bzrlib/tests/bzrdir_implementations/ => bzrlib/tests/per_bzrdir/

bzrlib/tests/interrepository_implementations/ => bzrlib/tests/per_interrepository/

bzrlib/tests/intertree_implementations/ => bzrlib/tests/per_intertree/

bzrlib/tests/inventory_implementations/ => bzrlib/tests/per_inventory/

bzrlib/tests/repository_implementations/ => bzrlib/tests/per_repository/

bzrlib/tests/test_transport_implementations.py => bzrlib/tests/per_transport.py

bzrlib/tests/tree_implementations/ => bzrlib/tests/per_tree/

bzrlib/tests/test_versionedfile.py => bzrlib/tests/per_versionedfile.py

bzrlib/tests/workingtree_implementations/ => bzrlib/tests/per_workingtree/

bzrlib/tests/test_revisionnamespaces.py => bzrlib/tests/test_revisionspec.py

bzrlib/transport/ftp.py => bzrlib/transport/ftp/__init__.py

bzrlib/util/bencode.py => bzrlib/util/_bencode_py.py

bzrlib/xml5.py => bzrlib/xml8.py

doc/developers/knitpack.txt => doc/developers/packrepo.txt

doc/en/quick-reference/Makefile => doc/en/_static/en/Makefile

doc/en/quick-reference/quick-start-summary.svg => doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/user-guide/centralized_workflow.txt => doc/en/tutorials/centralized_workflow.txt

doc/en/user-guide/tutorial.txt => doc/en/tutorials/tutorial.txt

generate_docs.py => tools/generate_docs.py

files modified:
.bzrignore

INSTALL

Makefile

NEWS

README

bzr.ico

bzrlib/__init__.py

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/simplemapi.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml7.py

bzrlib/xml_serializer.py

contrib/newinventory.py

contrib/pwclient.full

doc/default.css

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/last-modified.txt

doc/developers/merge-scaling.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/profiling.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/update.txt

doc/en/mini-tutorial/index.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/version_info.txt

doc/index.txt

profile_imports.py

setup.py

tools/bzr_epydoc_uid.py

tools/convertfile.py

tools/convertinv.py

tools/rst2html.py

tools/weavebench.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/info.txt

tools/win32/ostools.py

Show diffs side-by-side

added added

removed removed

bzrlib/btree_index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""B+Tree indices"""

import cStringIO

from bisect import bisect_right

import math

import tempfile

import zlib

from bzrlib import (

chunk_writer,

debug,

errors,

fifo_cache,

index,

lru_cache,

osutils,

static_tuple,

trace,

)

from bzrlib.index import _OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS, _OPTION_LEN

from bzrlib.transport import get_transport

_BTSIGNATURE = "B+Tree Graph Index 2\n"

_OPTION_ROW_LENGTHS = "row_lengths="

_LEAF_FLAG = "type=leaf\n"

_INTERNAL_FLAG = "type=internal\n"

_INTERNAL_OFFSET = "offset="

_RESERVED_HEADER_BYTES = 120

_PAGE_SIZE = 4096

# 4K per page: 4MB - 1000 entries

_NODE_CACHE_SIZE = 1000

class _BuilderRow(object):

"""The stored state accumulated while writing out a row in the index.

:ivar spool: A temporary file used to accumulate nodes for this row

in the tree.

:ivar nodes: The count of nodes emitted so far.

"""

def __init__(self):

"""Create a _BuilderRow."""

self.nodes = 0

self.spool = None# tempfile.TemporaryFile(prefix='bzr-index-row-')

self.writer = None

def finish_node(self, pad=True):

byte_lines, _, padding = self.writer.finish()

if self.nodes == 0:

self.spool = cStringIO.StringIO()

# padded note:

self.spool.write("\x00" * _RESERVED_HEADER_BYTES)

elif self.nodes == 1:

# We got bigger than 1 node, switch to a temp file

spool = tempfile.TemporaryFile(prefix='bzr-index-row-')

spool.write(self.spool.getvalue())

self.spool = spool

skipped_bytes = 0

if not pad and padding:

del byte_lines[-1]

skipped_bytes = padding

self.spool.writelines(byte_lines)

remainder = (self.spool.tell() + skipped_bytes) % _PAGE_SIZE

if remainder != 0:

raise AssertionError("incorrect node length: %d, %d"

% (self.spool.tell(), remainder))

self.nodes += 1

self.writer = None

class _InternalBuilderRow(_BuilderRow):

"""The stored state accumulated while writing out internal rows."""

def finish_node(self, pad=True):

if not pad:

raise AssertionError("Must pad internal nodes only.")

_BuilderRow.finish_node(self)

100

101

class _LeafBuilderRow(_BuilderRow):

102

"""The stored state accumulated while writing out a leaf rows."""

103

104

105

class BTreeBuilder(index.GraphIndexBuilder):

106

"""A Builder for B+Tree based Graph indices.

107

108

The resulting graph has the structure:

109

110

_SIGNATURE OPTIONS NODES

111

_SIGNATURE := 'B+Tree Graph Index 1' NEWLINE

112

OPTIONS := REF_LISTS KEY_ELEMENTS LENGTH

113

REF_LISTS := 'node_ref_lists=' DIGITS NEWLINE

114

KEY_ELEMENTS := 'key_elements=' DIGITS NEWLINE

115

LENGTH := 'len=' DIGITS NEWLINE

116

ROW_LENGTHS := 'row_lengths' DIGITS (COMMA DIGITS)*

117

NODES := NODE_COMPRESSED*

118

NODE_COMPRESSED:= COMPRESSED_BYTES{4096}

119

NODE_RAW := INTERNAL | LEAF

120

INTERNAL := INTERNAL_FLAG POINTERS

121

LEAF := LEAF_FLAG ROWS

122

KEY_ELEMENT := Not-whitespace-utf8

123

KEY := KEY_ELEMENT (NULL KEY_ELEMENT)*

124

ROWS := ROW*

125

ROW := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

126

ABSENT := 'a'

127

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

128

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

129

REFERENCE := KEY

130

VALUE := no-newline-no-null-bytes

131

"""

132

133

def __init__(self, reference_lists=0, key_elements=1, spill_at=100000):

134

"""See GraphIndexBuilder.__init__.

135

136

:param spill_at: Optional parameter controlling the maximum number

137

of nodes that BTreeBuilder will hold in memory.

138

"""

139

index.GraphIndexBuilder.__init__(self, reference_lists=reference_lists,

140

key_elements=key_elements)

141

self._spill_at = spill_at

142

self._backing_indices = []

143

# A map of {key: (node_refs, value)}

144

self._nodes = {}

145

# Indicate it hasn't been built yet

146

self._nodes_by_key = None

147

self._optimize_for_size = False

148

149

def add_node(self, key, value, references=()):

150

"""Add a node to the index.

151

152

If adding the node causes the builder to reach its spill_at threshold,

153

disk spilling will be triggered.

154

155

:param key: The key. keys are non-empty tuples containing

156

as many whitespace-free utf8 bytestrings as the key length

157

defined for this index.

158

:param references: An iterable of iterables of keys. Each is a

159

reference to another key.

160

:param value: The value to associate with the key. It may be any

161

bytes as long as it does not contain \0 or \n.

162

"""

163

# Ensure that 'key' is a StaticTuple

164

key = static_tuple.StaticTuple.from_sequence(key).intern()

165

# we don't care about absent_references

166

node_refs, _ = self._check_key_ref_value(key, references, value)

167

if key in self._nodes:

168

raise errors.BadIndexDuplicateKey(key, self)

169

self._nodes[key] = static_tuple.StaticTuple(node_refs, value)

170

if self._nodes_by_key is not None and self._key_length > 1:

171

self._update_nodes_by_key(key, value, node_refs)

172

if len(self._nodes) < self._spill_at:

173

return

174

self._spill_mem_keys_to_disk()

175

176

def _spill_mem_keys_to_disk(self):

177

"""Write the in memory keys down to disk to cap memory consumption.

178

179

If we already have some keys written to disk, we will combine them so

180

as to preserve the sorted order. The algorithm for combining uses

181

powers of two. So on the first spill, write all mem nodes into a

182

single index. On the second spill, combine the mem nodes with the nodes

183

on disk to create a 2x sized disk index and get rid of the first index.

184

On the third spill, create a single new disk index, which will contain

185

the mem nodes, and preserve the existing 2x sized index. On the fourth,

186

combine mem with the first and second indexes, creating a new one of

187

size 4x. On the fifth create a single new one, etc.

188

"""

189

if self._combine_backing_indices:

190

(new_backing_file, size,

191

backing_pos) = self._spill_mem_keys_and_combine()

192

else:

193

new_backing_file, size = self._spill_mem_keys_without_combining()

194

# Note: The transport here isn't strictly needed, because we will use

195

# direct access to the new_backing._file object

196

new_backing = BTreeGraphIndex(get_transport('.'), '<temp>', size)

197

# GC will clean up the file

198

new_backing._file = new_backing_file

199

if self._combine_backing_indices:

200

if len(self._backing_indices) == backing_pos:

201

self._backing_indices.append(None)

202

self._backing_indices[backing_pos] = new_backing

203

for backing_pos in range(backing_pos):

204

self._backing_indices[backing_pos] = None

205

else:

206

self._backing_indices.append(new_backing)

207

self._nodes = {}

208

self._nodes_by_key = None

209

210

def _spill_mem_keys_without_combining(self):

211

return self._write_nodes(self._iter_mem_nodes(), allow_optimize=False)

212

213

def _spill_mem_keys_and_combine(self):

214

iterators_to_combine = [self._iter_mem_nodes()]

215

pos = -1

216

for pos, backing in enumerate(self._backing_indices):

217

if backing is None:

218

pos -= 1

219

break

220

iterators_to_combine.append(backing.iter_all_entries())

221

backing_pos = pos + 1

222

new_backing_file, size = \

223

self._write_nodes(self._iter_smallest(iterators_to_combine),

224

allow_optimize=False)

225

return new_backing_file, size, backing_pos

226

227

def add_nodes(self, nodes):

228

"""Add nodes to the index.

229

230

:param nodes: An iterable of (key, node_refs, value) entries to add.

231

"""

232

if self.reference_lists:

233

for (key, value, node_refs) in nodes:

234

self.add_node(key, value, node_refs)

235

else:

236

for (key, value) in nodes:

237

self.add_node(key, value)

238

239

def _iter_mem_nodes(self):

240

"""Iterate over the nodes held in memory."""

241

nodes = self._nodes

242

if self.reference_lists:

243

for key in sorted(nodes):

244

references, value = nodes[key]

245

yield self, key, value, references

246

else:

247

for key in sorted(nodes):

248

references, value = nodes[key]

249

yield self, key, value

250

251

def _iter_smallest(self, iterators_to_combine):

252

if len(iterators_to_combine) == 1:

253

for value in iterators_to_combine[0]:

254

yield value

255

return

256

current_values = []

257

for iterator in iterators_to_combine:

258

try:

259

current_values.append(iterator.next())

260

except StopIteration:

261

current_values.append(None)

262

last = None

263

while True:

264

# Decorate candidates with the value to allow 2.4's min to be used.

265

candidates = [(item[1][1], item) for item

266

in enumerate(current_values) if item[1] is not None]

267

if not len(candidates):

268

return

269

selected = min(candidates)

270

# undecorate back to (pos, node)

271

selected = selected[1]

272

if last == selected[1][1]:

273

raise errors.BadIndexDuplicateKey(last, self)

274

last = selected[1][1]

275

# Yield, with self as the index

276

yield (self,) + selected[1][1:]

277

pos = selected[0]

278

try:

279

current_values[pos] = iterators_to_combine[pos].next()

280

except StopIteration:

281

current_values[pos] = None

282

283

def _add_key(self, string_key, line, rows, allow_optimize=True):

284

"""Add a key to the current chunk.

285

286

:param string_key: The key to add.

287

:param line: The fully serialised key and value.

288

:param allow_optimize: If set to False, prevent setting the optimize

289

flag when writing out. This is used by the _spill_mem_keys_to_disk

290

functionality.

291

"""

292

if rows[-1].writer is None:

293

# opening a new leaf chunk;

294

for pos, internal_row in enumerate(rows[:-1]):

295

# flesh out any internal nodes that are needed to

296

# preserve the height of the tree

297

if internal_row.writer is None:

298

length = _PAGE_SIZE

299

if internal_row.nodes == 0:

300

length -= _RESERVED_HEADER_BYTES # padded

301

if allow_optimize:

302

optimize_for_size = self._optimize_for_size

303

else:

304

optimize_for_size = False

305

internal_row.writer = chunk_writer.ChunkWriter(length, 0,

306

optimize_for_size=optimize_for_size)

307

internal_row.writer.write(_INTERNAL_FLAG)

308

internal_row.writer.write(_INTERNAL_OFFSET +

309

str(rows[pos + 1].nodes) + "\n")

310

# add a new leaf

311

length = _PAGE_SIZE

312

if rows[-1].nodes == 0:

313

length -= _RESERVED_HEADER_BYTES # padded

314

rows[-1].writer = chunk_writer.ChunkWriter(length,

315

optimize_for_size=self._optimize_for_size)

316

rows[-1].writer.write(_LEAF_FLAG)

317

if rows[-1].writer.write(line):

318

# this key did not fit in the node:

319

rows[-1].finish_node()

320

key_line = string_key + "\n"

321

new_row = True

322

for row in reversed(rows[:-1]):

323

# Mark the start of the next node in the node above. If it

324

# doesn't fit then propagate upwards until we find one that

325

# it does fit into.

326

if row.writer.write(key_line):

327

row.finish_node()

328

else:

329

# We've found a node that can handle the pointer.

330

new_row = False

331

break

332

# If we reached the current root without being able to mark the

333

# division point, then we need a new root:

334

if new_row:

335

# We need a new row

336

if 'index' in debug.debug_flags:

337

trace.mutter('Inserting new global row.')

338

new_row = _InternalBuilderRow()

339

reserved_bytes = 0

340

rows.insert(0, new_row)

341

# This will be padded, hence the -100

342

new_row.writer = chunk_writer.ChunkWriter(

343

_PAGE_SIZE - _RESERVED_HEADER_BYTES,

344

reserved_bytes,

345

optimize_for_size=self._optimize_for_size)

346

new_row.writer.write(_INTERNAL_FLAG)

347

new_row.writer.write(_INTERNAL_OFFSET +

348

str(rows[1].nodes - 1) + "\n")

349

new_row.writer.write(key_line)

350

self._add_key(string_key, line, rows, allow_optimize=allow_optimize)

351

352

def _write_nodes(self, node_iterator, allow_optimize=True):

353

"""Write node_iterator out as a B+Tree.

354

355

:param node_iterator: An iterator of sorted nodes. Each node should

356

match the output given by iter_all_entries.

357

:param allow_optimize: If set to False, prevent setting the optimize

358

flag when writing out. This is used by the _spill_mem_keys_to_disk

359

functionality.

360

:return: A file handle for a temporary file containing a B+Tree for

361

the nodes.

362

"""

363

# The index rows - rows[0] is the root, rows[1] is the layer under it

364

# etc.

365

rows = []

366

# forward sorted by key. In future we may consider topological sorting,

367

# at the cost of table scans for direct lookup, or a second index for

368

# direct lookup

369

key_count = 0

370

# A stack with the number of nodes of each size. 0 is the root node

371

# and must always be 1 (if there are any nodes in the tree).

372

self.row_lengths = []

373

# Loop over all nodes adding them to the bottom row

374

# (rows[-1]). When we finish a chunk in a row,

375

# propagate the key that didn't fit (comes after the chunk) to the

376

# row above, transitively.

377

for node in node_iterator:

378

if key_count == 0:

379

# First key triggers the first row

380

rows.append(_LeafBuilderRow())

381

key_count += 1

382

string_key, line = _btree_serializer._flatten_node(node,

383

self.reference_lists)

384

self._add_key(string_key, line, rows, allow_optimize=allow_optimize)

385

for row in reversed(rows):

386

pad = (type(row) != _LeafBuilderRow)

387

row.finish_node(pad=pad)

388

lines = [_BTSIGNATURE]

389

lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')

390

lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')

391

lines.append(_OPTION_LEN + str(key_count) + '\n')

392

row_lengths = [row.nodes for row in rows]

393

lines.append(_OPTION_ROW_LENGTHS + ','.join(map(str, row_lengths)) + '\n')

394

if row_lengths and row_lengths[-1] > 1:

395

result = tempfile.NamedTemporaryFile(prefix='bzr-index-')

396

else:

397

result = cStringIO.StringIO()

398

result.writelines(lines)

399

position = sum(map(len, lines))

400

root_row = True

401

if position > _RESERVED_HEADER_BYTES:

402

raise AssertionError("Could not fit the header in the"

403

" reserved space: %d > %d"

404

% (position, _RESERVED_HEADER_BYTES))

405

# write the rows out:

406

for row in rows:

407

reserved = _RESERVED_HEADER_BYTES # reserved space for first node

408

row.spool.flush()

409

row.spool.seek(0)

410

# copy nodes to the finalised file.

411

# Special case the first node as it may be prefixed

412

node = row.spool.read(_PAGE_SIZE)

413

result.write(node[reserved:])

414

if len(node) == _PAGE_SIZE:

415

result.write("\x00" * (reserved - position))

416

position = 0 # Only the root row actually has an offset

417

copied_len = osutils.pumpfile(row.spool, result)

418

if copied_len != (row.nodes - 1) * _PAGE_SIZE:

419

if type(row) != _LeafBuilderRow:

420

raise AssertionError("Incorrect amount of data copied"

421

" expected: %d, got: %d"

422

% ((row.nodes - 1) * _PAGE_SIZE,

423

copied_len))

424

result.flush()

425

size = result.tell()

426

result.seek(0)

427

return result, size

428

429

def finish(self):

430

"""Finalise the index.

431

432

:return: A file handle for a temporary file containing the nodes added

433

to the index.

434

"""

435

return self._write_nodes(self.iter_all_entries())[0]

436

437

def iter_all_entries(self):

438

"""Iterate over all keys within the index

439

440

:return: An iterable of (index, key, value, reference_lists). There is

441

no defined order for the result iteration - it will be in the most

442

efficient order for the index (in this case dictionary hash order).

443

"""

444

if 'evil' in debug.debug_flags:

445

trace.mutter_callsite(3,

446

"iter_all_entries scales with size of history.")

447

# Doing serial rather than ordered would be faster; but this shouldn't

448

# be getting called routinely anyway.

449

iterators = [self._iter_mem_nodes()]

450

for backing in self._backing_indices:

451

if backing is not None:

452

iterators.append(backing.iter_all_entries())

453

if len(iterators) == 1:

454

return iterators[0]

455

return self._iter_smallest(iterators)

456

457

def iter_entries(self, keys):

458

"""Iterate over keys within the index.

459

460

:param keys: An iterable providing the keys to be retrieved.

461

:return: An iterable of (index, key, value, reference_lists). There is no

462

defined order for the result iteration - it will be in the most

463

efficient order for the index (keys iteration order in this case).

464

"""

465

keys = set(keys)

466

# Note: We don't use keys.intersection() here. If you read the C api,

467

# set.intersection(other) special cases when other is a set and

468

# will iterate the smaller of the two and lookup in the other.

469

# It does *not* do this for any other type (even dict, unlike

470

# some other set functions.) Since we expect keys is generally <<

471

# self._nodes, it is faster to iterate over it in a list

472

# comprehension

473

nodes = self._nodes

474

local_keys = [key for key in keys if key in nodes]

475

if self.reference_lists:

476

for key in local_keys:

477

node = nodes[key]

478

yield self, key, node[1], node[0]

479

else:

480

for key in local_keys:

481

node = nodes[key]

482

yield self, key, node[1]

483

# Find things that are in backing indices that have not been handled

484

# yet.

485

if not self._backing_indices:

486

return # We won't find anything there either

487

# Remove all of the keys that we found locally

488

keys.difference_update(local_keys)

489

for backing in self._backing_indices:

490

if backing is None:

491

continue

492

if not keys:

493

return

494

for node in backing.iter_entries(keys):

495

keys.remove(node[1])

496

yield (self,) + node[1:]

497

498

def iter_entries_prefix(self, keys):

499

"""Iterate over keys within the index using prefix matching.

500

501

Prefix matching is applied within the tuple of a key, not to within

502

the bytestring of each key element. e.g. if you have the keys ('foo',

503

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

504

only the former key is returned.

505

506

:param keys: An iterable providing the key prefixes to be retrieved.

507

Each key prefix takes the form of a tuple the length of a key, but

508

with the last N elements 'None' rather than a regular bytestring.

509

The first element cannot be 'None'.

510

:return: An iterable as per iter_all_entries, but restricted to the

511

keys with a matching prefix to those supplied. No additional keys

512

will be returned, and every match that is in the index will be

513

returned.

514

"""

515

# XXX: To much duplication with the GraphIndex class; consider finding

516

# a good place to pull out the actual common logic.

517

keys = set(keys)

518

if not keys:

519

return

520

for backing in self._backing_indices:

521

if backing is None:

522

continue

523

for node in backing.iter_entries_prefix(keys):

524

yield (self,) + node[1:]

525

if self._key_length == 1:

526

for key in keys:

527

# sanity check

528

if key[0] is None:

529

raise errors.BadIndexKey(key)

530

if len(key) != self._key_length:

531

raise errors.BadIndexKey(key)

532

try:

533

node = self._nodes[key]

534

except KeyError:

535

continue

536

if self.reference_lists:

537

yield self, key, node[1], node[0]

538

else:

539

yield self, key, node[1]

540

return

541

for key in keys:

542

# sanity check

543

if key[0] is None:

544

raise errors.BadIndexKey(key)

545

if len(key) != self._key_length:

546

raise errors.BadIndexKey(key)

547

# find what it refers to:

548

key_dict = self._get_nodes_by_key()

549

elements = list(key)

550

# find the subdict to return

551

try:

552

while len(elements) and elements[0] is not None:

553

key_dict = key_dict[elements[0]]

554

elements.pop(0)

555

except KeyError:

556

# a non-existant lookup.

557

continue

558

if len(elements):

559

dicts = [key_dict]

560

while dicts:

561

key_dict = dicts.pop(-1)

562

# can't be empty or would not exist

563

item, value = key_dict.iteritems().next()

564

if type(value) == dict:

565

# push keys

566

dicts.extend(key_dict.itervalues())

567

else:

568

# yield keys

569

for value in key_dict.itervalues():

570

yield (self, ) + tuple(value)

571

else:

572

yield (self, ) + key_dict

573

574

def _get_nodes_by_key(self):

575

if self._nodes_by_key is None:

576

nodes_by_key = {}

577

if self.reference_lists:

578

for key, (references, value) in self._nodes.iteritems():

579

key_dict = nodes_by_key

580

for subkey in key[:-1]:

581

key_dict = key_dict.setdefault(subkey, {})

582

key_dict[key[-1]] = key, value, references

583

else:

584

for key, (references, value) in self._nodes.iteritems():

585

key_dict = nodes_by_key

586

for subkey in key[:-1]:

587

key_dict = key_dict.setdefault(subkey, {})

588

key_dict[key[-1]] = key, value

589

self._nodes_by_key = nodes_by_key

590

return self._nodes_by_key

591

592

def key_count(self):

593

"""Return an estimate of the number of keys in this index.

594

595

For InMemoryGraphIndex the estimate is exact.

596

"""

597

return len(self._nodes) + sum(backing.key_count() for backing in

598

self._backing_indices if backing is not None)

599

600

def validate(self):

601

"""In memory index's have no known corruption at the moment."""

602

603

604

class _LeafNode(object):

605

"""A leaf node for a serialised B+Tree index."""

606

607

__slots__ = ('keys', 'min_key', 'max_key')

608

609

def __init__(self, bytes, key_length, ref_list_length):

610

"""Parse bytes to create a leaf node object."""

611

# splitlines mangles the \r delimiters.. don't use it.

612

key_list = _btree_serializer._parse_leaf_lines(bytes,

613

key_length, ref_list_length)

614

if key_list:

615

self.min_key = key_list[0][0]

616

self.max_key = key_list[-1][0]

617

else:

618

self.min_key = self.max_key = None

619

self.keys = dict(key_list)

620

621

622

class _InternalNode(object):

623

"""An internal node for a serialised B+Tree index."""

624

625

__slots__ = ('keys', 'offset')

626

627

def __init__(self, bytes):

628

"""Parse bytes to create an internal node object."""

629

# splitlines mangles the \r delimiters.. don't use it.

630

self.keys = self._parse_lines(bytes.split('\n'))

631

632

def _parse_lines(self, lines):

633

nodes = []

634

self.offset = int(lines[1][7:])

635

as_st = static_tuple.StaticTuple.from_sequence

636

for line in lines[2:]:

637

if line == '':

638

break

639

nodes.append(as_st(map(intern, line.split('\0'))).intern())

640

return nodes

641

642

643

class BTreeGraphIndex(object):

644

"""Access to nodes via the standard GraphIndex interface for B+Tree's.

645

646

Individual nodes are held in a LRU cache. This holds the root node in

647

memory except when very large walks are done.

648

"""

649

650

def __init__(self, transport, name, size, unlimited_cache=False,

651

offset=0):

652

"""Create a B+Tree index object on the index name.

653

654

:param transport: The transport to read data for the index from.

655

:param name: The file name of the index on transport.

656

:param size: Optional size of the index in bytes. This allows

657

compatibility with the GraphIndex API, as well as ensuring that

658

the initial read (to read the root node header) can be done

659

without over-reading even on empty indices, and on small indices

660

allows single-IO to read the entire index.

661

:param unlimited_cache: If set to True, then instead of using an

662

LRUCache with size _NODE_CACHE_SIZE, we will use a dict and always

663

cache all leaf nodes.

664

:param offset: The start of the btree index data isn't byte 0 of the

665

file. Instead it starts at some point later.

666

"""

667

self._transport = transport

668

self._name = name

669

self._size = size

670

self._file = None

671

self._recommended_pages = self._compute_recommended_pages()

672

self._root_node = None

673

self._base_offset = offset

674

# Default max size is 100,000 leave values

675

self._leaf_value_cache = None # lru_cache.LRUCache(100*1000)

676

if unlimited_cache:

677

self._leaf_node_cache = {}

678

self._internal_node_cache = {}

679

else:

680

self._leaf_node_cache = lru_cache.LRUCache(_NODE_CACHE_SIZE)

681

# We use a FIFO here just to prevent possible blowout. However, a

682

# 300k record btree has only 3k leaf nodes, and only 20 internal

683

# nodes. A value of 100 scales to ~100*100*100 = 1M records.

684

self._internal_node_cache = fifo_cache.FIFOCache(100)

685

self._key_count = None

686

self._row_lengths = None

687

self._row_offsets = None # Start of each row, [-1] is the end

688

689

def __eq__(self, other):

690

"""Equal when self and other were created with the same parameters."""

691

return (

692

type(self) == type(other) and

693

self._transport == other._transport and

694

self._name == other._name and

695

self._size == other._size)

696

697

def __ne__(self, other):

698

return not self.__eq__(other)

699

700

def _get_and_cache_nodes(self, nodes):

701

"""Read nodes and cache them in the lru.

702

703

The nodes list supplied is sorted and then read from disk, each node

704

being inserted it into the _node_cache.

705

706

Note: Asking for more nodes than the _node_cache can contain will

707

result in some of the results being immediately discarded, to prevent

708

this an assertion is raised if more nodes are asked for than are

709

cachable.

710

711

:return: A dict of {node_pos: node}

712

"""

713

found = {}

714

start_of_leaves = None

715

for node_pos, node in self._read_nodes(sorted(nodes)):

716

if node_pos == 0: # Special case

717

self._root_node = node

718

else:

719

if start_of_leaves is None:

720

start_of_leaves = self._row_offsets[-2]

721

if node_pos < start_of_leaves:

722

self._internal_node_cache[node_pos] = node

723

else:

724

self._leaf_node_cache[node_pos] = node

725

found[node_pos] = node

726

return found

727

728

def _compute_recommended_pages(self):

729

"""Convert transport's recommended_page_size into btree pages.

730

731

recommended_page_size is in bytes, we want to know how many _PAGE_SIZE

732

pages fit in that length.

733

"""

734

recommended_read = self._transport.recommended_page_size()

735

recommended_pages = int(math.ceil(recommended_read /

736

float(_PAGE_SIZE)))

737

return recommended_pages

738

739

def _compute_total_pages_in_index(self):

740

"""How many pages are in the index.

741

742

If we have read the header we will use the value stored there.

743

Otherwise it will be computed based on the length of the index.

744

"""

745

if self._size is None:

746

raise AssertionError('_compute_total_pages_in_index should not be'

747

' called when self._size is None')

748

if self._root_node is not None:

749

# This is the number of pages as defined by the header

750

return self._row_offsets[-1]

751

# This is the number of pages as defined by the size of the index. They

752

# should be indentical.

753

total_pages = int(math.ceil(self._size / float(_PAGE_SIZE)))

754

return total_pages

755

756

def _expand_offsets(self, offsets):

757

"""Find extra pages to download.

758

759

The idea is that we always want to make big-enough requests (like 64kB

760

for http), so that we don't waste round trips. So given the entries

761

that we already have cached and the new pages being downloaded figure

762

out what other pages we might want to read.

763

764

See also doc/developers/btree_index_prefetch.txt for more details.

765

766

:param offsets: The offsets to be read

767

:return: A list of offsets to download

768

"""

769

if 'index' in debug.debug_flags:

770

trace.mutter('expanding: %s\toffsets: %s', self._name, offsets)

771

772

if len(offsets) >= self._recommended_pages:

773

# Don't add more, we are already requesting more than enough

774

if 'index' in debug.debug_flags:

775

trace.mutter(' not expanding large request (%s >= %s)',

776

len(offsets), self._recommended_pages)

777

return offsets

778

if self._size is None:

779

# Don't try anything, because we don't know where the file ends

780

if 'index' in debug.debug_flags:

781

trace.mutter(' not expanding without knowing index size')

782

return offsets

783

total_pages = self._compute_total_pages_in_index()

784

cached_offsets = self._get_offsets_to_cached_pages()

785

# If reading recommended_pages would read the rest of the index, just

786

# do so.

787

if total_pages - len(cached_offsets) <= self._recommended_pages:

788

# Read whatever is left

789

if cached_offsets:

790

expanded = [x for x in xrange(total_pages)

791

if x not in cached_offsets]

792

else:

793

expanded = range(total_pages)

794

if 'index' in debug.debug_flags:

795

trace.mutter(' reading all unread pages: %s', expanded)

796

return expanded

797

798

if self._root_node is None:

799

# ATM on the first read of the root node of a large index, we don't

800

# bother pre-reading any other pages. This is because the

801

# likelyhood of actually reading interesting pages is very low.

802

# See doc/developers/btree_index_prefetch.txt for a discussion, and

803

# a possible implementation when we are guessing that the second

804

# layer index is small

805

final_offsets = offsets

806

else:

807

tree_depth = len(self._row_lengths)

808

if len(cached_offsets) < tree_depth and len(offsets) == 1:

809

# We haven't read enough to justify expansion

810

# If we are only going to read the root node, and 1 leaf node,

811

# then it isn't worth expanding our request. Once we've read at

812

# least 2 nodes, then we are probably doing a search, and we

813

# start expanding our requests.

814

if 'index' in debug.debug_flags:

815

trace.mutter(' not expanding on first reads')

816

return offsets

817

final_offsets = self._expand_to_neighbors(offsets, cached_offsets,

818

total_pages)

819

820

final_offsets = sorted(final_offsets)

821

if 'index' in debug.debug_flags:

822

trace.mutter('expanded: %s', final_offsets)

823

return final_offsets

824

825

def _expand_to_neighbors(self, offsets, cached_offsets, total_pages):

826

"""Expand requests to neighbors until we have enough pages.

827

828

This is called from _expand_offsets after policy has determined that we

829

want to expand.

830

We only want to expand requests within a given layer. We cheat a little

831

bit and assume all requests will be in the same layer. This is true

832

given the current design, but if it changes this algorithm may perform

833

oddly.

834

835

:param offsets: requested offsets

836

:param cached_offsets: offsets for pages we currently have cached

837

:return: A set() of offsets after expansion

838

"""

839

final_offsets = set(offsets)

840

first = end = None

841

new_tips = set(final_offsets)

842

while len(final_offsets) < self._recommended_pages and new_tips:

843

next_tips = set()

844

for pos in new_tips:

845

if first is None:

846

first, end = self._find_layer_first_and_end(pos)

847

previous = pos - 1

848

if (previous > 0

849

and previous not in cached_offsets

850

and previous not in final_offsets

851

and previous >= first):

852

next_tips.add(previous)

853

after = pos + 1

854

if (after < total_pages

855

and after not in cached_offsets

856

and after not in final_offsets

857

and after < end):

858

next_tips.add(after)

859

# This would keep us from going bigger than

860

# recommended_pages by only expanding the first offsets.

861

# However, if we are making a 'wide' request, it is

862

# reasonable to expand all points equally.

863

# if len(final_offsets) > recommended_pages:

864

# break

865

final_offsets.update(next_tips)

866

new_tips = next_tips

867

return final_offsets

868

869

def clear_cache(self):

870

"""Clear out any cached/memoized values.

871

872

This can be called at any time, but generally it is used when we have

873

extracted some information, but don't expect to be requesting any more

874

from this index.

875

"""

876

# Note that we don't touch self._root_node or self._internal_node_cache

877

# We don't expect either of those to be big, and it can save

878

# round-trips in the future. We may re-evaluate this if InternalNode

879

# memory starts to be an issue.

880

self._leaf_node_cache.clear()

881

882

def external_references(self, ref_list_num):

883

if self._root_node is None:

884

self._get_root_node()

885

if ref_list_num + 1 > self.node_ref_lists:

886

raise ValueError('No ref list %d, index has %d ref lists'

887

% (ref_list_num, self.node_ref_lists))

888

keys = set()

889

refs = set()

890

for node in self.iter_all_entries():

891

keys.add(node[1])

892

refs.update(node[3][ref_list_num])

893

return refs - keys

894

895

def _find_layer_first_and_end(self, offset):

896

"""Find the start/stop nodes for the layer corresponding to offset.

897

898

:return: (first, end)

899

first is the first node in this layer

900

end is the first node of the next layer

901

"""

902

first = end = 0

903

for roffset in self._row_offsets:

904

first = end

905

end = roffset

906

if offset < roffset:

907

break

908

return first, end

909

910

def _get_offsets_to_cached_pages(self):

911

"""Determine what nodes we already have cached."""

912

cached_offsets = set(self._internal_node_cache.keys())

913

cached_offsets.update(self._leaf_node_cache.keys())

914

if self._root_node is not None:

915

cached_offsets.add(0)

916

return cached_offsets

917

918

def _get_root_node(self):

919

if self._root_node is None:

920

# We may not have a root node yet

921

self._get_internal_nodes([0])

922

return self._root_node

923

924

def _get_nodes(self, cache, node_indexes):

925

found = {}

926

needed = []

927

for idx in node_indexes:

928

if idx == 0 and self._root_node is not None:

929

found[0] = self._root_node

930

continue

931

try:

932

found[idx] = cache[idx]

933

except KeyError:

934

needed.append(idx)

935

if not needed:

936

return found

937

needed = self._expand_offsets(needed)

938

found.update(self._get_and_cache_nodes(needed))

939

return found

940

941

def _get_internal_nodes(self, node_indexes):

942

"""Get a node, from cache or disk.

943

944

After getting it, the node will be cached.

945

"""

946

return self._get_nodes(self._internal_node_cache, node_indexes)

947

948

def _cache_leaf_values(self, nodes):

949

"""Cache directly from key => value, skipping the btree."""

950

if self._leaf_value_cache is not None:

951

for node in nodes.itervalues():

952

for key, value in node.keys.iteritems():

953

if key in self._leaf_value_cache:

954

# Don't add the rest of the keys, we've seen this node

955

# before.

956

break

957

self._leaf_value_cache[key] = value

958

959

def _get_leaf_nodes(self, node_indexes):

960

"""Get a bunch of nodes, from cache or disk."""

961

found = self._get_nodes(self._leaf_node_cache, node_indexes)

962

self._cache_leaf_values(found)

963

return found

964

965

def iter_all_entries(self):

966

"""Iterate over all keys within the index.

967

968

:return: An iterable of (index, key, value) or (index, key, value, reference_lists).

969

The former tuple is used when there are no reference lists in the

970

index, making the API compatible with simple key:value index types.

971

There is no defined order for the result iteration - it will be in

972

the most efficient order for the index.

973

"""

974

if 'evil' in debug.debug_flags:

975

trace.mutter_callsite(3,

976

"iter_all_entries scales with size of history.")

977

if not self.key_count():

978

return

979

if self._row_offsets[-1] == 1:

980

# There is only the root node, and we read that via key_count()

981

if self.node_ref_lists:

982

for key, (value, refs) in sorted(self._root_node.keys.items()):

983

yield (self, key, value, refs)

984

else:

985

for key, (value, refs) in sorted(self._root_node.keys.items()):

986

yield (self, key, value)

987

return

988

start_of_leaves = self._row_offsets[-2]

989

end_of_leaves = self._row_offsets[-1]

990

needed_offsets = range(start_of_leaves, end_of_leaves)

991

if needed_offsets == [0]:

992

# Special case when we only have a root node, as we have already

993

# read everything

994

nodes = [(0, self._root_node)]

995

else:

996

nodes = self._read_nodes(needed_offsets)

997

# We iterate strictly in-order so that we can use this function

998

# for spilling index builds to disk.

999

if self.node_ref_lists:

1000

for _, node in nodes:

1001

for key, (value, refs) in sorted(node.keys.items()):

1002

yield (self, key, value, refs)

1003

else:

1004

for _, node in nodes:

1005

for key, (value, refs) in sorted(node.keys.items()):

1006

yield (self, key, value)

1007

1008

@staticmethod

1009

def _multi_bisect_right(in_keys, fixed_keys):

1010

"""Find the positions where each 'in_key' would fit in fixed_keys.

1011

1012

This is equivalent to doing "bisect_right" on each in_key into

1013

fixed_keys

1014

1015

:param in_keys: A sorted list of keys to match with fixed_keys

1016

:param fixed_keys: A sorted list of keys to match against

1017

:return: A list of (integer position, [key list]) tuples.

1018

"""

1019

if not in_keys:

1020

return []

1021

if not fixed_keys:

1022

# no pointers in the fixed_keys list, which means everything must

1023

# fall to the left.

1024

return [(0, in_keys)]

1025

1026

# TODO: Iterating both lists will generally take M + N steps

1027

# Bisecting each key will generally take M * log2 N steps.

1028

# If we had an efficient way to compare, we could pick the method

1029

# based on which has the fewer number of steps.

1030

# There is also the argument that bisect_right is a compiled

1031

# function, so there is even more to be gained.

1032

# iter_steps = len(in_keys) + len(fixed_keys)

1033

# bisect_steps = len(in_keys) * math.log(len(fixed_keys), 2)

1034

if len(in_keys) == 1: # Bisect will always be faster for M = 1

1035

return [(bisect_right(fixed_keys, in_keys[0]), in_keys)]

1036

# elif bisect_steps < iter_steps:

1037

# offsets = {}

1038

# for key in in_keys:

1039

# offsets.setdefault(bisect_right(fixed_keys, key),

1040

# []).append(key)

1041

# return [(o, offsets[o]) for o in sorted(offsets)]

1042

in_keys_iter = iter(in_keys)

1043

fixed_keys_iter = enumerate(fixed_keys)

1044

cur_in_key = in_keys_iter.next()

1045

cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

1046

1047

class InputDone(Exception): pass

1048

class FixedDone(Exception): pass

1049

1050

output = []

1051

cur_out = []

1052

1053

# TODO: Another possibility is that rather than iterating on each side,

1054

# we could use a combination of bisecting and iterating. For

1055

# example, while cur_in_key < fixed_key, bisect to find its

1056

# point, then iterate all matching keys, then bisect (restricted

1057

# to only the remainder) for the next one, etc.

1058

try:

1059

while True:

1060

if cur_in_key < cur_fixed_key:

1061

cur_keys = []

1062

cur_out = (cur_fixed_offset, cur_keys)

1063

output.append(cur_out)

1064

while cur_in_key < cur_fixed_key:

1065

cur_keys.append(cur_in_key)

1066

try:

1067

cur_in_key = in_keys_iter.next()

1068

except StopIteration:

1069

raise InputDone

1070

# At this point cur_in_key must be >= cur_fixed_key

1071

# step the cur_fixed_key until we pass the cur key, or walk off

1072

# the end

1073

while cur_in_key >= cur_fixed_key:

1074

try:

1075

cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

1076

except StopIteration:

1077

raise FixedDone

1078

except InputDone:

1079

# We consumed all of the input, nothing more to do

1080

pass

1081

except FixedDone:

1082

# There was some input left, but we consumed all of fixed, so we

1083

# have to add one more for the tail

1084

cur_keys = [cur_in_key]

1085

cur_keys.extend(in_keys_iter)

1086

cur_out = (len(fixed_keys), cur_keys)

1087

output.append(cur_out)

1088

return output

1089

1090

def _walk_through_internal_nodes(self, keys):

1091

"""Take the given set of keys, and find the corresponding LeafNodes.

1092

1093

:param keys: An unsorted iterable of keys to search for

1094

:return: (nodes, index_and_keys)

1095

nodes is a dict mapping {index: LeafNode}

1096

keys_at_index is a list of tuples of [(index, [keys for Leaf])]

1097

"""

1098

# 6 seconds spent in miss_torture using the sorted() line.

1099

# Even with out of order disk IO it seems faster not to sort it when

1100

# large queries are being made.

1101

keys_at_index = [(0, sorted(keys))]

1102

1103

for row_pos, next_row_start in enumerate(self._row_offsets[1:-1]):

1104

node_indexes = [idx for idx, s_keys in keys_at_index]

1105

nodes = self._get_internal_nodes(node_indexes)

1106

1107

next_nodes_and_keys = []

1108

for node_index, sub_keys in keys_at_index:

1109

node = nodes[node_index]

1110

positions = self._multi_bisect_right(sub_keys, node.keys)

1111

node_offset = next_row_start + node.offset

1112

next_nodes_and_keys.extend([(node_offset + pos, s_keys)

1113

for pos, s_keys in positions])

1114

keys_at_index = next_nodes_and_keys

1115

# We should now be at the _LeafNodes

1116

node_indexes = [idx for idx, s_keys in keys_at_index]

1117

1118

# TODO: We may *not* want to always read all the nodes in one

1119

# big go. Consider setting a max size on this.

1120

nodes = self._get_leaf_nodes(node_indexes)

1121

return nodes, keys_at_index

1122

1123

def iter_entries(self, keys):

1124

"""Iterate over keys within the index.

1125

1126

:param keys: An iterable providing the keys to be retrieved.

1127

:return: An iterable as per iter_all_entries, but restricted to the

1128

keys supplied. No additional keys will be returned, and every

1129

key supplied that is in the index will be returned.

1130

"""

1131

# 6 seconds spent in miss_torture using the sorted() line.

1132

# Even with out of order disk IO it seems faster not to sort it when

1133

# large queries are being made.

1134

# However, now that we are doing multi-way bisecting, we need the keys

1135

# in sorted order anyway. We could change the multi-way code to not

1136

# require sorted order. (For example, it bisects for the first node,

1137

# does an in-order search until a key comes before the current point,

1138

# which it then bisects for, etc.)

1139

keys = frozenset(keys)

1140

if not keys:

1141

return

1142

1143

if not self.key_count():

1144

return

1145

1146

needed_keys = []

1147

if self._leaf_value_cache is None:

1148

needed_keys = keys

1149

else:

1150

for key in keys:

1151

value = self._leaf_value_cache.get(key, None)

1152

if value is not None:

1153

# This key is known not to be here, skip it

1154

value, refs = value

1155

if self.node_ref_lists:

1156

yield (self, key, value, refs)

1157

else:

1158

yield (self, key, value)

1159

else:

1160

needed_keys.append(key)

1161

1162

last_key = None

1163

needed_keys = keys

1164

if not needed_keys:

1165

return

1166

nodes, nodes_and_keys = self._walk_through_internal_nodes(needed_keys)

1167

for node_index, sub_keys in nodes_and_keys:

1168

if not sub_keys:

1169

continue

1170

node = nodes[node_index]

1171

for next_sub_key in sub_keys:

1172

if next_sub_key in node.keys:

1173

value, refs = node.keys[next_sub_key]

1174

if self.node_ref_lists:

1175

yield (self, next_sub_key, value, refs)

1176

else:

1177

yield (self, next_sub_key, value)

1178

1179

def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):

1180

"""Find the parent_map information for the set of keys.

1181

1182

This populates the parent_map dict and missing_keys set based on the

1183

queried keys. It also can fill out an arbitrary number of parents that

1184

it finds while searching for the supplied keys.

1185

1186

It is unlikely that you want to call this directly. See

1187

"CombinedGraphIndex.find_ancestry()" for a more appropriate API.

1188

1189

:param keys: A keys whose ancestry we want to return

1190

Every key will either end up in 'parent_map' or 'missing_keys'.

1191

:param ref_list_num: This index in the ref_lists is the parents we

1192

care about.

1193

:param parent_map: {key: parent_keys} for keys that are present in this

1194

index. This may contain more entries than were in 'keys', that are

1195

reachable ancestors of the keys requested.

1196

:param missing_keys: keys which are known to be missing in this index.

1197

This may include parents that were not directly requested, but we

1198

were able to determine that they are not present in this index.

1199

:return: search_keys parents that were found but not queried to know

1200

if they are missing or present. Callers can re-query this index for

1201

those keys, and they will be placed into parent_map or missing_keys

1202

"""

1203

if not self.key_count():

1204

# We use key_count() to trigger reading the root node and

1205

# determining info about this BTreeGraphIndex

1206

# If we don't have any keys, then everything is missing

1207

missing_keys.update(keys)

1208

return set()

1209

if ref_list_num >= self.node_ref_lists:

1210

raise ValueError('No ref list %d, index has %d ref lists'

1211

% (ref_list_num, self.node_ref_lists))

1212

1213

# The main trick we are trying to accomplish is that when we find a

1214

# key listing its parents, we expect that the parent key is also likely

1215

# to sit on the same page. Allowing us to expand parents quickly

1216

# without suffering the full stack of bisecting, etc.

1217

nodes, nodes_and_keys = self._walk_through_internal_nodes(keys)

1218

1219

# These are parent keys which could not be immediately resolved on the

1220

# page where the child was present. Note that we may already be

1221

# searching for that key, and it may actually be present [or known

1222

# missing] on one of the other pages we are reading.

1223

# TODO:

1224

# We could try searching for them in the immediate previous or next

1225

# page. If they occur "later" we could put them in a pending lookup

1226

# set, and then for each node we read thereafter we could check to

1227

# see if they are present.

1228

# However, we don't know the impact of keeping this list of things

1229

# that I'm going to search for every node I come across from here on

1230

# out.

1231

# It doesn't handle the case when the parent key is missing on a

1232

# page that we *don't* read. So we already have to handle being

1233

# re-entrant for that.

1234

# Since most keys contain a date string, they are more likely to be

1235

# found earlier in the file than later, but we would know that right

1236

# away (key < min_key), and wouldn't keep searching it on every other

1237

# page that we read.

1238

# Mostly, it is an idea, one which should be benchmarked.

1239

parents_not_on_page = set()

1240

1241

for node_index, sub_keys in nodes_and_keys:

1242

if not sub_keys:

1243

continue

1244

# sub_keys is all of the keys we are looking for that should exist

1245

# on this page, if they aren't here, then they won't be found

1246

node = nodes[node_index]

1247

node_keys = node.keys

1248

parents_to_check = set()

1249

for next_sub_key in sub_keys:

1250

if next_sub_key not in node_keys:

1251

# This one is just not present in the index at all

1252

missing_keys.add(next_sub_key)

1253

else:

1254

value, refs = node_keys[next_sub_key]

1255

parent_keys = refs[ref_list_num]

1256

parent_map[next_sub_key] = parent_keys

1257

parents_to_check.update(parent_keys)

1258

# Don't look for things we've already found

1259

parents_to_check = parents_to_check.difference(parent_map)

1260

# this can be used to test the benefit of having the check loop

1261

# inlined.

1262

# parents_not_on_page.update(parents_to_check)

1263

# continue

1264

while parents_to_check:

1265

next_parents_to_check = set()

1266

for key in parents_to_check:

1267

if key in node_keys:

1268

value, refs = node_keys[key]

1269

parent_keys = refs[ref_list_num]

1270

parent_map[key] = parent_keys

1271

next_parents_to_check.update(parent_keys)

1272

else:

1273

# This parent either is genuinely missing, or should be

1274

# found on another page. Perf test whether it is better

1275

# to check if this node should fit on this page or not.

1276

# in the 'everything-in-one-pack' scenario, this *not*

1277

# doing the check is 237ms vs 243ms.

1278

# So slightly better, but I assume the standard 'lots

1279

# of packs' is going to show a reasonable improvement

1280

# from the check, because it avoids 'going around

1281

# again' for everything that is in another index

1282

# parents_not_on_page.add(key)

1283

# Missing for some reason

1284

if key < node.min_key:

1285

# in the case of bzr.dev, 3.4k/5.3k misses are

1286

# 'earlier' misses (65%)

1287

parents_not_on_page.add(key)

1288

elif key > node.max_key:

1289

# This parent key would be present on a different

1290

# LeafNode

1291

parents_not_on_page.add(key)

1292

else:

1293

# assert key != node.min_key and key != node.max_key

1294

# If it was going to be present, it would be on

1295

# *this* page, so mark it missing.

1296

missing_keys.add(key)

1297

parents_to_check = next_parents_to_check.difference(parent_map)

1298

# Might want to do another .difference() from missing_keys

1299

# parents_not_on_page could have been found on a different page, or be

1300

# known to be missing. So cull out everything that has already been

1301

# found.

1302

search_keys = parents_not_on_page.difference(

1303

parent_map).difference(missing_keys)

1304

return search_keys

1305

1306

def iter_entries_prefix(self, keys):

1307

"""Iterate over keys within the index using prefix matching.

1308

1309

Prefix matching is applied within the tuple of a key, not to within

1310

the bytestring of each key element. e.g. if you have the keys ('foo',

1311

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1312

only the former key is returned.

1313

1314

WARNING: Note that this method currently causes a full index parse

1315

unconditionally (which is reasonably appropriate as it is a means for

1316

thunking many small indices into one larger one and still supplies

1317

iter_all_entries at the thunk layer).

1318

1319

:param keys: An iterable providing the key prefixes to be retrieved.

1320

Each key prefix takes the form of a tuple the length of a key, but

1321

with the last N elements 'None' rather than a regular bytestring.

1322

The first element cannot be 'None'.

1323

:return: An iterable as per iter_all_entries, but restricted to the

1324

keys with a matching prefix to those supplied. No additional keys

1325

will be returned, and every match that is in the index will be

1326

returned.

1327

"""

1328

keys = sorted(set(keys))

1329

if not keys:

1330

return

1331

# Load if needed to check key lengths

1332

if self._key_count is None:

1333

self._get_root_node()

1334

# TODO: only access nodes that can satisfy the prefixes we are looking

1335

# for. For now, to meet API usage (as this function is not used by

1336

# current bzrlib) just suck the entire index and iterate in memory.

1337

nodes = {}

1338

if self.node_ref_lists:

1339

if self._key_length == 1:

1340

for _1, key, value, refs in self.iter_all_entries():

1341

nodes[key] = value, refs

1342

else:

1343

nodes_by_key = {}

1344

for _1, key, value, refs in self.iter_all_entries():

1345

key_value = key, value, refs

1346

# For a key of (foo, bar, baz) create

1347

# _nodes_by_key[foo][bar][baz] = key_value

1348

key_dict = nodes_by_key

1349

for subkey in key[:-1]:

1350

key_dict = key_dict.setdefault(subkey, {})

1351

key_dict[key[-1]] = key_value

1352

else:

1353

if self._key_length == 1:

1354

for _1, key, value in self.iter_all_entries():

1355

nodes[key] = value

1356

else:

1357

nodes_by_key = {}

1358

for _1, key, value in self.iter_all_entries():

1359

key_value = key, value

1360

# For a key of (foo, bar, baz) create

1361

# _nodes_by_key[foo][bar][baz] = key_value

1362

key_dict = nodes_by_key

1363

for subkey in key[:-1]:

1364

key_dict = key_dict.setdefault(subkey, {})

1365

key_dict[key[-1]] = key_value

1366

if self._key_length == 1:

1367

for key in keys:

1368

# sanity check

1369

if key[0] is None:

1370

raise errors.BadIndexKey(key)

1371

if len(key) != self._key_length:

1372

raise errors.BadIndexKey(key)

1373

try:

1374

if self.node_ref_lists:

1375

value, node_refs = nodes[key]

1376

yield self, key, value, node_refs

1377

else:

1378

yield self, key, nodes[key]

1379

except KeyError:

1380

pass

1381

return

1382

for key in keys:

1383

# sanity check

1384

if key[0] is None:

1385

raise errors.BadIndexKey(key)

1386

if len(key) != self._key_length:

1387

raise errors.BadIndexKey(key)

1388

# find what it refers to:

1389

key_dict = nodes_by_key

1390

elements = list(key)

1391

# find the subdict whose contents should be returned.

1392

try:

1393

while len(elements) and elements[0] is not None:

1394

key_dict = key_dict[elements[0]]

1395

elements.pop(0)

1396

except KeyError:

1397

# a non-existant lookup.

1398

continue

1399

if len(elements):

1400

dicts = [key_dict]

1401

while dicts:

1402

key_dict = dicts.pop(-1)

1403

# can't be empty or would not exist

1404

item, value = key_dict.iteritems().next()

1405

if type(value) == dict:

1406

# push keys

1407

dicts.extend(key_dict.itervalues())

1408

else:

1409

# yield keys

1410

for value in key_dict.itervalues():

1411

# each value is the key:value:node refs tuple

1412

# ready to yield.

1413

yield (self, ) + value

1414

else:

1415

# the last thing looked up was a terminal element

1416

yield (self, ) + key_dict

1417

1418

def key_count(self):

1419

"""Return an estimate of the number of keys in this index.

1420

1421

For BTreeGraphIndex the estimate is exact as it is contained in the

1422

header.

1423

"""

1424

if self._key_count is None:

1425

self._get_root_node()

1426

return self._key_count

1427

1428

def _compute_row_offsets(self):

1429

"""Fill out the _row_offsets attribute based on _row_lengths."""

1430

offsets = []

1431

row_offset = 0

1432

for row in self._row_lengths:

1433

offsets.append(row_offset)

1434

row_offset += row

1435

offsets.append(row_offset)

1436

self._row_offsets = offsets

1437

1438

def _parse_header_from_bytes(self, bytes):

1439

"""Parse the header from a region of bytes.

1440

1441

:param bytes: The data to parse.

1442

:return: An offset, data tuple such as readv yields, for the unparsed

1443

data. (which may be of length 0).

1444

"""

1445

signature = bytes[0:len(self._signature())]

1446

if not signature == self._signature():

1447

raise errors.BadIndexFormatSignature(self._name, BTreeGraphIndex)

1448

lines = bytes[len(self._signature()):].splitlines()

1449

options_line = lines[0]

1450

if not options_line.startswith(_OPTION_NODE_REFS):

1451

raise errors.BadIndexOptions(self)

1452

try:

1453

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):])

1454

except ValueError:

1455

raise errors.BadIndexOptions(self)

1456

options_line = lines[1]

1457

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

1458

raise errors.BadIndexOptions(self)

1459

try:

1460

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):])

1461

except ValueError:

1462

raise errors.BadIndexOptions(self)

1463

options_line = lines[2]

1464

if not options_line.startswith(_OPTION_LEN):

1465

raise errors.BadIndexOptions(self)

1466

try:

1467

self._key_count = int(options_line[len(_OPTION_LEN):])

1468

except ValueError:

1469

raise errors.BadIndexOptions(self)

1470

options_line = lines[3]

1471

if not options_line.startswith(_OPTION_ROW_LENGTHS):

1472

raise errors.BadIndexOptions(self)

1473

try:

1474

self._row_lengths = map(int, [length for length in

1475

options_line[len(_OPTION_ROW_LENGTHS):].split(',')

1476

if len(length)])

1477

except ValueError:

1478

raise errors.BadIndexOptions(self)

1479

self._compute_row_offsets()

1480

1481

# calculate the bytes we have processed

1482

header_end = (len(signature) + sum(map(len, lines[0:4])) + 4)

1483

return header_end, bytes[header_end:]

1484

1485

def _read_nodes(self, nodes):

1486

"""Read some nodes from disk into the LRU cache.

1487

1488

This performs a readv to get the node data into memory, and parses each

1489

node, then yields it to the caller. The nodes are requested in the

1490

supplied order. If possible doing sort() on the list before requesting

1491

a read may improve performance.

1492

1493

:param nodes: The nodes to read. 0 - first node, 1 - second node etc.

1494

:return: None

1495

"""

1496

# may be the byte string of the whole file

1497

bytes = None

1498

# list of (offset, length) regions of the file that should, evenually

1499

# be read in to data_ranges, either from 'bytes' or from the transport

1500

ranges = []

1501

base_offset = self._base_offset

1502

for index in nodes:

1503

offset = (index * _PAGE_SIZE)

1504

size = _PAGE_SIZE

1505

if index == 0:

1506

# Root node - special case

1507

if self._size:

1508

size = min(_PAGE_SIZE, self._size)

1509

else:

1510

# The only case where we don't know the size, is for very

1511

# small indexes. So we read the whole thing

1512

bytes = self._transport.get_bytes(self._name)

1513

num_bytes = len(bytes)

1514

self._size = num_bytes - base_offset

1515

# the whole thing should be parsed out of 'bytes'

1516

ranges = [(start, min(_PAGE_SIZE, num_bytes - start))

1517

for start in xrange(base_offset, num_bytes, _PAGE_SIZE)]

1518

break

1519

else:

1520

if offset > self._size:

1521

raise AssertionError('tried to read past the end'

1522

' of the file %s > %s'

1523

% (offset, self._size))

1524

size = min(size, self._size - offset)

1525

ranges.append((base_offset + offset, size))

1526

if not ranges:

1527

return

1528

elif bytes is not None:

1529

# already have the whole file

1530

data_ranges = [(start, bytes[start:start+size])

1531

for start, size in ranges]

1532

elif self._file is None:

1533

data_ranges = self._transport.readv(self._name, ranges)

1534

else:

1535

data_ranges = []

1536

for offset, size in ranges:

1537

self._file.seek(offset)

1538

data_ranges.append((offset, self._file.read(size)))

1539

for offset, data in data_ranges:

1540

offset -= base_offset

1541

if offset == 0:

1542

# extract the header

1543

offset, data = self._parse_header_from_bytes(data)

1544

if len(data) == 0:

1545

continue

1546

bytes = zlib.decompress(data)

1547

if bytes.startswith(_LEAF_FLAG):

1548

node = _LeafNode(bytes, self._key_length, self.node_ref_lists)

1549

elif bytes.startswith(_INTERNAL_FLAG):

1550

node = _InternalNode(bytes)

1551

else:

1552

raise AssertionError("Unknown node type for %r" % bytes)

1553

yield offset / _PAGE_SIZE, node

1554

1555

def _signature(self):

1556

"""The file signature for this index type."""

1557

return _BTSIGNATURE

1558

1559

def validate(self):

1560

"""Validate that everything in the index can be accessed."""

1561

# just read and parse every node.

1562

self._get_root_node()

1563

if len(self._row_lengths) > 1:

1564

start_node = self._row_offsets[1]

1565

else:

1566

# We shouldn't be reading anything anyway

1567

start_node = 1

1568

node_end = self._row_offsets[-1]

1569

for node in self._read_nodes(range(start_node, node_end)):

1570

pass

1571

1572

1573

try:

1574

from bzrlib import _btree_serializer_pyx as _btree_serializer

1575

except ImportError, e:

1576

osutils.failed_to_load_extension(e)

1577

from bzrlib import _btree_serializer_py as _btree_serializer

Older »