~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/btree_index.py

Committer: Gordon Tyler
Date: 2010-02-02 06:30:43 UTC
mto: (5037.3.1 integration)
mto: This revision was merged to the branch mainline in revision 5046.
Revision ID: gordon@doxxx.net-20100202063043-3ygr1114d25m3f7m

Added cmdline.split function, which replaces commands.shlex_split_unicode.

files added:
MANIFEST.in

README_BDIST_RPM

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_import_c_api.h

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/benchmarks/bench_tags.py

bzrlib/bencode.py

bzrlib/cleanup.py

bzrlib/cmdline.py

bzrlib/crash.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/filters/eol.py

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/es

bzrlib/inventory_delta.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/news_merge

bzrlib/plugins/news_merge/README

bzrlib/plugins/news_merge/__init__.py

bzrlib/plugins/news_merge/news_merge.py

bzrlib/plugins/news_merge/parser.py

bzrlib/plugins/news_merge/tests

bzrlib/plugins/news_merge/tests/__init__.py

bzrlib/plugins/news_merge/tests/test_news_merge.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/static_tuple.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/features.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_foreign_vcs

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_foreign_vcs/test_repository.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/script.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__bencode.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_cleanup.py

bzrlib/tests/test_cmdline.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_patches_data/binary-after-normal.patch

bzrlib/tests/test_patches_data/binary.patch

bzrlib/tests/test_script.py

bzrlib/tests/test_serializer.py

bzrlib/transport/pathfilter.py

bzrlib/util/bencode.py

contrib/debian

contrib/debian/default

contrib/debian/init.d

doc/Bazaar-Logo-For-Manuals.png

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr-doc.css

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/apport.txt

doc/developers/bug-handling.txt

doc/developers/check.txt

doc/developers/conf.py

doc/developers/content-filtering.txt

doc/developers/contribution-quickstart.txt

doc/developers/implementation-notes.txt

doc/developers/index-plain.txt

doc/developers/miscellaneous-notes.txt

doc/developers/plans.txt

doc/developers/principles.txt

doc/developers/process.txt

doc/developers/specifications.txt

doc/developers/win32_build_setup.txt

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide/advanced.txt

doc/en/admin-guide/backup.txt

doc/en/admin-guide/code-browsing.txt

doc/en/admin-guide/hooks-plugins.txt

doc/en/admin-guide/index-plain.txt

doc/en/admin-guide/integration.txt

doc/en/admin-guide/introduction.txt

doc/en/admin-guide/migration.txt

doc/en/admin-guide/other-setups.txt

doc/en/admin-guide/security.txt

doc/en/admin-guide/simple-setups.txt

doc/en/admin-guide/upgrade.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/quick-reference/index.txt

doc/en/tutorials/index.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/quick-reference/index.txt

doc/es/user-guide/index-plain.txt

doc/index.es.txt

doc/index.ja.txt

doc/index.ru.txt

doc/ja

doc/ja/_static

doc/ja/_static/bzr icon 16.png

doc/ja/_static/bzr.ico

doc/ja/_templates

doc/ja/conf.py

doc/ja/index.txt

doc/ja/mini-tutorial

doc/ja/mini-tutorial/index.txt

doc/ja/tutorials

doc/ja/tutorials/centralized_workflow.txt

doc/ja/tutorials/index.txt

doc/ja/tutorials/tutorial.txt

doc/ja/tutorials/using_bazaar_with_launchpad.txt

doc/ja/upgrade-guide

doc/ja/upgrade-guide/data_migration.txt

doc/ja/upgrade-guide/index.txt

doc/ja/upgrade-guide/overview.txt

doc/ja/upgrade-guide/tips_and_tricks.txt

doc/ja/user-guide

doc/ja/user-guide/adv_merging.txt

doc/ja/user-guide/annotating_changes.txt

doc/ja/user-guide/bazaar_workflows.txt

doc/ja/user-guide/branching_a_project.txt

doc/ja/user-guide/browsing_history.txt

doc/ja/user-guide/bug_trackers.txt

doc/ja/user-guide/bzrtools_plugin.txt

doc/ja/user-guide/central_intro.txt

doc/ja/user-guide/configuring_bazaar.txt

doc/ja/user-guide/controlling_registration.txt

doc/ja/user-guide/core_concepts.txt

doc/ja/user-guide/distributed_intro.txt

doc/ja/user-guide/entering_commands.txt

doc/ja/user-guide/filtered_views.txt

doc/ja/user-guide/getting_help.txt

doc/ja/user-guide/hooks.txt

doc/ja/user-guide/http_smart_server.txt

doc/ja/user-guide/images

doc/ja/user-guide/images/workflows_centralized.png

doc/ja/user-guide/images/workflows_centralized.svg

doc/ja/user-guide/images/workflows_gatekeeper.png

doc/ja/user-guide/images/workflows_gatekeeper.svg

doc/ja/user-guide/images/workflows_localcommit.png

doc/ja/user-guide/images/workflows_localcommit.svg

doc/ja/user-guide/images/workflows_peer.png

doc/ja/user-guide/images/workflows_peer.svg

doc/ja/user-guide/images/workflows_pqm.png

doc/ja/user-guide/images/workflows_pqm.svg

doc/ja/user-guide/images/workflows_shared.png

doc/ja/user-guide/images/workflows_shared.svg

doc/ja/user-guide/images/workflows_single.png

doc/ja/user-guide/images/workflows_single.svg

doc/ja/user-guide/index.txt

doc/ja/user-guide/installing_bazaar.txt

doc/ja/user-guide/introducing_bazaar.txt

doc/ja/user-guide/merging_changes.txt

doc/ja/user-guide/organizing_branches.txt

doc/ja/user-guide/organizing_your_workspace.txt

doc/ja/user-guide/part2_intro.txt

doc/ja/user-guide/partner_intro.txt

doc/ja/user-guide/plugins.txt

doc/ja/user-guide/publishing_a_branch.txt

doc/ja/user-guide/recording_changes.txt

doc/ja/user-guide/releasing_a_project.txt

doc/ja/user-guide/resolving_conflicts.txt

doc/ja/user-guide/reusing_a_checkout.txt

doc/ja/user-guide/reviewing_changes.txt

doc/ja/user-guide/sending_changes.txt

doc/ja/user-guide/server.txt

doc/ja/user-guide/setting_up_email.txt

doc/ja/user-guide/shared_repository_layouts.txt

doc/ja/user-guide/shelving_changes.txt

doc/ja/user-guide/solo_intro.txt

doc/ja/user-guide/specifying_revisions.txt

doc/ja/user-guide/stacked.txt

doc/ja/user-guide/starting_a_project.txt

doc/ja/user-guide/svn_plugin.txt

doc/ja/user-guide/undoing_mistakes.txt

doc/ja/user-guide/using_aliases.txt

doc/ja/user-guide/using_checkouts.txt

doc/ja/user-guide/using_gatekeepers.txt

doc/ja/user-guide/version_info.txt

doc/ja/user-guide/web_browsing.txt

doc/ja/user-guide/working_offline_central.txt

doc/ja/user-guide/writing_a_plugin.txt

doc/ja/user-guide/zen.txt

doc/ja/user-reference

doc/ja/user-reference/index.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

tools/generate_release_notes.py

tools/package_docs.py

tools/packaging/update-control.sh

tools/time_graph.py

tools/win32/bootstrap.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

files removed:
bzrlib/tests/blackbox/test_guess_renames.py

bzrlib/tests/test_http_implementations.py

bzrlib/textui.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/tests/test_bencode.py

doc/bazaar-vcs.org.kid

doc/developers/performance-contributing.txt

doc/en/developer-guide

doc/en/user-guide/index.txt

doc/es/guia-desarrollador

doc/es/notas-version

doc/es/referencia

files renamed:
bzrlib/_btree_serializer_c.pyx => bzrlib/_btree_serializer_pyx.pyx

bzrlib/_dirstate_helpers_c.h => bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_c.pyx => bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_knit_load_data_c.pyx => bzrlib/_knit_load_data_pyx.pyx

tools/doc_generate/ => bzrlib/doc_generate/

bzrlib/help_topics/en/conflicts.txt => bzrlib/help_topics/en/conflict-types.txt

doc/es/guia-usuario/resolving_conflicts.txt => bzrlib/help_topics/es/conflicts.txt

bzrlib/tests/branch_implementations/ => bzrlib/tests/per_branch/

bzrlib/tests/bzrdir_implementations/ => bzrlib/tests/per_bzrdir/

bzrlib/tests/interrepository_implementations/ => bzrlib/tests/per_interrepository/

bzrlib/tests/intertree_implementations/ => bzrlib/tests/per_intertree/

bzrlib/tests/inventory_implementations/ => bzrlib/tests/per_inventory/

bzrlib/tests/test_pack_repository.py => bzrlib/tests/per_pack_repository.py

bzrlib/tests/test_transport_implementations.py => bzrlib/tests/per_transport.py

bzrlib/tests/tree_implementations/ => bzrlib/tests/per_tree/

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py => bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/test_versionedfile.py => bzrlib/tests/per_versionedfile.py

bzrlib/tests/workingtree_implementations/ => bzrlib/tests/per_workingtree/

bzrlib/util/bencode.py => bzrlib/util/_bencode_py.py

doc/en/quick-reference/Makefile => doc/en/_static/en/Makefile

doc/en/quick-reference/quick-start-summary.pdf => doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/quick-reference/quick-start-summary.png => doc/en/_static/en/bzr-en-quick-reference.png

doc/en/quick-reference/quick-start-summary.svg => doc/en/_static/en/bzr-en-quick-reference.svg

doc/es/referencia-rapida/Makefile => doc/es/_static/es/Makefile

doc/es/referencia-rapida/referencia-rapida.svg => doc/es/_static/es/bzr-es-quick-reference.svg

doc/index.es.txt => doc/es/index.txt

doc/es/referencia-rapida/ => doc/es/quick-reference/

doc/es/guia-usuario/ => doc/es/user-guide/

generate_docs.py => tools/generate_docs.py

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

bzrlib/__init__.py

bzrlib/_btree_serializer_py.py

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_knit.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/errors.py

bzrlib/export/dir_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/fetch.py

bzrlib/filters/__init__.py

bzrlib/foreign.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/version.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/default.css

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/update.txt

doc/en/admin-guide/index.txt

doc/en/mini-tutorial/index.txt

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/es/mini-tutorial/index.txt

doc/es/user-guide/index.txt

doc/es/user-guide/version_info.txt

doc/index.txt

setup.py

tools/packaging/build-packages.sh

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/win32/build_release.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/ostools.py

Show diffs side-by-side

added added

removed removed

bzrlib/btree_index.py

"""B+Tree indices"""

import array

import bisect

import cStringIO

from bisect import bisect_right

from copy import deepcopy

import math

import struct

import tempfile

import zlib

index,

lru_cache,

osutils,

static_tuple,

trace,

)

from bzrlib.index import _OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS, _OPTION_LEN

def __init__(self):

"""Create a _BuilderRow."""

self.nodes = 0

self.spool = tempfile.TemporaryFile()

self.spool = None# tempfile.TemporaryFile(prefix='bzr-index-row-')

self.writer = None

def finish_node(self, pad=True):

byte_lines, _, padding = self.writer.finish()

if self.nodes == 0:

self.spool = cStringIO.StringIO()

# padded note:

self.spool.write("\x00" * _RESERVED_HEADER_BYTES)

elif self.nodes == 1:

# We got bigger than 1 node, switch to a temp file

spool = tempfile.TemporaryFile(prefix='bzr-index-row-')

spool.write(self.spool.getvalue())

self.spool = spool

skipped_bytes = 0

if not pad and padding:

del byte_lines[-1]

156

160

:param value: The value to associate with the key. It may be any

157

161

bytes as long as it does not contain \0 or \n.

158

162

"""

163

# Ensure that 'key' is a StaticTuple

164

key = static_tuple.StaticTuple.from_sequence(key).intern()

159

165

# we don't care about absent_references

160

166

node_refs, _ = self._check_key_ref_value(key, references, value)

161

167

if key in self._nodes:

162

168

raise errors.BadIndexDuplicateKey(key, self)

163

self._nodes[key] = (node_refs, value)

164

self._keys.add(key)

169

self._nodes[key] = static_tuple.StaticTuple(node_refs, value)

165

170

if self._nodes_by_key is not None and self._key_length > 1:

166

171

self._update_nodes_by_key(key, value, node_refs)

167

if len(self._keys) < self._spill_at:

172

if len(self._nodes) < self._spill_at:

168

173

return

169

174

self._spill_mem_keys_to_disk()

170

175

186

191

backing_pos) = self._spill_mem_keys_and_combine()

187

192

else:

188

193

new_backing_file, size = self._spill_mem_keys_without_combining()

189

dir_path, base_name = osutils.split(new_backing_file.name)

190

194

# Note: The transport here isn't strictly needed, because we will use

191

195

# direct access to the new_backing._file object

192

new_backing = BTreeGraphIndex(get_transport(dir_path),

193

base_name, size)

196

new_backing = BTreeGraphIndex(get_transport('.'), '<temp>', size)

194

197

# GC will clean up the file

195

198

new_backing._file = new_backing_file

196

199

if self._combine_backing_indices:

201

204

self._backing_indices[backing_pos] = None

202

205

else:

203

206

self._backing_indices.append(new_backing)

204

self._keys = set()

205

207

self._nodes = {}

206

208

self._nodes_by_key = None

207

209

319

321

new_row = True

320

322

for row in reversed(rows[:-1]):

321

323

# Mark the start of the next node in the node above. If it

322

# doesn't fit then propogate upwards until we find one that

324

# doesn't fit then propagate upwards until we find one that

323

325

# it does fit into.

324

326

if row.writer.write(key_line):

325

327

row.finish_node()

370

372

self.row_lengths = []

371

373

# Loop over all nodes adding them to the bottom row

372

374

# (rows[-1]). When we finish a chunk in a row,

373

# propogate the key that didn't fit (comes after the chunk) to the

375

# propagate the key that didn't fit (comes after the chunk) to the

374

376

# row above, transitively.

375

377

for node in node_iterator:

376

378

if key_count == 0:

383

385

for row in reversed(rows):

384

386

pad = (type(row) != _LeafBuilderRow)

385

387

row.finish_node(pad=pad)

386

result = tempfile.NamedTemporaryFile(prefix='bzr-index-')

387

388

lines = [_BTSIGNATURE]

388

389

lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')

389

390

lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')

390

391

lines.append(_OPTION_LEN + str(key_count) + '\n')

391

392

row_lengths = [row.nodes for row in rows]

392

393

lines.append(_OPTION_ROW_LENGTHS + ','.join(map(str, row_lengths)) + '\n')

394

if row_lengths and row_lengths[-1] > 1:

395

result = tempfile.NamedTemporaryFile(prefix='bzr-index-')

396

else:

397

result = cStringIO.StringIO()

393

398

result.writelines(lines)

394

399

position = sum(map(len, lines))

395

400

root_row = True

406

411

# Special case the first node as it may be prefixed

407

412

node = row.spool.read(_PAGE_SIZE)

408

413

result.write(node[reserved:])

409

result.write("\x00" * (reserved - position))

414

if len(node) == _PAGE_SIZE:

415

result.write("\x00" * (reserved - position))

410

416

position = 0 # Only the root row actually has an offset

411

417

copied_len = osutils.pumpfile(row.spool, result)

412

418

if copied_len != (row.nodes - 1) * _PAGE_SIZE:

431

437

def iter_all_entries(self):

432

438

"""Iterate over all keys within the index

433

439

434

:return: An iterable of (index, key, reference_lists, value). There is no

435

defined order for the result iteration - it will be in the most

440

:return: An iterable of (index, key, value, reference_lists). There is

441

no defined order for the result iteration - it will be in the most

436

442

efficient order for the index (in this case dictionary hash order).

437

443

"""

438

444

if 'evil' in debug.debug_flags:

457

463

efficient order for the index (keys iteration order in this case).

458

464

"""

459

465

keys = set(keys)

460

local_keys = keys.intersection(self._keys)

466

# Note: We don't use keys.intersection() here. If you read the C api,

467

# set.intersection(other) special cases when other is a set and

468

# will iterate the smaller of the two and look up in the other.

469

# It does *not* do this for any other type (even dict, unlike

470

# some other set functions.) Since we expect keys is generally <<

471

# self._nodes, it is faster to iterate over it in a list

472

# comprehension

473

nodes = self._nodes

474

local_keys = [key for key in keys if key in nodes]

461

475

if self.reference_lists:

462

476

for key in local_keys:

463

node = self._nodes[key]

477

node = nodes[key]

464

478

yield self, key, node[1], node[0]

465

479

else:

466

480

for key in local_keys:

467

node = self._nodes[key]

481

node = nodes[key]

468

482

yield self, key, node[1]

469

483

# Find things that are in backing indices that have not been handled

470

484

# yet.

580

594

581

595

For InMemoryGraphIndex the estimate is exact.

582

596

"""

583

return len(self._keys) + sum(backing.key_count() for backing in

597

return len(self._nodes) + sum(backing.key_count() for backing in

584

598

self._backing_indices if backing is not None)

585

599

586

600

def validate(self):

590

604

class _LeafNode(object):

591

605

"""A leaf node for a serialised B+Tree index."""

592

606

607

__slots__ = ('keys', 'min_key', 'max_key')

608

593

609

def __init__(self, bytes, key_length, ref_list_length):

594

610

"""Parse bytes to create a leaf node object."""

595

611

# splitlines mangles the \r delimiters.. don't use it.

596

self.keys = dict(_btree_serializer._parse_leaf_lines(bytes,

597

key_length, ref_list_length))

612

key_list = _btree_serializer._parse_leaf_lines(bytes,

613

key_length, ref_list_length)

614

if key_list:

615

self.min_key = key_list[0][0]

616

self.max_key = key_list[-1][0]

617

else:

618

self.min_key = self.max_key = None

619

self.keys = dict(key_list)

598

620

599

621

600

622

class _InternalNode(object):

601

623

"""An internal node for a serialised B+Tree index."""

602

624

625

__slots__ = ('keys', 'offset')

626

603

627

def __init__(self, bytes):

604

628

"""Parse bytes to create an internal node object."""

605

629

# splitlines mangles the \r delimiters.. don't use it.

608

632

def _parse_lines(self, lines):

609

633

nodes = []

610

634

self.offset = int(lines[1][7:])

635

as_st = static_tuple.StaticTuple.from_sequence

611

636

for line in lines[2:]:

612

637

if line == '':

613

638

break

614

nodes.append(tuple(line.split('\0')))

639

nodes.append(as_st(map(intern, line.split('\0'))).intern())

615

640

return nodes

616

641

617

642

622

647

memory except when very large walks are done.

623

648

"""

624

649

625

def __init__(self, transport, name, size):

650

def __init__(self, transport, name, size, unlimited_cache=False):

626

651

"""Create a B+Tree index object on the index name.

627

652

628

653

:param transport: The transport to read data for the index from.

632

657

the initial read (to read the root node header) can be done

633

658

without over-reading even on empty indices, and on small indices

634

659

allows single-IO to read the entire index.

660

:param unlimited_cache: If set to True, then instead of using an

661

LRUCache with size _NODE_CACHE_SIZE, we will use a dict and always

662

cache all leaf nodes.

635

663

"""

636

664

self._transport = transport

637

665

self._name = name

641

669

self._root_node = None

642

670

# Default max size is 100,000 leaf values

643

671

self._leaf_value_cache = None # lru_cache.LRUCache(100*1000)

644

self._leaf_node_cache = lru_cache.LRUCache(_NODE_CACHE_SIZE)

645

# We could limit this, but even a 300k record btree has only 3k leaf

646

# nodes, and only 20 internal nodes. So the default of 100 nodes in an

647

# LRU would mean we always cache everything anyway, no need to pay the

648

# overhead of LRU

649

self._internal_node_cache = fifo_cache.FIFOCache(100)

672

if unlimited_cache:

673

self._leaf_node_cache = {}

674

self._internal_node_cache = {}

675

else:

676

self._leaf_node_cache = lru_cache.LRUCache(_NODE_CACHE_SIZE)

677

# We use a FIFO here just to prevent possible blowout. However, a

678

# 300k record btree has only 3k leaf nodes, and only 20 internal

679

# nodes. A value of 100 scales to ~100*100*100 = 1M records.

680

self._internal_node_cache = fifo_cache.FIFOCache(100)

650

681

self._key_count = None

651

682

self._row_lengths = None

652

683

self._row_offsets = None # Start of each row, [-1] is the end

684

715

if start_of_leaves is None:

685

716

start_of_leaves = self._row_offsets[-2]

686

717

if node_pos < start_of_leaves:

687

self._internal_node_cache.add(node_pos, node)

718

self._internal_node_cache[node_pos] = node

688

719

else:

689

self._leaf_node_cache.add(node_pos, node)

720

self._leaf_node_cache[node_pos] = node

690

721

found[node_pos] = node

691

722

return found

692

723

831

862

new_tips = next_tips

832

863

return final_offsets

833

864

865

def clear_cache(self):

866

"""Clear out any cached/memoized values.

867

868

This can be called at any time, but generally it is used when we have

869

extracted some information, but don't expect to be requesting any more

870

from this index.

871

"""

872

# Note that we don't touch self._root_node or self._internal_node_cache

873

# We don't expect either of those to be big, and it can save

874

# round-trips in the future. We may re-evaluate this if InternalNode

875

# memory starts to be an issue.

876

self._leaf_node_cache.clear()

877

834

878

def external_references(self, ref_list_num):

835

879

if self._root_node is None:

836

880

self._get_root_node()

1039

1083

output.append(cur_out)

1040

1084

return output

1041

1085

1086

def _walk_through_internal_nodes(self, keys):

1087

"""Take the given set of keys, and find the corresponding LeafNodes.

1088

1089

:param keys: An unsorted iterable of keys to search for

1090

:return: (nodes, keys_at_index)

1091

nodes is a dict mapping {index: LeafNode}

1092

keys_at_index is a list of tuples of [(index, [keys for Leaf])]

1093

"""

1094

# 6 seconds spent in miss_torture using the sorted() line.

1095

# Even with out of order disk IO it seems faster not to sort it when

1096

# large queries are being made.

1097

keys_at_index = [(0, sorted(keys))]

1098

1099

for row_pos, next_row_start in enumerate(self._row_offsets[1:-1]):

1100

node_indexes = [idx for idx, s_keys in keys_at_index]

1101

nodes = self._get_internal_nodes(node_indexes)

1102

1103

next_nodes_and_keys = []

1104

for node_index, sub_keys in keys_at_index:

1105

node = nodes[node_index]

1106

positions = self._multi_bisect_right(sub_keys, node.keys)

1107

node_offset = next_row_start + node.offset

1108

next_nodes_and_keys.extend([(node_offset + pos, s_keys)

1109

for pos, s_keys in positions])

1110

keys_at_index = next_nodes_and_keys

1111

# We should now be at the _LeafNodes

1112

node_indexes = [idx for idx, s_keys in keys_at_index]

1113

1114

# TODO: We may *not* want to always read all the nodes in one

1115

# big go. Consider setting a max size on this.

1116

nodes = self._get_leaf_nodes(node_indexes)

1117

return nodes, keys_at_index

1118

1042

1119

def iter_entries(self, keys):

1043

1120

"""Iterate over keys within the index.

1044

1121

1082

1159

needed_keys = keys

1083

1160

if not needed_keys:

1084

1161

return

1085

# 6 seconds spent in miss_torture using the sorted() line.

1086

# Even with out of order disk IO it seems faster not to sort it when

1087

# large queries are being made.

1088

needed_keys = sorted(needed_keys)

1089

1090

nodes_and_keys = [(0, needed_keys)]

1091

1092

for row_pos, next_row_start in enumerate(self._row_offsets[1:-1]):

1093

node_indexes = [idx for idx, s_keys in nodes_and_keys]

1094

nodes = self._get_internal_nodes(node_indexes)

1095

1096

next_nodes_and_keys = []

1097

for node_index, sub_keys in nodes_and_keys:

1098

node = nodes[node_index]

1099

positions = self._multi_bisect_right(sub_keys, node.keys)

1100

node_offset = next_row_start + node.offset

1101

next_nodes_and_keys.extend([(node_offset + pos, s_keys)

1102

for pos, s_keys in positions])

1103

nodes_and_keys = next_nodes_and_keys

1104

# We should now be at the _LeafNodes

1105

node_indexes = [idx for idx, s_keys in nodes_and_keys]

1106

1107

# TODO: We may *not* want to always read all the nodes in one

1108

# big go. Consider setting a max size on this.

1109

1110

nodes = self._get_leaf_nodes(node_indexes)

1162

nodes, nodes_and_keys = self._walk_through_internal_nodes(needed_keys)

1111

1163

for node_index, sub_keys in nodes_and_keys:

1112

1164

if not sub_keys:

1113

1165

continue

1120

1172

else:

1121

1173

yield (self, next_sub_key, value)

1122

1174

1175

def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):

1176

"""Find the parent_map information for the set of keys.

1177

1178

This populates the parent_map dict and missing_keys set based on the

1179

queried keys. It also can fill out an arbitrary number of parents that

1180

it finds while searching for the supplied keys.

1181

1182

It is unlikely that you want to call this directly. See

1183

"CombinedGraphIndex.find_ancestry()" for a more appropriate API.

1184

1185

:param keys: The keys whose ancestry we want to return

1186

Every key will either end up in 'parent_map' or 'missing_keys'.

1187

:param ref_list_num: This index in the ref_lists is the parents we

1188

care about.

1189

:param parent_map: {key: parent_keys} for keys that are present in this

1190

index. This may contain more entries than were in 'keys', that are

1191

reachable ancestors of the keys requested.

1192

:param missing_keys: keys which are known to be missing in this index.

1193

This may include parents that were not directly requested, but we

1194

were able to determine that they are not present in this index.

1195

:return: search_keys, parents that were found but not queried to know

1196

if they are missing or present. Callers can re-query this index for

1197

those keys, and they will be placed into parent_map or missing_keys

1198

"""

1199

if not self.key_count():

1200

# We use key_count() to trigger reading the root node and

1201

# determining info about this BTreeGraphIndex

1202

# If we don't have any keys, then everything is missing

1203

missing_keys.update(keys)

1204

return set()

1205

if ref_list_num >= self.node_ref_lists:

1206

raise ValueError('No ref list %d, index has %d ref lists'

1207

% (ref_list_num, self.node_ref_lists))

1208

1209

# The main trick we are trying to accomplish is that when we find a

1210

# key listing its parents, we expect that the parent key is also likely

1211

# to sit on the same page, allowing us to expand parents quickly

1212

# without suffering the full stack of bisecting, etc.

1213

nodes, nodes_and_keys = self._walk_through_internal_nodes(keys)

1214

1215

# These are parent keys which could not be immediately resolved on the

1216

# page where the child was present. Note that we may already be

1217

# searching for that key, and it may actually be present [or known

1218

# missing] on one of the other pages we are reading.

1219

# TODO:

1220

# We could try searching for them in the immediate previous or next

1221

# page. If they occur "later" we could put them in a pending lookup

1222

# set, and then for each node we read thereafter we could check to

1223

# see if they are present.

1224

# However, we don't know the impact of keeping this list of things

1225

# that I'm going to search for every node I come across from here on

1226

# out.

1227

# It doesn't handle the case when the parent key is missing on a

1228

# page that we *don't* read. So we already have to handle being

1229

# re-entrant for that.

1230

# Since most keys contain a date string, they are more likely to be

1231

# found earlier in the file than later, but we would know that right

1232

# away (key < min_key), and wouldn't keep searching it on every other

1233

# page that we read.

1234

# Mostly, it is an idea, one which should be benchmarked.

1235

parents_not_on_page = set()

1236

1237

for node_index, sub_keys in nodes_and_keys:

1238

if not sub_keys:

1239

continue

1240

# sub_keys is all of the keys we are looking for that should exist

1241

# on this page, if they aren't here, then they won't be found

1242

node = nodes[node_index]

1243

node_keys = node.keys

1244

parents_to_check = set()

1245

for next_sub_key in sub_keys:

1246

if next_sub_key not in node_keys:

1247

# This one is just not present in the index at all

1248

missing_keys.add(next_sub_key)

1249

else:

1250

value, refs = node_keys[next_sub_key]

1251

parent_keys = refs[ref_list_num]

1252

parent_map[next_sub_key] = parent_keys

1253

parents_to_check.update(parent_keys)

1254

# Don't look for things we've already found

1255

parents_to_check = parents_to_check.difference(parent_map)

1256

# this can be used to test the benefit of having the check loop

1257

# inlined.

1258

# parents_not_on_page.update(parents_to_check)

1259

# continue

1260

while parents_to_check:

1261

next_parents_to_check = set()

1262

for key in parents_to_check:

1263

if key in node_keys:

1264

value, refs = node_keys[key]

1265

parent_keys = refs[ref_list_num]

1266

parent_map[key] = parent_keys

1267

next_parents_to_check.update(parent_keys)

1268

else:

1269

# This parent either is genuinely missing, or should be

1270

# found on another page. Perf test whether it is better

1271

# to check if this node should fit on this page or not.

1272

# in the 'everything-in-one-pack' scenario, *not*

1273

# doing the check is 237ms vs 243ms.

1274

# So slightly better, but I assume the standard 'lots

1275

# of packs' is going to show a reasonable improvement

1276

# from the check, because it avoids 'going around

1277

# again' for everything that is in another index

1278

# parents_not_on_page.add(key)

1279

# Missing for some reason

1280

if key < node.min_key:

1281

# in the case of bzr.dev, 3.4k/5.3k misses are

1282

# 'earlier' misses (65%)

1283

parents_not_on_page.add(key)

1284

elif key > node.max_key:

1285

# This parent key would be present on a different

1286

# LeafNode

1287

parents_not_on_page.add(key)

1288

else:

1289

# assert key != node.min_key and key != node.max_key

1290

# If it was going to be present, it would be on

1291

# *this* page, so mark it missing.

1292

missing_keys.add(key)

1293

parents_to_check = next_parents_to_check.difference(parent_map)

1294

# Might want to do another .difference() from missing_keys

1295

# parents_not_on_page could have been found on a different page, or be

1296

# known to be missing. So cull out everything that has already been

1297

# found.

1298

search_keys = parents_not_on_page.difference(

1299

parent_map).difference(missing_keys)

1300

return search_keys

1301

1123

1302

def iter_entries_prefix(self, keys):

1124

1303

"""Iterate over keys within the index using prefix matching.

1125

1304

1384

1563

1385

1564

1386

1565

try:

1387

from bzrlib import _btree_serializer_c as _btree_serializer

1388

except ImportError:

1566

from bzrlib import _btree_serializer_pyx as _btree_serializer

1567

except ImportError, e:

1568

osutils.failed_to_load_extension(e)

1389

1569

from bzrlib import _btree_serializer_py as _btree_serializer

Older »