        # prefix is the key in self._items to use, key_filter is the key_filter
        # entries that would match this node
        keys = {}
        shortcut = False
        if key_filter is None:
            # yielding all nodes, yield whatever we have, and queue up a read
            # for whatever we are missing
            shortcut = True
            for prefix, node in self._items.iteritems():
                if node.__class__ is StaticTuple:
                    keys[node] = (prefix, None)
                else:
                    yield node, None
        elif len(key_filter) == 1:
            # Technically, this path could also be handled by the first check
            # in 'self._node_width' in length_filters. However, we can handle
            # this case without spending any time building up the
            # prefix_to_keys, etc state.

            # This is a bit ugly, but TIMEIT showed it to be by far the fastest
            # 0.626us   list(key_filter)[0]
            #       is a func() for list(), 2 mallocs, and a getitem
            # 0.489us   [k for k in key_filter][0]
            #       still has the mallocs, avoids the func() call
            # 0.350us   iter(key_filter).next()
            #       has a func() call, and mallocs an iterator
            # 0.125us   for key in key_filter: pass
            #       no func() overhead, might malloc an iterator
            # 0.105us   for key in key_filter: break
            #       no func() overhead, might malloc an iterator, probably
            #       avoids checking an 'else' clause as part of the for
            for key in key_filter:
                break
            search_prefix = self._search_prefix_filter(key)
            if len(search_prefix) == self._node_width:
                # This item will match exactly, so just do a dict lookup, and
                # see what we can return
                shortcut = True
                try:
                    node = self._items[search_prefix]
                except KeyError:
                    # A given key can only match 1 child node, if it isn't
                    # there, then we can just return nothing
                    return
                if node.__class__ is StaticTuple:
                    keys[node] = (search_prefix, [key])
                else:
                    # This is loaded, and the only thing that can match,
                    # return
                    yield node, [key]
                    return
        if not shortcut:
            # First, convert all keys into a list of search prefixes
            # Aggregate common prefixes, and track the keys they come from
            prefix_to_keys = {}
            length_filters = {}
            for key in key_filter:
                search_prefix = self._search_prefix_filter(key)
                length_filter = length_filters.setdefault(
                                    len(search_prefix), set())
                length_filter.add(search_prefix)
                prefix_to_keys.setdefault(search_prefix, []).append(key)

            if (self._node_width in length_filters
                and len(length_filters) == 1):
                # all of the search prefixes match exactly _node_width. This
                # means that everything is an exact match, and we can do a
                # lookup into self._items, rather than iterating over the items
                # dict
                search_prefixes = length_filters[self._node_width]
                for search_prefix in search_prefixes:
                    try:
                        node = self._items[search_prefix]
                    except KeyError:
                        # We can ignore this one
                        continue
                    node_key_filter = prefix_to_keys[search_prefix]
                    if node.__class__ is StaticTuple:
                        keys[node] = (search_prefix, node_key_filter)
                    else:
                        yield node, node_key_filter
            else:
                # The slow way. We walk every item in self._items, and check to
                # see if there are any matches
                length_filters = length_filters.items()
                for prefix, node in self._items.iteritems():
                    node_key_filter = []
                    for length, length_filter in length_filters:
                        sub_prefix = prefix[:length]
                        if sub_prefix in length_filter:
                            node_key_filter.extend(prefix_to_keys[sub_prefix])
                    if node_key_filter: # this key matched something, yield it
                        if node.__class__ is StaticTuple:
                            keys[node] = (prefix, node_key_filter)
                        else:
                            yield node, node_key_filter
        if keys:
            # Look in the page cache for some more bytes
            found_keys = set()
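            # At this point 'keys' maps each unresolved chk key to the
            # (prefix, key_filter) pair for the child that still needs to be
            # read; the code that follows consults the page cache first and
            # then batches store reads for whatever is left.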

def _find_children_info(store, interesting_keys, uninteresting_keys, pb):
    """Read the associated records, and determine what is interesting."""
    uninteresting_keys = set(uninteresting_keys)
    chks_to_read = uninteresting_keys.union(interesting_keys)
    next_uninteresting = set()
    next_interesting = set()
    uninteresting_items = set()
    interesting_items = set()
    interesting_records = []
    # records_read = set()
    for record in store.get_record_stream(chks_to_read, 'unordered', True):
        # records_read.add(record.key())
        if pb is not None:
            pb.tick()
        bytes = record.get_bytes_as('fulltext')
        # We don't care about search_key_func for this code, because we only
        # care about external references.
        node = _deserialise(bytes, record.key, search_key_func=None)
        if record.key in uninteresting_keys:
            if type(node) is InternalNode:
                next_uninteresting.update(node.refs())
            else:
                # We know we are at a LeafNode, so we can pass None for the
                # store
                uninteresting_items.update(node.iteritems(None))
        else:
            interesting_records.append(record)
            if type(node) is InternalNode:
                next_interesting.update(node.refs())
            else:
                interesting_items.update(node.iteritems(None))
    # TODO: Filter out records that have already been read, as node splitting
    #       can cause us to reference the same nodes via shorter and longer
    #       paths
    return (next_uninteresting, uninteresting_items,
            next_interesting, interesting_records, interesting_items)

def _find_all_uninteresting(store, interesting_root_keys,
                            uninteresting_root_keys, adapter, pb):
    """Determine the full set of uninteresting keys."""
    # What about duplicates between interesting_root_keys and
    # uninteresting_root_keys?
    if not uninteresting_root_keys:
        # Shortcut case. We know there is nothing uninteresting to filter out
        # So we just let the rest of the algorithm do the work
        # We know there is nothing uninteresting, and we didn't have to read
        # any interesting records yet.
        return (set(), set(), set(interesting_root_keys), [], set())
    all_uninteresting_chks = set(uninteresting_root_keys)
    all_uninteresting_items = set()

    # First step, find the direct children of both the interesting and
    # uninteresting keys
    (uninteresting_keys, uninteresting_items,
     interesting_keys, interesting_records,
     interesting_items) = _find_children_info(store, interesting_root_keys,
                                              uninteresting_root_keys,
                                              pb=pb)
    all_uninteresting_chks.update(uninteresting_keys)
    all_uninteresting_items.update(uninteresting_items)
    del uninteresting_items
    # Note: Exact matches between interesting and uninteresting do not need
    #       to be searched further. Non-exact matches need to be searched in
    #       case there is a future exact-match
    uninteresting_keys.difference_update(interesting_keys)

    # Second, find the full set of uninteresting bits reachable by the
    # uninteresting roots
    chks_to_read = uninteresting_keys
    while chks_to_read:
        next_chks = set()
        for record in store.get_record_stream(chks_to_read, 'unordered', False):
            # TODO: Handle 'absent'
            if pb is not None:
                pb.tick()
            try:
                bytes = record.get_bytes_as('fulltext')
            except errors.UnavailableRepresentation:
                bytes = adapter.get_bytes(record)
            # We don't care about search_key_func for this code, because we
            # only care about external references.
            node = _deserialise(bytes, record.key, search_key_func=None)
            if type(node) is InternalNode:
                # uninteresting_prefix_chks.update(node._items.iteritems())
                chks = node._items.values()
                # TODO: We remove the entries that are already in
                #       uninteresting_chks ?
                next_chks.update(chks)
                all_uninteresting_chks.update(chks)
            else:
                all_uninteresting_items.update(node._items.iteritems())
        chks_to_read = next_chks
    return (all_uninteresting_chks, all_uninteresting_items,
            interesting_keys, interesting_records, interesting_items)
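
# _find_all_uninteresting() (together with _find_children_info() above) feeds
# iter_interesting_nodes() at the end of this module: the closure of pages and
# items reachable from the uninteresting roots is computed first, and the
# interesting pages are then walked and filtered against it.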

class CHKMapDifference(object):
    """Iterate the stored pages and key,value pairs for (new - old).

    This class provides a generator over the stored CHK pages and the
    (key, value) pairs that are in any of the new maps and not in any of the
    old maps.

    Note that it may yield chk pages that are common (especially root nodes),
    but it won't yield (key,value) pairs that are common.
    """

    def __init__(self, store, new_root_keys, old_root_keys,
                 search_key_func, pb=None):
        # TODO: Should we add a StaticTuple barrier here? It would be nice to
        #       force callers to use StaticTuple, because there will often be
        #       lots of keys passed in here. And even if we cast it locally,
        #       that just means that we will have *both* a StaticTuple and a
        #       tuple() in memory, referring to the same object. (so a net
        #       increase in memory, not a decrease.)
        self._store = store
        self._new_root_keys = new_root_keys
        self._old_root_keys = old_root_keys
        self._pb = pb
        # All uninteresting chks that we have seen. By the time they are added
        # here, they should be either fully ignored, or queued up for
        # processing
        # TODO: This might grow to a large size if there are lots of merge
        #       parents, etc. However, it probably doesn't scale to O(history)
        #       like _processed_new_refs does.
        self._all_old_chks = set(self._old_root_keys)
        # All items that we have seen from the old_root_keys
        self._all_old_items = set()
        # These are interesting items which were either read, or already in the
        # interesting queue (so we don't need to walk them again)
        # TODO: processed_new_refs becomes O(all_chks), consider switching to
        #       SimpleSet here.
        self._processed_new_refs = set()
        self._search_key_func = search_key_func

        # The uninteresting and interesting nodes to be searched
        self._old_queue = []
        self._new_queue = []
        # Holds the (key, value) items found when processing the root nodes,
        # waiting for the uninteresting nodes to be walked
        self._new_item_queue = []

    def _read_nodes_from_store(self, keys):
        # We chose not to use _page_cache, because we think in terms of records
        # to be yielded. Also, we expect to touch each page only 1 time during
        # this code. (We may want to evaluate saving the raw bytes into the
        # page cache, which would allow a working tree update after the fetch
        # to not have to read the bytes again.)
        as_st = StaticTuple.from_sequence
        stream = self._store.get_record_stream(keys, 'unordered', True)
        for record in stream:
            if self._pb is not None:
                self._pb.tick()
            if record.storage_kind == 'absent':
                raise errors.NoSuchRevision(self._store, record.key)
            bytes = record.get_bytes_as('fulltext')
            node = _deserialise(bytes, record.key,
                                search_key_func=self._search_key_func)
            if type(node) is InternalNode:
                # Note we don't have to do node.refs() because we know that
                # there are no children that have been pushed into this node
                # Note: Using as_st() here seemed to save 1.2MB, which would
                #       indicate that we keep 100k prefix_refs around while
                #       processing. They *should* be shorter lived than that...
                #       It does cost us ~10s of processing time
                #prefix_refs = [as_st(item) for item in node._items.iteritems()]
                prefix_refs = node._items.items()
                items = []
            else:
                prefix_refs = []
                # Note: We don't use a StaticTuple here. Profiling showed a
                #       minor memory improvement (0.8MB out of 335MB peak 0.2%)
                #       But a significant slowdown (15s / 145s, or 10%)
                items = node._items.items()
            yield record, node, prefix_refs, items
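            # Each yielded tuple is (record, node, prefix_refs, items):
            # prefix_refs is only populated for InternalNodes (a list of
            # (prefix, child chk key) pairs) and items only for LeafNodes
            # (a list of (key, value) pairs).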

    def _read_old_roots(self):
        old_chks_to_enqueue = []
        all_old_chks = self._all_old_chks
        for record, node, prefix_refs, items in \
                self._read_nodes_from_store(self._old_root_keys):
            # Uninteresting node
            prefix_refs = [p_r for p_r in prefix_refs
                                if p_r[1] not in all_old_chks]
            new_refs = [p_r[1] for p_r in prefix_refs]
            all_old_chks.update(new_refs)
            # TODO: This might be a good time to turn items into StaticTuple
            #       instances and possibly intern them. However, this does not
            #       impact 'initial branch' performance, so I'm not worrying
            #       about it now
            self._all_old_items.update(items)
            # Queue up the uninteresting references
            # Don't actually put them in the 'to-read' queue until we have
            # finished checking the interesting references
            old_chks_to_enqueue.extend(prefix_refs)
        return old_chks_to_enqueue

    def _enqueue_old(self, new_prefixes, old_chks_to_enqueue):
        # At this point, we have read all the uninteresting and interesting
        # items, so we can queue up the uninteresting stuff, knowing that we've
        # handled the interesting ones
        for prefix, ref in old_chks_to_enqueue:
            not_interesting = True
            for i in xrange(len(prefix), 0, -1):
                if prefix[:i] in new_prefixes:
                    not_interesting = False
                    break
            if not_interesting:
                # This prefix is not part of the remaining 'interesting set'
                continue
            self._old_queue.append(ref)
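        # Illustrative example (not in the original source): with
        # new_prefixes = set(['a', 'ab']), an old ref queued under prefix
        # 'abc' is appended to self._old_queue (its prefix 'ab' still
        # overlaps the interesting set, so the old page must be walked),
        # while one queued under 'cd' overlaps nothing interesting and is
        # skipped.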

    def _read_all_roots(self):
        """Read the root pages.

        This is structured as a generator, so that the root records can be
        yielded up to whoever needs them without any buffering.
        """
        # This is the bootstrap phase
        if not self._old_root_keys:
            # With no old_root_keys we can just shortcut and be ready
            # for _flush_new_queue
            self._new_queue = list(self._new_root_keys)
            return
        old_chks_to_enqueue = self._read_old_roots()
        # filter out any root keys that are already known to be uninteresting
        new_keys = set(self._new_root_keys).difference(self._all_old_chks)
        # These are prefixes that are present in new_keys that we are
        # thinking about
        new_prefixes = set()
        # We are about to yield all of these, so we don't want them getting
        # added a second time
        processed_new_refs = self._processed_new_refs
        processed_new_refs.update(new_keys)
        for record, node, prefix_refs, items in \
                self._read_nodes_from_store(new_keys):
            # At this level, we now know all the uninteresting references
            # So we filter and queue up whatever is remaining
            prefix_refs = [p_r for p_r in prefix_refs
                           if p_r[1] not in self._all_old_chks
                              and p_r[1] not in processed_new_refs]
            refs = [p_r[1] for p_r in prefix_refs]
            new_prefixes.update([p_r[0] for p_r in prefix_refs])
            self._new_queue.extend(refs)
            # TODO: We can potentially get multiple items here, however the
            #       current design allows for this, as callers will do the work
            #       to make the results unique. We might profile whether we
            #       gain anything by ensuring unique return values for items
            # TODO: This might be a good time to cast to StaticTuple, as
            #       self._new_item_queue will hold the contents of multiple
            #       records for an extended lifetime
            new_items = [item for item in items
                               if item not in self._all_old_items]
            self._new_item_queue.extend(new_items)
            new_prefixes.update([self._search_key_func(item[0])
                                 for item in new_items])
            processed_new_refs.update(refs)
            yield record
        # For new_prefixes we have the full length prefixes queued up.
        # However, we also need possible prefixes. (If we have a known ref to
        # 'ab', then we also need to include 'a'.) So expand the
        # new_prefixes to include all shorter prefixes
        for prefix in list(new_prefixes):
            new_prefixes.update([prefix[:i] for i in xrange(1, len(prefix))])
        self._enqueue_old(new_prefixes, old_chks_to_enqueue)
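        # When this generator is exhausted, self._new_queue holds the
        # still-unexplored new references, self._new_item_queue holds the
        # candidate (key, value) items from the new root pages, and
        # self._old_queue holds the old references whose prefixes still
        # overlap the interesting prefixes.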

    def _flush_new_queue(self):
        # No need to maintain the heap invariant anymore, just pull things out
        # and process them
        refs = set(self._new_queue)
        self._new_queue = []
        # First pass, flush all interesting items and convert to using direct refs
        all_old_chks = self._all_old_chks
        processed_new_refs = self._processed_new_refs
        all_old_items = self._all_old_items
        new_items = [item for item in self._new_item_queue
                           if item not in all_old_items]
        self._new_item_queue = []
        if new_items:
            yield None, new_items
        refs = refs.difference(all_old_chks)
        processed_new_refs.update(refs)
        while refs:
            # TODO: Using a SimpleSet for self._processed_new_refs
            #       saved as much as 10MB of peak memory. However, it requires
            #       implementing a non-pyrex version.
            next_refs = set()
            next_refs_update = next_refs.update
            # Inlining _read_nodes_from_store improves 'bzr branch bzr.dev'
            # from 1m54s to 1m51s. Consider it.
            for record, _, p_refs, items in self._read_nodes_from_store(refs):
                if all_old_items:
                    # using the 'if' check saves about 145s => 141s, when
                    # streaming initial branch of Launchpad data.
                    items = [item for item in items
                             if item not in all_old_items]
                yield record, items
                next_refs_update([p_r[1] for p_r in p_refs])
                del p_refs
            # set1.difference(set/dict) walks all of set1, and checks if it
            # exists in 'other'.
            # set1.difference(iterable) walks all of iterable, and does a
            # 'difference_update' on a clone of set1. Pick wisely based on the
            # expected sizes of objects.
            # in our case it is expected that 'new_refs' will always be quite
            # small.
            next_refs = next_refs.difference(all_old_chks)
            next_refs = next_refs.difference(processed_new_refs)
            processed_new_refs.update(next_refs)
            refs = next_refs
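            # For example (illustrative): next_refs holds one batch of child
            # references and stays comparatively small, while all_old_chks and
            # processed_new_refs keep growing, so next_refs.difference(...)
            # above only walks the small set each time round the loop.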

    def _process_next_old(self):
        # Since we don't filter uninteresting any further than during
        # _read_all_roots, process the whole queue in a single pass.
        refs = self._old_queue
        self._old_queue = []
        all_old_chks = self._all_old_chks
        for record, _, prefix_refs, items in self._read_nodes_from_store(refs):
            # TODO: Use StaticTuple here?
            self._all_old_items.update(items)
            refs = [r for _, r in prefix_refs if r not in all_old_chks]
            self._old_queue.extend(refs)
            all_old_chks.update(refs)

    def _process_queues(self):
        while self._old_queue:
            self._process_next_old()
        return self._flush_new_queue()

    def process(self):
        for record in self._read_all_roots():
            yield record, []
        for record, items in self._process_queues():
            yield record, items
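

# The sketch below is illustrative only (it is not part of the original
# module): it shows one way CHKMapDifference might be driven. 'store' is
# assumed to be a VersionedFiles-like object exposing get_record_stream()
# and a _search_key_func attribute, as used elsewhere in this file.
def _example_chk_difference(store, new_root_keys, old_root_keys, pb=None):
    iterator = CHKMapDifference(store, new_root_keys, old_root_keys,
                                search_key_func=store._search_key_func,
                                pb=pb)
    for record, items in iterator.process():
        if record is not None:
            # a stored page that is (probably) only reachable from the new
            # roots; record.key identifies the chk page
            pass
        for key, value in items:
            # a (key, value) pair present in the new maps but not in the old
            pass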

def iter_interesting_nodes(store, interesting_root_keys,
                           uninteresting_root_keys, pb=None):
    """Given root keys, find interesting nodes.

    Evaluate nodes referenced by interesting_root_keys. Ones that are also
    referenced from uninteresting_root_keys are not considered interesting.

    :param interesting_root_keys: keys which should be part of the
        "interesting" nodes (which will be yielded)
    :param uninteresting_root_keys: keys which should be filtered out of the
        result set.
    :return: Yield
        (interesting records, {interesting key:values})
    """
    # TODO: consider that it may be more memory efficient to use the 20-byte
    #       sha1 string, rather than tuples of hexidecimal sha1 strings.
    # TODO: Try to factor out a lot of the get_record_stream() calls into a
    #       helper function similar to _read_bytes. This function should be
    #       able to use nodes from the _page_cache as well as actually
    #       requesting bytes from the store.

    # A way to adapt from the compressed texts back into fulltexts
    # In a way, this seems like a layering inversion to have CHKMap know the
    # details of versionedfile
    adapter_class = versionedfile.adapter_registry.get(
        ('knit-ft-gz', 'fulltext'))
    adapter = adapter_class(store)

    (all_uninteresting_chks, all_uninteresting_items, interesting_keys,
     interesting_records, interesting_items) = _find_all_uninteresting(store,
        interesting_root_keys, uninteresting_root_keys, adapter, pb)

    # Now that we know everything uninteresting, we can yield information from
    # our first request
    interesting_items.difference_update(all_uninteresting_items)
    records = dict((record.key, record) for record in interesting_records
                   if record.key not in all_uninteresting_chks)
    if records or interesting_items:
        yield records, interesting_items
    interesting_keys.difference_update(all_uninteresting_chks)

    chks_to_read = interesting_keys
    counter = 0
    while chks_to_read:
        next_chks = set()
        for record in store.get_record_stream(chks_to_read, 'unordered', False):
            counter += 1
            if pb is not None:
                pb.update('find chk pages', counter)
            # TODO: Handle 'absent'?
            try:
                bytes = record.get_bytes_as('fulltext')
            except errors.UnavailableRepresentation:
                bytes = adapter.get_bytes(record)
            # We don't care about search_key_func for this code, because we
            # only care about external references.
            node = _deserialise(bytes, record.key, search_key_func=None)
            if type(node) is InternalNode:
                # all_uninteresting_chks grows large, as it lists all nodes we
                # don't want to process (including already seen interesting
                # nodes)
                # small.difference_update(large) scales O(large), but
                # small.difference(large) scales O(small).
                # Also, we know we just _deserialised this node, so we can
                # access the dict directly.
                chks = set(node._items.itervalues()).difference(
                            all_uninteresting_chks)
                # Is set() and .difference_update better than:
                # chks = [chk for chk in node.refs()
                #              if chk not in all_uninteresting_chks]
                next_chks.update(chks)
                # These are now uninteresting everywhere else
                all_uninteresting_chks.update(chks)
                interesting_items = []
            else:
                interesting_items = [item for item in node._items.iteritems()
                                     if item not in all_uninteresting_items]
                # TODO: Do we need to filter out items that we have already
                #       seen on other pages? We don't really want to buffer the
                #       whole thing, but it does mean that callers need to
                #       understand they may get duplicate values.
                # all_uninteresting_items.update(interesting_items)
            yield {record.key: record}, interesting_items
        chks_to_read = next_chks
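

# A minimal usage sketch (not part of the original module): collect every
# interesting chk page key and every interesting (key, value) item. The root
# key arguments are assumed to be chk key tuples such as ('sha1:...',).
def _example_iter_interesting(store, interesting_root_keys,
                              uninteresting_root_keys):
    interesting_page_keys = set()
    interesting_kv_items = set()
    for record_map, items in iter_interesting_nodes(store,
            interesting_root_keys, uninteresting_root_keys):
        # record_map is a dict of {chk key: record} for chk pages considered
        # interesting; items is the matching batch of (key, value) pairs
        interesting_page_keys.update(record_map)
        interesting_kv_items.update(items)
    return interesting_page_keys, interesting_kv_items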