        # Map from chk key ('sha1:...',) to (prefix, key_filter)
        # prefix is the key in self._items to use, key_filter is the key_filter
        # entries that would match this node
        keys = {}
        shortcut = False
        if key_filter is None:
            # yielding all nodes, yield whatever we have, and queue up a read
            # for whatever we are missing
            shortcut = True
            for prefix, node in self._items.iteritems():
                if node.__class__ is StaticTuple:
                    keys[node] = (prefix, None)
                else:
                    yield node, None
        elif len(key_filter) == 1:
            # Technically, this path could also be handled by the first check
            # in 'self._node_width' in length_filters. However, we can handle
            # this case without spending any time building up the
            # prefix_to_keys, etc state.

            # This is a bit ugly, but TIMEIT showed it to be by far the fastest
            # 0.626us   list(key_filter)[0]
            #       is a func() for list(), 2 mallocs, and a getitem
            # 0.489us   [k for k in key_filter][0]
            #       still has the mallocs, avoids the func() call
            # 0.350us   iter(key_filter).next()
            #       has a func() call, and mallocs an iterator
            # 0.125us   for key in key_filter: pass
            #       no func() overhead, might malloc an iterator
            # 0.105us   for key in key_filter: break
            #       no func() overhead, might malloc an iterator, probably
            #       avoids checking an 'else' clause as part of the for
            for key in key_filter:
                break
            search_prefix = self._search_prefix_filter(key)
            if len(search_prefix) == self._node_width:
                # This item will match exactly, so just do a dict lookup, and
                # see what we can return
                shortcut = True
                try:
                    node = self._items[search_prefix]
                except KeyError:
                    # A given key can only match 1 child node; if it isn't
                    # there, then we can just return nothing
                    return
                if node.__class__ is StaticTuple:
                    keys[node] = (search_prefix, [key])
                else:
                    # This is loaded, and the only thing that can match,
                    # so return it
                    yield node, [key]
                    return
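
        # The timings quoted above can be re-checked with the stdlib timeit
        # module, for example (illustrative only; absolute numbers vary by
        # interpreter and hardware, only the relative ordering is expected
        # to hold):
        #   python -m timeit -s "key_filter = set([('sha1:abcd',)])" \
        #       "for key in key_filter: break"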
        if not shortcut:
            # First, convert all keys into a list of search prefixes
            # Aggregate common prefixes, and track the keys they come from
            prefix_to_keys = {}
            length_filters = {}
            for key in key_filter:
                search_prefix = self._search_prefix_filter(key)
                length_filter = length_filters.setdefault(
                                    len(search_prefix), set())
                length_filter.add(search_prefix)
                prefix_to_keys.setdefault(search_prefix, []).append(key)

            if (self._node_width in length_filters
                and len(length_filters) == 1):
                # all of the search prefixes match exactly _node_width. This
                # means that everything is an exact match, and we can do a
                # lookup into self._items, rather than iterating over the items
                search_prefixes = length_filters[self._node_width]
                for search_prefix in search_prefixes:
                    try:
                        node = self._items[search_prefix]
                    except KeyError:
                        # We can ignore this one
                        continue
                    node_key_filter = prefix_to_keys[search_prefix]
                    if node.__class__ is StaticTuple:
                        keys[node] = (search_prefix, node_key_filter)
                    else:
                        yield node, node_key_filter
            else:
                # The slow way. We walk every item in self._items, and check to
                # see if there are any matches
                length_filters = length_filters.items()
                for prefix, node in self._items.iteritems():
                    node_key_filter = []
                    for length, length_filter in length_filters:
                        sub_prefix = prefix[:length]
                        if sub_prefix in length_filter:
                            node_key_filter.extend(prefix_to_keys[sub_prefix])
                    if node_key_filter: # this key matched something, yield it
                        if node.__class__ is StaticTuple:
                            keys[node] = (prefix, node_key_filter)
                        else:
                            yield node, node_key_filter
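
        # Worked example (illustrative, assuming a search key function for
        # which the filtered search prefixes come out as shown): given
        # key_filter = [('foo',), ('fox',), ('bar',)] with search prefixes
        # 'f', 'f' and 'ba', the lookup state built above (before the final
        # .items() conversion) is
        #     prefix_to_keys == {'f': [('foo',), ('fox',)], 'ba': [('bar',)]}
        #     length_filters == {1: set(['f']), 2: set(['ba'])}
        # The mixed prefix lengths force the slow path: a child stored under a
        # prefix starting with 'ba' matches via sub_prefix 'ba', one under
        # 'f...' matches via sub_prefix 'f', and any other child ends up with
        # an empty node_key_filter and is skipped.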
        if keys:
            # Look in the page cache for some more bytes
            found_keys = set()
            for key in keys:
                try:
                    bytes = _get_cache()[key]
                except KeyError:
                    continue


def _find_children_info(store, interesting_keys, uninteresting_keys, pb):
    """Read the associated records, and determine what is interesting."""
    uninteresting_keys = set(uninteresting_keys)
    chks_to_read = uninteresting_keys.union(interesting_keys)
    next_uninteresting = set()
    next_interesting = set()
    uninteresting_items = set()
    interesting_items = set()
    interesting_records = []
    # records_read = set()
    for record in store.get_record_stream(chks_to_read, 'unordered', True):
        # records_read.add(record.key())
        if pb is not None:
            pb.tick()
        bytes = record.get_bytes_as('fulltext')
        # We don't care about search_key_func for this code, because we only
        # care about external references.
        node = _deserialise(bytes, record.key, search_key_func=None)
        if record.key in uninteresting_keys:
            if type(node) is InternalNode:
                next_uninteresting.update(node.refs())
            else:
                # We know we are at a LeafNode, so we can pass None for the
                # store
                uninteresting_items.update(node.iteritems(None))
        else:
            interesting_records.append(record)
            if type(node) is InternalNode:
                next_interesting.update(node.refs())
            else:
                interesting_items.update(node.iteritems(None))
    # TODO: Filter out records that have already been read, as node splitting
    #       can cause us to reference the same nodes via shorter and longer
    #       paths
    return (next_uninteresting, uninteresting_items,
            next_interesting, interesting_records, interesting_items)
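
# Illustrative consumer of the 5-tuple above (hypothetical code; the local
# variable names are not from this module):
#
#   (next_uninteresting, uninteresting_items,
#    next_interesting, interesting_records,
#    interesting_items) = _find_children_info(store, interesting_root_keys,
#                                             uninteresting_root_keys, pb=None)
#   # next_* hold chk keys referenced from internal nodes, still to be read;
#   # *_items hold (key, value) pairs found directly on leaf nodes.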


def _find_all_uninteresting(store, interesting_root_keys,
                            uninteresting_root_keys, adapter, pb):
    """Determine the full set of uninteresting keys."""
    # What about duplicates between interesting_root_keys and
    # uninteresting_root_keys?
    if not uninteresting_root_keys:
        # Shortcut case. We know there is nothing uninteresting to filter out
        # So we just let the rest of the algorithm do the work
        # We know there is nothing uninteresting, and we didn't have to read
        # any interesting records yet.
        return (set(), set(), set(interesting_root_keys), [], set())
    all_uninteresting_chks = set(uninteresting_root_keys)
    all_uninteresting_items = set()

    # First step, find the direct children of both the interesting and
    # uninteresting sets
    (uninteresting_keys, uninteresting_items,
     interesting_keys, interesting_records,
     interesting_items) = _find_children_info(store, interesting_root_keys,
                                              uninteresting_root_keys,
                                              pb=pb)
    all_uninteresting_chks.update(uninteresting_keys)
    all_uninteresting_items.update(uninteresting_items)
    del uninteresting_items
    # Note: Exact matches between interesting and uninteresting do not need
    #       to be searched further. Non-exact matches need to be searched in
    #       case there is a future exact-match.
    uninteresting_keys.difference_update(interesting_keys)

    # Second, find the full set of uninteresting bits reachable by the
    # uninteresting roots
    chks_to_read = uninteresting_keys
    while chks_to_read:
        next_chks = set()
        for record in store.get_record_stream(chks_to_read, 'unordered', False):
            # TODO: Handle 'absent'
            if pb is not None:
                pb.tick()
            try:
                bytes = record.get_bytes_as('fulltext')
            except errors.UnavailableRepresentation:
                bytes = adapter.get_bytes(record)
            # We don't care about search_key_func for this code, because we
            # only care about external references.
            node = _deserialise(bytes, record.key, search_key_func=None)
            if type(node) is InternalNode:
                # uninteresting_prefix_chks.update(node._items.iteritems())
                chks = node._items.values()
                # TODO: Should we remove the entries that are already in
                #       all_uninteresting_chks?
                next_chks.update(chks)
                all_uninteresting_chks.update(chks)
            else:
                all_uninteresting_items.update(node._items.iteritems())
        chks_to_read = next_chks
    return (all_uninteresting_chks, all_uninteresting_items,
            interesting_keys, interesting_records, interesting_items)
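
# Sketch of the intended consumption of the tuple above (illustrative): the
# caller subtracts everything reachable from the uninteresting roots before
# yielding anything, along the lines of
#
#   interesting_items.difference_update(all_uninteresting_items)
#   records = dict((record.key, record) for record in interesting_records
#                  if record.key not in all_uninteresting_chks)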


class CHKMapDifference(object):
    """Iterate the stored pages and key,value pairs for (new - old).

    This class provides a generator over the stored CHK pages and the
    (key, value) pairs that are in any of the new maps and not in any of the
    old maps.

    Note that it may yield chk pages that are common (especially root nodes),
    but it won't yield (key,value) pairs that are common.
    """

    def __init__(self, store, new_root_keys, old_root_keys,
                 search_key_func, pb=None):
        # TODO: Should we add a StaticTuple barrier here? It would be nice to
        #       force callers to use StaticTuple, because there will often be
        #       lots of keys passed in here. And even if we cast it locally,
        #       that just means that we will have *both* a StaticTuple and a
        #       tuple() in memory, referring to the same object. (so a net
        #       increase in memory, not a decrease.)
        self._store = store
        self._new_root_keys = new_root_keys
        self._old_root_keys = old_root_keys
        self._pb = pb
        # All uninteresting chks that we have seen. By the time they are added
        # here, they should be either fully ignored, or queued up for
        # processing
        # TODO: This might grow to a large size if there are lots of merge
        #       parents, etc. However, it probably doesn't scale to O(history)
        #       like _processed_new_refs does.
        self._all_old_chks = set(self._old_root_keys)
        # All items that we have seen from the old_root_keys
        self._all_old_items = set()
        # These are interesting items which were either read, or already in the
        # interesting queue (so we don't need to walk them again)
        # TODO: processed_new_refs becomes O(all_chks), consider switching to
        #       SimpleSet here.
        self._processed_new_refs = set()
        self._search_key_func = search_key_func

        # The uninteresting and interesting nodes to be searched
        self._old_queue = []
        self._new_queue = []
        # Holds the (key, value) items found when processing the root nodes,
        # waiting for the uninteresting nodes to be walked
        self._new_item_queue = []

    def _read_nodes_from_store(self, keys):
        # We chose not to use _get_cache(), because we think in
        # terms of records to be yielded. Also, we expect to touch each page
        # only 1 time during this code. (We may want to evaluate saving the
        # raw bytes into the page cache, which would allow a working tree
        # update after the fetch to not have to read the bytes again.)
        as_st = StaticTuple.from_sequence
        stream = self._store.get_record_stream(keys, 'unordered', True)
        for record in stream:
            if self._pb is not None:
                self._pb.tick()
            if record.storage_kind == 'absent':
                raise errors.NoSuchRevision(self._store, record.key)
            bytes = record.get_bytes_as('fulltext')
            node = _deserialise(bytes, record.key,
                                search_key_func=self._search_key_func)
            if type(node) is InternalNode:
                # Note we don't have to do node.refs() because we know that
                # there are no children that have been pushed into this node
                # Note: Using as_st() here seemed to save 1.2MB, which would
                #       indicate that we keep 100k prefix_refs around while
                #       processing. They *should* be shorter lived than that...
                #       It does cost us ~10s of processing time
                #prefix_refs = [as_st(item) for item in node._items.iteritems()]
                prefix_refs = node._items.items()
                items = []
            else:
                prefix_refs = []
                # Note: We don't use a StaticTuple here. Profiling showed a
                #       minor memory improvement (0.8MB out of a 335MB peak,
                #       or 0.2%), but a significant slowdown (15s / 145s, or
                #       10%).
                items = node._items.items()
            yield record, node, prefix_refs, items
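
        # Shape of the yielded tuples (illustrative): for an InternalNode,
        # prefix_refs is a list of (serialised_prefix, child_chk_key) pairs
        # and items is empty; for a LeafNode, prefix_refs is empty and items
        # is a list of (key_tuple, value_string) pairs, e.g. something like
        #   (record, node, [], [(('file-id', 'rev-id'), 'value bytes')])
        # The exact key and value layout depends on the map being stored.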

    def _read_old_roots(self):
        old_chks_to_enqueue = []
        all_old_chks = self._all_old_chks
        for record, node, prefix_refs, items in \
                self._read_nodes_from_store(self._old_root_keys):
            # Uninteresting node
            prefix_refs = [p_r for p_r in prefix_refs
                           if p_r[1] not in all_old_chks]
            new_refs = [p_r[1] for p_r in prefix_refs]
            all_old_chks.update(new_refs)
            # TODO: This might be a good time to turn items into StaticTuple
            #       instances and possibly intern them. However, this does not
            #       impact 'initial branch' performance, so I'm not worrying
            #       about it yet.
            self._all_old_items.update(items)
            # Queue up the uninteresting references
            # Don't actually put them in the 'to-read' queue until we have
            # finished checking the interesting references
            old_chks_to_enqueue.extend(prefix_refs)
        return old_chks_to_enqueue

    def _enqueue_old(self, new_prefixes, old_chks_to_enqueue):
        # At this point, we have read all the uninteresting and interesting
        # items, so we can queue up the uninteresting stuff, knowing that we've
        # handled the interesting ones
        for prefix, ref in old_chks_to_enqueue:
            not_interesting = True
            for i in xrange(len(prefix), 0, -1):
                if prefix[:i] in new_prefixes:
                    not_interesting = False
                    break
            if not_interesting:
                # This prefix is not part of the remaining 'interesting set'
                continue
            self._old_queue.append(ref)
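
        # Worked example (illustrative): with new_prefixes = set(['a', 'ab']),
        # an old ref recorded under prefix 'abc' is checked as 'abc', then
        # 'ab', then 'a'; 'ab' is present, so the old subtree may still shadow
        # new content and the ref is queued. A ref recorded under 'xy'
        # overlaps no new prefix and is dropped.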

    def _read_all_roots(self):
        """Read the root pages.

        This is structured as a generator, so that the root records can be
        yielded up to whoever needs them without any buffering.
        """
        # This is the bootstrap phase
        if not self._old_root_keys:
            # With no old_root_keys we can just shortcut and be ready
            # for _flush_new_queue
            self._new_queue = list(self._new_root_keys)
            return
        old_chks_to_enqueue = self._read_old_roots()
        # filter out any root keys that are already known to be uninteresting
        new_keys = set(self._new_root_keys).difference(self._all_old_chks)
        # These are prefixes that are present in new_keys that we are
        # thinking to yield
        new_prefixes = set()
        # We are about to yield all of these, so we don't want them getting
        # added a second time
        processed_new_refs = self._processed_new_refs
        processed_new_refs.update(new_keys)
        for record, node, prefix_refs, items in \
                self._read_nodes_from_store(new_keys):
            # At this level, we now know all the uninteresting references
            # So we filter and queue up whatever is remaining
            prefix_refs = [p_r for p_r in prefix_refs
                           if p_r[1] not in self._all_old_chks
                              and p_r[1] not in processed_new_refs]
            refs = [p_r[1] for p_r in prefix_refs]
            new_prefixes.update([p_r[0] for p_r in prefix_refs])
            self._new_queue.extend(refs)
            # TODO: We can potentially get multiple items here, however the
            #       current design allows for this, as callers will do the work
            #       to make the results unique. We might profile whether we
            #       gain anything by ensuring unique return values for items
            # TODO: This might be a good time to cast to StaticTuple, as
            #       self._new_item_queue will hold the contents of multiple
            #       records for an extended lifetime
            new_items = [item for item in items
                         if item not in self._all_old_items]
            self._new_item_queue.extend(new_items)
            new_prefixes.update([self._search_key_func(item[0])
                                 for item in new_items])
            processed_new_refs.update(refs)
            yield record
        # For new_prefixes we have the full length prefixes queued up.
        # However, we also need possible prefixes. (If we have a known ref to
        # 'ab', then we also need to include 'a'.) So expand the
        # new_prefixes to include all shorter prefixes
        for prefix in list(new_prefixes):
            new_prefixes.update([prefix[:i] for i in xrange(1, len(prefix))])
        self._enqueue_old(new_prefixes, old_chks_to_enqueue)
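
        # Expansion example (illustrative): new_prefixes = set(['abc', 'x'])
        # becomes set(['abc', 'ab', 'a', 'x']) after the loop above, so an old
        # ref recorded under the shorter prefix 'ab' is still considered by
        # _enqueue_old.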

    def _flush_new_queue(self):
        # No need to maintain the heap invariant anymore, just pull things out
        # and process them
        refs = set(self._new_queue)
        self._new_queue = []
        # First pass, flush all interesting items and convert to using direct refs
        all_old_chks = self._all_old_chks
        processed_new_refs = self._processed_new_refs
        all_old_items = self._all_old_items
        new_items = [item for item in self._new_item_queue
                     if item not in all_old_items]
        self._new_item_queue = []
        if new_items:
            yield None, new_items
        refs = refs.difference(all_old_chks)
        processed_new_refs.update(refs)
        while refs:
            # TODO: Using a SimpleSet for self._processed_new_refs
            #       saved as much as 10MB of peak memory. However, it requires
            #       implementing a non-pyrex version.
            next_refs = set()
            next_refs_update = next_refs.update
            # Inlining _read_nodes_from_store improves 'bzr branch bzr.dev'
            # from 1m54s to 1m51s. Consider it.
            for record, _, p_refs, items in self._read_nodes_from_store(refs):
                if all_old_items:
                    # using the 'if' check saves about 4s (145s => 141s) when
                    # streaming an initial branch of Launchpad data.
                    items = [item for item in items
                             if item not in all_old_items]
                yield record, items
                next_refs_update([p_r[1] for p_r in p_refs])
                del p_refs
            # set1.difference(set/dict) walks all of set1, and checks if it
            # exists in 'other'.
            # set1.difference(iterable) walks all of iterable, and does a
            # 'difference_update' on a clone of set1. Pick wisely based on the
            # expected sizes of objects.
            # in our case it is expected that 'new_refs' will always be quite
            # small.
            next_refs = next_refs.difference(all_old_chks)
            next_refs = next_refs.difference(processed_new_refs)
            processed_new_refs.update(next_refs)
            refs = next_refs
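
        # Illustrative consequence of the note above: with a small next_refs
        # and a large all_old_chks,
        #   next_refs.difference(all_old_chks)        # set argument: walks
        #                                             # only next_refs
        #   next_refs.difference(iter(all_old_chks))  # generic iterable: walks
        #                                             # all of all_old_chks
        # so keeping the argument a real set keeps the cost proportional to
        # the small side.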

    def _process_next_old(self):
        # Since we don't filter uninteresting any further than during
        # _read_all_roots, process the whole queue in a single pass.
        refs = self._old_queue
        self._old_queue = []
        all_old_chks = self._all_old_chks
        for record, _, prefix_refs, items in self._read_nodes_from_store(refs):
            # TODO: Use StaticTuple here?
            self._all_old_items.update(items)
            refs = [r for _, r in prefix_refs if r not in all_old_chks]
            self._old_queue.extend(refs)
            all_old_chks.update(refs)

    def _process_queues(self):
        while self._old_queue:
            self._process_next_old()
        return self._flush_new_queue()

    def process(self):
        for record in self._read_all_roots():
            yield record, []
        for record, items in self._process_queues():
            yield record, items


def iter_interesting_nodes(store, interesting_root_keys,
                           uninteresting_root_keys, pb=None):
    """Given root keys, find interesting nodes.

    :param uninteresting_root_keys: keys which should be filtered out of the
        result set.
    :return: Yield
        (interesting record, {interesting key:values})
    """
    iterator = CHKMapDifference(store, interesting_root_keys,
                                uninteresting_root_keys,
                                search_key_func=store._search_key_func,
                                pb=pb)
    return iterator.process()
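
# Illustrative use of the generator above (hypothetical caller; assumes
# `store` is a chk-bytes VersionedFiles-like object exposing
# _search_key_func, and that root keys are ('sha1:...',) tuples):
#
#   for record, items in iter_interesting_nodes(store, [new_root], [old_root]):
#       if record is not None:
#           pass  # a raw CHK page present in the new map(s)
#       for key, value in items:
#           pass  # a (key, value) pair in the new map(s) but not the old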