~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/chk_map.py

Committer: John Arbash Meinel
Date: 2007-02-02 04:49:38 UTC
mfrom: (1908.11.7 tree-revision-tree.)
mto: (1852.15.19 test_write_inventory)
mto: This revision was merged to the branch mainline in revision 2322.
Revision ID: john@arbash-meinel.com-20070202044938-6c04umlv9y4j2tz1

[merge] bzr.dev 2255, resolve conflicts, update copyrights

files added:
NEWS.developers

build-api

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_escaped_store.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/xml6.py

doc/README.1st

files removed:
bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/api.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_tags.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/bundle/serializer/v4.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/email_message.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/inventory_delta.py

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/pack.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconfigure.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/tag.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/https_server.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/transport_util.py

bzrlib/timestamp.py

bzrlib/transport/brokenrename.py

bzrlib/transport/ftp

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/log.py

bzrlib/transport/nosmart.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/views.py

bzrlib/workingtree_4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

doc/BUILD-NOTES

doc/Makefile

doc/_static

doc/_static/bzr icon 16.png

doc/_static/bzr.ico

doc/_static/en

doc/_static/en/quick-reference

doc/_static/en/quick-reference/Makefile

doc/_static/en/quick-reference/bzr-quick-reference.pdf

doc/_static/en/quick-reference/bzr-quick-reference.png

doc/_static/en/quick-reference/bzr-quick-reference.svg

doc/_templates

doc/_templates/index.html

doc/_templates/layout.html

doc/conf.py

doc/contents.txt

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/index.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-for-2x.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/developer-guide

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/Makefile

doc/es/quick-reference/quick-start-summary.pdf

doc/es/quick-reference/quick-start-summary.png

doc/es/quick-reference/quick-start-summary.svg

doc/es/release-notes

doc/es/user-guide

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/es/user-reference

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/make.bat

doc/news-template.txt

doc/ru

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/Makefile

doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/quick-reference/quick-start-summary.png

doc/ru/quick-reference/quick-start-summary.svg

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/check-newsbugs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/rst2pdf.py

tools/time_graph.py

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/run_script.py

files renamed:
doc/en/developer-guide/HACKING.txt => HACKING

bzrlib/deprecated_graph.py => bzrlib/graph.py

bzrlib/help_topics/__init__.py => bzrlib/help_topics.py

bzrlib/_patiencediff_py.py => bzrlib/patiencediff.py

bzrlib/tests/http_utils.py => bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/http_server.py => bzrlib/tests/HttpServer.py

bzrlib/tests/blackbox/test_send.py => bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/per_branch/ => bzrlib/tests/branch_implementations/

bzrlib/tests/per_bzrdir/ => bzrlib/tests/bzrdir_implementations/

bzrlib/tests/per_interrepository/ => bzrlib/tests/interrepository_implementations/

bzrlib/tests/per_intertree/ => bzrlib/tests/intertree_implementations/

bzrlib/tests/per_repository/ => bzrlib/tests/repository_implementations/

bzrlib/tests/test_deprecated_graph.py => bzrlib/tests/test_graph.py

bzrlib/tests/test_revisionspec.py => bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/per_transport.py => bzrlib/tests/test_transport_implementations.py

bzrlib/tests/per_versionedfile.py => bzrlib/tests/test_versionedfile.py

bzrlib/tests/per_tree/ => bzrlib/tests/tree_implementations/

bzrlib/tests/per_workingtree/ => bzrlib/tests/workingtree_implementations/

bzrlib/transport/ftp/__init__.py => bzrlib/transport/ftp.py

bzrlib/transport/remote.py => bzrlib/transport/smart.py

bzrlib/win32utils.py => bzrlib/win32console.py

bzrlib/xml8.py => bzrlib/xml5.py

doc/en/tutorials/centralized_workflow.txt => doc/centralized_workflow.txt

bzrlib/help_topics/en/configuration.txt => doc/configuration.txt

doc/en/user-guide/http_smart_server.txt => doc/http_smart_server.txt

doc/en/user-guide/index.txt => doc/index.txt

doc/en/user-guide/plugins.txt => doc/plugins.txt

doc/en/user-guide/server.txt => doc/server.txt

doc/en/user-guide/setting_up_email.txt => doc/setting_up_email.txt

doc/en/user-guide/specifying_revisions.txt => doc/specifying_revisions.txt

doc/en/tutorials/tutorial.txt => doc/tutorial.txt

doc/en/user-guide/using_aliases.txt => doc/using_aliases.txt

doc/en/user-guide/version_info.txt => doc/version_info.txt

tools/generate_docs.py => generate_docs.py

bzrlib/doc_generate/ => tools/doc_generate/

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml_serializer.py

contrib/bash/bzr.simple

contrib/newinventory.py

contrib/pwclient.full

doc/bazaar-vcs.org.kid

doc/default.css

profile_imports.py

setup.py *

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/ostools.py

tools/win32/start_bzr.bat

Show diffs side-by-side

added added

removed removed

bzrlib/chk_map.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Persistent maps from tuple_of_strings->string using CHK stores.

Overview and current status:

The CHKMap class implements a dict from tuple_of_strings->string by using a trie

with internal nodes of 8-bit fan out; The key tuples are mapped to strings by

joining them by \x00, and \x00 padding shorter keys out to the length of the

longest key. Leaf nodes are packed as densely as possible, and internal nodes

are all an additional 8-bits wide leading to a sparse upper tree.

Updates to a CHKMap are done preferentially via the apply_delta method, to

allow optimisation of the update operation; but individual map/unmap calls are

possible and supported. Individual changes via map/unmap are buffered in memory

until the _save method is called to force serialisation of the tree.

apply_delta records its changes immediately by performing an implicit _save.

TODO:

-----

Densely packed upper nodes.

"""

import heapq

from bzrlib import lazy_import

lazy_import.lazy_import(globals(), """

from bzrlib import (

errors,

versionedfile,

)

""")

from bzrlib import (

lru_cache,

osutils,

registry,

trace,

)

# approx 4MB

# If each line is 50 bytes, and you have 255 internal pages, with 255-way fan

# out, it takes 3.1MB to cache the layer.

_PAGE_CACHE_SIZE = 4*1024*1024

# We are caching bytes so len(value) is perfectly accurate

_page_cache = lru_cache.LRUSizeCache(_PAGE_CACHE_SIZE)

def clear_cache():
    """Drop every entry from the module-level page cache."""
    _page_cache.clear()

# If a ChildNode falls below this many bytes, we check for a remap

_INTERESTING_NEW_SIZE = 50

# If a ChildNode shrinks by more than this amount, we check for a remap

_INTERESTING_SHRINKAGE_LIMIT = 20

# If we delete more than this many nodes applying a delta, we check for a remap

_INTERESTING_DELETES_LIMIT = 5

def _search_key_plain(key):

"""Map the key tuple into a search string that just uses the key bytes."""

return '\x00'.join(key)

search_key_registry = registry.Registry()

search_key_registry.register('plain', _search_key_plain)

class CHKMap(object):
    """A persistent map from tuple_of_strings to string backed by a CHK store.

    The root of the map is held in ``_root_node`` either as a key tuple (not
    yet loaded, or already saved) or as a node object (loaded/modified).
    """

    def __init__(self, store, root_key, search_key_func=None):
        """Create a CHKMap object.

        :param store: The store the CHKMap is stored in.
        :param root_key: The root key of the map. None to create an empty
            CHKMap.
        :param search_key_func: A function mapping a key => bytes. These bytes
            are then used by the internal nodes to split up leaf nodes into
            multiple pages.
        """
        self._store = store
        if search_key_func is None:
            search_key_func = _search_key_plain
        self._search_key_func = search_key_func
        if root_key is None:
            self._root_node = LeafNode(search_key_func=search_key_func)
        else:
            self._root_node = self._node_key(root_key)

    def apply_delta(self, delta):
        """Apply a delta to the map.

        :param delta: An iterable of old_key, new_key, new_value tuples.
            If new_key is not None, then new_key->new_value is inserted
            into the map; if old_key is not None, then the old mapping
            of old_key is removed.
        :return: The key of the root node after the implicit _save.
        :raises errors.InconsistentDeltaDelta: if a pure addition names a key
            that is already present in the map.
        """
        # The delta is walked three times below (precondition check, deletes,
        # inserts), so a one-shot iterable must be materialised first.
        delta = list(delta)
        delete_count = 0
        # Check preconditions first.
        new_items = set([key for (old, key, value) in delta
                         if key is not None and old is None])
        existing_new = list(self.iteritems(key_filter=new_items))
        if existing_new:
            raise errors.InconsistentDeltaDelta(delta,
                "New items are already in the map %r." % existing_new)
        # Now apply changes.
        for old, new, value in delta:
            if old is not None and old != new:
                # Remap checks are deferred until all changes are applied.
                self.unmap(old, check_remap=False)
                delete_count += 1
        for old, new, value in delta:
            if new is not None:
                self.map(new, value)
        if delete_count > _INTERESTING_DELETES_LIMIT:
            trace.mutter("checking remap as %d deletions", delete_count)
            self._check_remap()
        return self._save()

    def _ensure_root(self):
        """Ensure that the root node is an object not a key."""
        if type(self._root_node) is tuple:
            # Demand-load the root
            self._root_node = self._get_node(self._root_node)

    def _get_node(self, node):
        """Get a node.

        Note that this does not update the _items dict in objects containing a
        reference to this node. As such it does not prevent subsequent IO being
        performed.

        :param node: A tuple key or node object.
        :return: A node object.
        """
        if type(node) is tuple:
            bytes = self._read_bytes(node)
            return _deserialise(bytes, node,
                search_key_func=self._search_key_func)
        else:
            return node

    def _read_bytes(self, key):
        """Return the serialised bytes for key, via the shared page cache."""
        try:
            return _page_cache[key]
        except KeyError:
            stream = self._store.get_record_stream([key], 'unordered', True)
            bytes = stream.next().get_bytes_as('fulltext')
            _page_cache[key] = bytes
            return bytes

    def _dump_tree(self, include_keys=False):
        """Return the tree in a string representation."""
        self._ensure_root()
        res = self._dump_tree_node(self._root_node, prefix='', indent='',
                                   include_keys=include_keys)
        res.append('') # Give a trailing '\n'
        return '\n'.join(res)

    def _dump_tree_node(self, node, prefix, indent, include_keys=True):
        """For this node and all children, generate a string representation.

        :return: A list of lines (without trailing newlines).
        """
        # NOTE(review): the whitespace inside the format literals below is
        # reproduced as found; runs of spaces may have been collapsed - verify.
        result = []
        if not include_keys:
            key_str = ''
        else:
            node_key = node.key()
            if node_key is not None:
                key_str = ' %s' % (node_key[0],)
            else:
                key_str = ' None'
        result.append('%s%r %s%s' % (indent, prefix, node.__class__.__name__,
                                     key_str))
        if type(node) is InternalNode:
            # Trigger all child nodes to get loaded
            list(node._iter_nodes(self._store))
            for prefix, sub in sorted(node._items.iteritems()):
                result.extend(self._dump_tree_node(sub, prefix, indent + ' ',
                                                   include_keys=include_keys))
        else:
            for key, value in sorted(node._items.iteritems()):
                # Don't use prefix nor indent here to line up when used in
                # tests in conjunction with assertEqualDiff
                result.append(' %r %r' % (key, value))
        return result

    @classmethod
    def from_dict(klass, store, initial_value, maximum_size=0, key_width=1,
        search_key_func=None):
        """Create a CHKMap in store with initial_value as the content.

        :param store: The store to record initial_value in, a VersionedFiles
            object with 1-tuple keys supporting CHK key generation.
        :param initial_value: A dict to store in store. Its keys and values
            must be bytestrings.
        :param maximum_size: The maximum_size rule to apply to nodes. This
            determines the size at which no new data is added to a single node.
        :param key_width: The number of elements in each key_tuple being stored
            in this map.
        :param search_key_func: A function mapping a key => bytes. These bytes
            are then used by the internal nodes to split up leaf nodes into
            multiple pages.
        :return: The root chk of the resulting CHKMap.
        """
        root_key = klass._create_directly(store, initial_value,
            maximum_size=maximum_size, key_width=key_width,
            search_key_func=search_key_func)
        return root_key

    @classmethod
    def _create_via_map(klass, store, initial_value, maximum_size=0,
                        key_width=1, search_key_func=None):
        """Build the map by applying initial_value as a delta of additions.

        :return: The key of the root node.
        """
        result = klass(store, None, search_key_func=search_key_func)
        result._root_node.set_maximum_size(maximum_size)
        result._root_node._key_width = key_width
        delta = []
        for key, value in initial_value.items():
            delta.append((None, key, value))
        root_key = result.apply_delta(delta)
        return root_key

    @classmethod
    def _create_directly(klass, store, initial_value, maximum_size=0,
                         key_width=1, search_key_func=None):
        """Build the map by filling one LeafNode and splitting it if needed.

        :return: The last key produced by serialising the root node.
        """
        node = LeafNode(search_key_func=search_key_func)
        node.set_maximum_size(maximum_size)
        node._key_width = key_width
        node._items = dict(initial_value)
        node._raw_size = sum([node._key_value_len(key, value)
                              for key,value in initial_value.iteritems()])
        node._len = len(node._items)
        node._compute_search_prefix()
        node._compute_serialised_prefix()
        if (node._len > 1
            and maximum_size
            and node._current_size() > maximum_size):
            prefix, node_details = node._split(store)
            if len(node_details) == 1:
                raise AssertionError('Failed to split using node._split')
            node = InternalNode(prefix, search_key_func=search_key_func)
            node.set_maximum_size(maximum_size)
            node._key_width = key_width
            for split, subnode in node_details:
                node.add_node(split, subnode)
        keys = list(node.serialise(store))
        return keys[-1]

    def iter_changes(self, basis):
        """Iterate over the changes between basis and self.

        :return: An iterator of tuples: (key, old_value, new_value). Old_value
            is None for keys only in self; new_value is None for keys only in
            basis.
        """
        # Overview:
        # Read both trees in lexicographic, highest-first order.
        # Any identical nodes we skip
        # Any unique prefixes we output immediately.
        # values in a leaf node are treated as single-value nodes in the tree
        # which allows them to be not-special-cased. We know to output them
        # because their value is a string, not a key(tuple) or node.
        #
        # corner cases to beware of when considering this function:
        # *) common references are at different heights.
        #    consider two trees:
        #    {'a': LeafNode={'aaa':'foo', 'aab':'bar'}, 'b': LeafNode={'b'}}
        #    {'a': InternalNode={'aa':LeafNode={'aaa':'foo', 'aab':'bar'},
        #                        'ab':LeafNode={'ab':'bar'}}
        #     'b': LeafNode={'b'}}
        #    the node with aaa/aab will only be encountered in the second tree
        #    after reading the 'a' subtree, but it is encountered in the first
        #    tree immediately. Variations on this may have read internal nodes
        #    like this.  we want to cut the entire pending subtree when we
        #    realise we have a common node.  For this we use a list of keys -
        #    the path to a node - and check the entire path is clean as we
        #    process each item.
        if self._node_key(self._root_node) == self._node_key(basis._root_node):
            return
        self._ensure_root()
        basis._ensure_root()
        excluded_keys = set()
        self_node = self._root_node
        basis_node = basis._root_node
        # A heap, each element is prefix, node(tuple/NodeObject/string),
        # key_path (a list of tuples, tail-sharing down the tree.)
        self_pending = []
        basis_pending = []
        def process_node(node, path, a_map, pending):
            # take a node and expand it
            node = a_map._get_node(node)
            if type(node) == LeafNode:
                path = (node._key, path)
                for key, value in node._items.items():
                    # For a LeafNode, the key is a serialized_key, rather than
                    # a search_key, but the heap is using search_keys
                    search_key = node._search_key_func(key)
                    heapq.heappush(pending, (search_key, key, value, path))
            else:
                # type(node) == InternalNode
                path = (node._key, path)
                for prefix, child in node._items.items():
                    heapq.heappush(pending, (prefix, None, child, path))
        def process_common_internal_nodes(self_node, basis_node):
            self_items = set(self_node._items.items())
            basis_items = set(basis_node._items.items())
            path = (self_node._key, None)
            for prefix, child in self_items - basis_items:
                heapq.heappush(self_pending, (prefix, None, child, path))
            path = (basis_node._key, None)
            for prefix, child in basis_items - self_items:
                heapq.heappush(basis_pending, (prefix, None, child, path))
        def process_common_leaf_nodes(self_node, basis_node):
            self_items = set(self_node._items.items())
            basis_items = set(basis_node._items.items())
            path = (self_node._key, None)
            for key, value in self_items - basis_items:
                prefix = self._search_key_func(key)
                heapq.heappush(self_pending, (prefix, key, value, path))
            path = (basis_node._key, None)
            for key, value in basis_items - self_items:
                prefix = basis._search_key_func(key)
                heapq.heappush(basis_pending, (prefix, key, value, path))
        def process_common_prefix_nodes(self_node, self_path,
                                        basis_node, basis_path):
            # Would it be more efficient if we could request both at the same
            # time?
            self_node = self._get_node(self_node)
            basis_node = basis._get_node(basis_node)
            if (type(self_node) == InternalNode
                and type(basis_node) == InternalNode):
                # Matching internal nodes
                process_common_internal_nodes(self_node, basis_node)
            elif (type(self_node) == LeafNode
                  and type(basis_node) == LeafNode):
                process_common_leaf_nodes(self_node, basis_node)
            else:
                process_node(self_node, self_path, self, self_pending)
                process_node(basis_node, basis_path, basis, basis_pending)
        process_common_prefix_nodes(self_node, None, basis_node, None)
        def check_excluded(key_path):
            # Note that this is N^2, it depends on us trimming trees
            # aggressively to not become slow.
            # A better implementation would probably have a reverse map
            # back to the children of a node, and jump straight to it when
            # a common node is detected, then proceed to remove the already
            # pending children. bzrlib.graph has a searcher module with a
            # similar problem.
            while key_path is not None:
                key, key_path = key_path
                if key in excluded_keys:
                    return True
            return False

        while self_pending or basis_pending:
            if not self_pending:
                # self is exhausted: output remainder of basis
                for prefix, key, node, path in basis_pending:
                    if check_excluded(path):
                        continue
                    node = basis._get_node(node)
                    if key is not None:
                        # a value
                        yield (key, node, None)
                    else:
                        # subtree - fastpath the entire thing.
                        for key, value in node.iteritems(basis._store):
                            yield (key, value, None)
                return
            elif not basis_pending:
                # basis is exhausted: output remainder of self.
                for prefix, key, node, path in self_pending:
                    if check_excluded(path):
                        continue
                    node = self._get_node(node)
                    if key is not None:
                        # a value
                        yield (key, None, node)
                    else:
                        # subtree - fastpath the entire thing.
                        for key, value in node.iteritems(self._store):
                            yield (key, None, value)
                return
            else:
                # XXX: future optimisation - yield the smaller items
                # immediately rather than pushing everything on/off the
                # heaps. Applies to both internal nodes and leafnodes.
                if self_pending[0][0] < basis_pending[0][0]:
                    # expand self
                    prefix, key, node, path = heapq.heappop(self_pending)
                    if check_excluded(path):
                        continue
                    if key is not None:
                        # a value
                        yield (key, None, node)
                    else:
                        process_node(node, path, self, self_pending)
                        continue
                elif self_pending[0][0] > basis_pending[0][0]:
                    # expand basis
                    prefix, key, node, path = heapq.heappop(basis_pending)
                    if check_excluded(path):
                        continue
                    if key is not None:
                        # a value
                        yield (key, node, None)
                    else:
                        process_node(node, path, basis, basis_pending)
                        continue
                else:
                    # common prefix: possibly expand both
                    if self_pending[0][1] is None:
                        # process next self
                        read_self = True
                    else:
                        read_self = False
                    if basis_pending[0][1] is None:
                        # process next basis
                        read_basis = True
                    else:
                        read_basis = False
                    if not read_self and not read_basis:
                        # compare a common value
                        self_details = heapq.heappop(self_pending)
                        basis_details = heapq.heappop(basis_pending)
                        if self_details[2] != basis_details[2]:
                            yield (self_details[1],
                                basis_details[2], self_details[2])
                        continue
                    # At least one side wasn't a simple value.
                    # Only compare node keys when BOTH sides are nodes: a
                    # plain string value has no _key, so _node_key() would
                    # raise AttributeError on it.
                    if (read_self and read_basis
                        and self._node_key(self_pending[0][2]) ==
                            self._node_key(basis_pending[0][2])):
                        # Identical pointers, skip (and don't bother adding to
                        # excluded, it won't turn up again.
                        heapq.heappop(self_pending)
                        heapq.heappop(basis_pending)
                        continue
                    # Now we need to expand this node before we can continue
                    if read_self and read_basis:
                        # Both sides start with the same prefix, so process
                        # them in parallel
                        self_prefix, _, self_node, self_path = heapq.heappop(
                            self_pending)
                        basis_prefix, _, basis_node, basis_path = heapq.heappop(
                            basis_pending)
                        if self_prefix != basis_prefix:
                            raise AssertionError(
                                '%r != %r' % (self_prefix, basis_prefix))
                        process_common_prefix_nodes(
                            self_node, self_path,
                            basis_node, basis_path)
                        continue
                    if read_self:
                        prefix, key, node, path = heapq.heappop(self_pending)
                        if check_excluded(path):
                            continue
                        process_node(node, path, self, self_pending)
                    if read_basis:
                        prefix, key, node, path = heapq.heappop(basis_pending)
                        if check_excluded(path):
                            continue
                        process_node(node, path, basis, basis_pending)

    def iteritems(self, key_filter=None):
        """Iterate over the entire CHKMap's contents."""
        self._ensure_root()
        return self._root_node.iteritems(self._store, key_filter=key_filter)

    def key(self):
        """Return the key for this map."""
        if type(self._root_node) is tuple:
            return self._root_node
        else:
            return self._root_node._key

    def __len__(self):
        self._ensure_root()
        return len(self._root_node)

    def map(self, key, value):
        """Map a key tuple to value.

        :param key: A key to map.
        :param value: The value to assign to key.
        """
        # Need a root object.
        self._ensure_root()
        prefix, node_details = self._root_node.map(self._store, key, value)
        if len(node_details) == 1:
            self._root_node = node_details[0][1]
        else:
            # The root split: hang the pieces off a new InternalNode that
            # inherits size limit and key width from the first piece.
            self._root_node = InternalNode(prefix,
                                search_key_func=self._search_key_func)
            self._root_node.set_maximum_size(node_details[0][1].maximum_size)
            self._root_node._key_width = node_details[0][1]._key_width
            for split, node in node_details:
                self._root_node.add_node(split, node)

    def _node_key(self, node):
        """Get the key for a node whether it's a tuple or node."""
        if type(node) is tuple:
            return node
        else:
            return node._key

    def unmap(self, key, check_remap=True):
        """remove key from the map."""
        self._ensure_root()
        if type(self._root_node) is InternalNode:
            unmapped = self._root_node.unmap(self._store, key,
                check_remap=check_remap)
        else:
            unmapped = self._root_node.unmap(self._store, key)
        self._root_node = unmapped

    def _check_remap(self):
        """Check if nodes can be collapsed."""
        self._ensure_root()
        if type(self._root_node) is InternalNode:
            self._root_node._check_remap(self._store)

    def _save(self):
        """Save the map completely.

        :return: The key of the root node.
        """
        if type(self._root_node) is tuple:
            # Already saved.
            return self._root_node
        keys = list(self._root_node.serialise(self._store))
        return keys[-1]

550

551

552

class Node(object):
    """Base class defining the protocol for CHK Map nodes.

    :ivar _raw_size: The total size of the serialized key:value data, before
        adding the header bytes, and without prefix compression.
    """

    def __init__(self, key_width=1):
        """Create a node.

        :param key_width: The width of keys for this node.
        """
        self._key = None
        # Current number of elements
        self._len = 0
        self._maximum_size = 0
        self._key_width = key_width
        # current size in bytes
        self._raw_size = 0
        # The pointers/values this node has - meaning defined by child classes.
        self._items = {}
        # The common search prefix
        self._search_prefix = None

    def __repr__(self):
        items_str = str(sorted(self._items))
        # Keep the repr short: truncate long item listings.
        if len(items_str) > 20:
            items_str = items_str[:16] + '...]'
        return '%s(key:%s len:%s size:%s max:%s prefix:%s items:%s)' % (
            self.__class__.__name__, self._key, self._len, self._raw_size,
            self._maximum_size, self._search_prefix, items_str)

    def key(self):
        """Return this node's key (None until one has been assigned)."""
        return self._key

    def __len__(self):
        return self._len

    @property
    def maximum_size(self):
        """What is the upper limit for adding references to a node."""
        return self._maximum_size

    def set_maximum_size(self, new_size):
        """Set the size threshold for nodes.

        :param new_size: The size at which no data is added to a node. 0 for
            unlimited.
        """
        self._maximum_size = new_size

    @classmethod
    def common_prefix(cls, prefix, key):
        """Given 2 strings, return the longest prefix common to both.

        :param prefix: This has been the common prefix for other keys, so it is
            more likely to be the common prefix in this case as well.
        :param key: Another string to compare to
        """
        if key.startswith(prefix):
            return prefix
        # pos ends up as the index of the last matching character, or -1 when
        # nothing matches (including when either string is empty).
        pos = -1
        # Is there a better way to do this?
        for pos, (left, right) in enumerate(zip(prefix, key)):
            if left != right:
                pos -= 1
                break
        common = prefix[:pos+1]
        return common

    @classmethod
    def common_prefix_for_keys(cls, keys):
        """Given a list of keys, find their common prefix.

        :param keys: An iterable of strings.
        :return: The longest common prefix of all keys. None if keys is empty.
        """
        common_prefix = None
        for key in keys:
            if common_prefix is None:
                common_prefix = key
                continue
            common_prefix = cls.common_prefix(common_prefix, key)
            if not common_prefix:
                # if common_prefix is the empty string, then we know it won't
                # change further
                return ''
        return common_prefix

640

641

642

# Singleton indicating we have not computed _search_prefix yet

643

_unknown = object()

644

645

class LeafNode(Node):

646

"""A node containing actual key:value pairs.

647

648

:ivar _items: A dict of key->value items. The key is in tuple form.

649

:ivar _size: The number of bytes that would be used by serializing all of

650

the key/value pairs.

651

"""

652

653

def __init__(self, search_key_func=None):
    """Create an empty leaf node.

    :param search_key_func: A function mapping a key => bytes; defaults to
        _search_key_plain when None.
    """
    Node.__init__(self)
    # All of the keys in this leaf node share this common prefix
    self._common_serialised_prefix = None
    self._serialise_key = '\x00'.join
    if search_key_func is None:
        self._search_key_func = _search_key_plain
    else:
        self._search_key_func = search_key_func

662

663

def __repr__(self):

664

items_str = str(sorted(self._items))

665

if len(items_str) > 20:

666

items_str = items_str[:16] + '...]'

667

return \

668

'%s(key:%s len:%s size:%s max:%s prefix:%s keywidth:%s items:%s)' \

669

% (self.__class__.__name__, self._key, self._len, self._raw_size,

670

self._maximum_size, self._search_prefix, self._key_width, items_str)

671

672

def _current_size(self):

673

"""Answer the current serialised size of this node.

674

675

This differs from self._raw_size in that it includes the bytes used for

676

the header.

677

"""

678

if self._common_serialised_prefix is None:

679

bytes_for_items = 0

680

prefix_len = 0

681

else:

682

# We will store a single string with the common prefix

683

# And then that common prefix will not be stored in any of the

684

# entry lines

685

prefix_len = len(self._common_serialised_prefix)

686

bytes_for_items = (self._raw_size - (prefix_len * self._len))

687

return (9 # 'chkleaf:\n'

688

+ len(str(self._maximum_size)) + 1

689

+ len(str(self._key_width)) + 1

690

+ len(str(self._len)) + 1

691

+ prefix_len + 1

692

+ bytes_for_items)

693

694

@classmethod
def deserialise(klass, bytes, key, search_key_func=None):
    """Deserialise bytes, with key key, into a LeafNode.

    :param bytes: The bytes of the node.
    :param key: The key that the serialised node has.
    :param search_key_func: Passed through to _deserialise_leaf_node.
    """
    return _deserialise_leaf_node(bytes, key,
                                  search_key_func=search_key_func)

703

704

def iteritems(self, store, key_filter=None):

705

"""Iterate over items in the node.

706

707

:param key_filter: A filter to apply to the node. It should be a

708

list/set/dict or similar repeatedly iterable container.

709

"""

710

if key_filter is not None:

711

# Adjust the filter - short elements go to a prefix filter. All

712

# other items are looked up directly.

713

# XXX: perhaps defaultdict? Profiling<rinse and repeat>

714

filters = {}

715

for key in key_filter:

716

if len(key) == self._key_width:

717

# This filter is meant to match exactly one key, yield it

718

# if we have it.

719

try:

720

yield key, self._items[key]

721

except KeyError:

722

# This key is not present in this map, continue

723

pass

724

else:

725

# Short items, we need to match based on a prefix

726

length_filter = filters.setdefault(len(key), set())

727

length_filter.add(key)

728

if filters:

729

filters = filters.items()

730

for item in self._items.iteritems():

731

for length, length_filter in filters:

732

if item[0][:length] in length_filter:

733

yield item

734

break

735

else:

736

for item in self._items.iteritems():

737

yield item

738

739

def _key_value_len(self, key, value):

740

# TODO: Should probably be done without actually joining the key, but

741

# then that can be done via the C extension

742

return (len(self._serialise_key(key)) + 1

743

+ len(str(value.count('\n'))) + 1

744

+ len(value) + 1)

745

746

def _search_key(self, key):

747

return self._search_key_func(key)

748

749

def _map_no_split(self, key, value):
    """Store key => value and update the cached size and prefix state.

    This assumes either the key does not already exist, or you have already
    removed its size and length from self.

    :param key: The key to store.
    :param value: The value to store for key.
    :return: True if adding this node should cause us to split.
    """
    self._items[key] = value
    self._raw_size += self._key_value_len(key, value)
    self._len += 1
    # Narrow the common serialised prefix to cover the new key as well.
    new_serialised_prefix = self._serialise_key(key)
    previous = self._common_serialised_prefix
    if previous is not None:
        new_serialised_prefix = self.common_prefix(previous,
                                                   new_serialised_prefix)
    self._common_serialised_prefix = new_serialised_prefix
    # Same again for the search prefix, computing it first if it has not
    # been worked out yet.
    search_key = self._search_key(key)
    if self._search_prefix is _unknown:
        self._compute_search_prefix()
    if self._search_prefix is None:
        self._search_prefix = search_key
    else:
        self._search_prefix = self.common_prefix(
            self._search_prefix, search_key)
    # A single item, or an unlimited node, never splits.
    if self._len <= 1 or not self._maximum_size:
        return False
    if self._current_size() <= self._maximum_size:
        return False
    # We are over the limit. Check to see if all of the search_keys for
    # this node are identical. We allow the node to grow under that
    # circumstance (we could track this as common state, but it is
    # infrequent)
    if search_key != self._search_prefix:
        return True
    return not self._are_search_keys_identical()

784

785

def _split(self, store):
    """We have overflowed.

    Split this node into multiple LeafNodes, return it up the stack so that
    the next layer creates a new InternalNode and references the new nodes.

    :param store: Passed on to the map() call of each new child.
    :return: (common_serialised_prefix, [(node_serialised_prefix, node)])
    :raises AssertionError: If the search prefix has not been computed.
    """
    if self._search_prefix is _unknown:
        raise AssertionError('Search prefix must be known')
    shared_prefix = self._search_prefix
    # Children are distinguished by one more byte than what is shared.
    width = len(shared_prefix) + 1
    children = {}
    for key, value in self._items.iteritems():
        # TODO: Generally only 1 key can be exactly the right length,
        #       which means we can only have 1 key in the node pointed
        #       at by the 'prefix\0' key. We might want to consider
        #       folding it into the containing InternalNode rather than
        #       having a fixed length-1 node.
        #       Note this is probably not true for hash keys, as they
        #       may get a '\00' node anywhere, but won't have keys of
        #       different lengths.
        # Search keys shorter than width are padded out with NUL bytes.
        child_prefix = self._search_key(key)[:width].ljust(width, '\x00')
        try:
            child = children[child_prefix]
        except KeyError:
            child = LeafNode(search_key_func=self._search_key_func)
            child.set_maximum_size(self._maximum_size)
            child._key_width = self._key_width
            children[child_prefix] = child
        sub_prefix, details = child.map(store, key, value)
        if len(details) <= 1:
            continue
        # The child itself overflowed: wrap its pieces in an InternalNode.
        if child_prefix != sub_prefix:
            # This node has been split and is now found via a different
            # path
            children.pop(child_prefix)
        wrapper = InternalNode(sub_prefix,
                               search_key_func=self._search_key_func)
        wrapper.set_maximum_size(self._maximum_size)
        wrapper._key_width = self._key_width
        for split, piece in details:
            wrapper.add_node(split, piece)
        children[child_prefix] = wrapper
    return shared_prefix, children.items()

832

833

def map(self, store, key, value):
    """Map key to value.

    :param store: Only used if the node has to be split.
    :param key: The key to map.
    :param value: The value to store for key.
    :return: The result of self._split(store) when the node overflowed,
        otherwise (self._search_prefix, [("", self)]).
    """
    try:
        previous = self._items[key]
    except KeyError:
        pass
    else:
        # Replacing an existing entry: take its contribution back out so
        # that _map_no_split can account for the key afresh.
        self._raw_size -= self._key_value_len(key, previous)
        self._len -= 1
    # The content is changing, so any previously computed key is stale.
    self._key = None
    if self._map_no_split(key, value):
        return self._split(store)
    if self._search_prefix is _unknown:
        raise AssertionError('%r must be known' % self._search_prefix)
    return self._search_prefix, [("", self)]

845

846

def serialise(self, store):
    """Serialise the LeafNode to store.

    :param store: A VersionedFiles honouring the CHK extensions.
    :return: An iterable of the keys inserted by this operation.
    :raises AssertionError: If the cached prefix or size bookkeeping does
        not agree with the serialised text.
    """
    common = self._common_serialised_prefix
    # Header: type marker, maximum size, key width, item count.
    lines = [
        "chkleaf:\n",
        "%d\n" % self._maximum_size,
        "%d\n" % self._key_width,
        "%d\n" % self._len,
    ]
    if common is None:
        lines.append('\n')
        if len(self._items) != 0:
            raise AssertionError('If _common_serialised_prefix is None'
                ' we should have no items')
    else:
        lines.append('%s\n' % (common,))
        prefix_len = len(common)
    for key, value in sorted(self._items.items()):
        # Always add a final newline
        value_lines = osutils.chunks_to_lines([value + '\n'])
        entry = "%s\x00%s\n" % (self._serialise_key(key),
                                len(value_lines))
        if not entry.startswith(common):
            raise AssertionError('We thought the common prefix was %r'
                ' but entry %r does not have it in common'
                % (common, entry))
        # The common prefix is stored once in the header, not per entry.
        lines.append(entry[prefix_len:])
        lines.extend(value_lines)
    sha1, _, _ = store.add_lines((None,), (), lines)
    self._key = ("sha1:" + sha1,)
    text = ''.join(lines)
    if len(text) != self._current_size():
        raise AssertionError('Invalid _current_size')
    _page_cache.add(self._key, text)
    return [self._key]

882

883

def refs(self):
    """Return the references to other CHK's held by this node.

    :return: Always a new empty list.
    """
    no_refs = []
    return no_refs

886

887

def _compute_search_prefix(self):

888

"""Determine the common search prefix for all keys in this node.

889

890

:return: A bytestring of the longest search key prefix that is

891

unique within this node.

892

"""

893

search_keys = [self._search_key_func(key) for key in self._items]

894

self._search_prefix = self.common_prefix_for_keys(search_keys)

895

return self._search_prefix

896

897

def _are_search_keys_identical(self):

898

"""Check to see if the search keys for all entries are the same.

899

900

When using a hash as the search_key it is possible for non-identical

901

keys to collide. If that happens enough, we may try overflow a

902

LeafNode, but as all are collisions, we must not split.

903

"""

904

common_search_key = None

905

for key in self._items:

906

search_key = self._search_key(key)

907

if common_search_key is None:

908

common_search_key = search_key

909

elif search_key != common_search_key:

910

return False

911

return True

912

913

def _compute_serialised_prefix(self):

914

"""Determine the common prefix for serialised keys in this node.

915

916

:return: A bytestring of the longest serialised key prefix that is

917

unique within this node.

918

"""

919

serialised_keys = [self._serialise_key(key) for key in self._items]

920

self._common_serialised_prefix = self.common_prefix_for_keys(

921

serialised_keys)

922

return self._common_serialised_prefix

923

924

def unmap(self, store, key):
    """Unmap key from the node.

    :param store: Unused by this method.
    :param key: The key to remove.
    :return: self.
    :raises KeyError: If key is not present; the miss is logged via
        trace.mutter before the error is re-raised.
    """
    try:
        removed_size = self._key_value_len(key, self._items[key])
    except KeyError:
        trace.mutter("key %s not found in %r", key, self._items)
        raise
    self._raw_size -= removed_size
    self._len -= 1
    self._items.pop(key)
    # The content changed, so any previously computed key is stale.
    self._key = None
    # Recompute from scratch
    self._compute_search_prefix()
    self._compute_serialised_prefix()
    return self

938

939

940

class InternalNode(Node):
    """A node that contains references to other nodes.

    An InternalNode is responsible for mapping search key prefixes to child
    nodes.

    :ivar _items: serialised_key => node dictionary. node may be a tuple,
        LeafNode or InternalNode.
    """

    def __init__(self, prefix='', search_key_func=None):
        """Create an InternalNode with no children.

        :param prefix: The search prefix shared by everything that will be
            stored below this node.
        :param search_key_func: Function mapping a key to its search key.
            Defaults to _search_key_plain when None.
        """
        Node.__init__(self)
        # How many octets key prefixes within this node are.
        self._node_width = 0
        self._search_prefix = prefix
        if search_key_func is None:
            self._search_key_func = _search_key_plain
        else:
            self._search_key_func = search_key_func

    def add_node(self, prefix, node):
        """Add a child node with prefix prefix, and node node.

        :param prefix: The search key prefix for node. It must start with
            this node's search prefix and be exactly one character longer.
        :param node: The node being added.
        :raises AssertionError: If prefix does not satisfy the constraints
            above.
        """
        if self._search_prefix is None:
            raise AssertionError("_search_prefix should not be None")
        if not prefix.startswith(self._search_prefix):
            raise AssertionError("prefixes mismatch: %s must start with %s"
                % (prefix,self._search_prefix))
        if len(prefix) != len(self._search_prefix) + 1:
            raise AssertionError("prefix wrong length: len(%s) is not %d" %
                (prefix, len(self._search_prefix) + 1))
        self._len += len(node)
        if not len(self._items):
            # The first child fixes the width of every prefix in this node.
            self._node_width = len(prefix)
        if self._node_width != len(self._search_prefix) + 1:
            raise AssertionError("node width mismatch: %d is not %d" %
                (self._node_width, len(self._search_prefix) + 1))
        self._items[prefix] = node
        # The content changed, so any previously computed key is stale.
        self._key = None

    def _current_size(self):
        """Answer the current serialised size of this node."""
        return (self._raw_size + len(str(self._len)) + len(str(self._key_width)) +
            len(str(self._maximum_size)))

    @classmethod
    def deserialise(klass, bytes, key, search_key_func=None):
        """Deserialise bytes to an InternalNode, with key key.

        :param bytes: The bytes of the node.
        :param key: The key that the serialised node has.
        :param search_key_func: Passed through to
            _deserialise_internal_node.
        :return: An InternalNode instance.
        """
        return _deserialise_internal_node(bytes, key,
            search_key_func=search_key_func)

    def iteritems(self, store, key_filter=None):
        """Iterate over the items of every child that matches key_filter.

        :param store: A store to use for reading child nodes.
        :param key_filter: Passed to _iter_nodes; the per-child filter it
            returns is passed on to each child's iteritems.
        """
        for node, node_filter in self._iter_nodes(store, key_filter=key_filter):
            for item in node.iteritems(store, key_filter=node_filter):
                yield item

    def _iter_nodes(self, store, key_filter=None, batch_size=None):
        """Iterate over node objects which match key_filter.

        :param store: A store to use for accessing content.
        :param key_filter: A key filter to filter nodes. Only nodes that might
            contain a key in key_filter will be returned.
        :param batch_size: If not None, then we will return the nodes that had
            to be read using get_record_stream in batches, rather than reading
            them all at once.
        :return: An iterable of (node, node_key_filter) pairs. This function
            does not have to be fully consumed. (There will be no pending I/O
            when items are being returned.)
        """
        # Map from chk key ('sha1:...',) to (prefix, key_filter)
        # prefix is the key in self._items to use, key_filter is the key_filter
        # entries that would match this node
        keys = {}
        shortcut = False
        if key_filter is None:
            # yielding all nodes, yield whatever we have, and queue up a read
            # for whatever we are missing
            shortcut = True
            for prefix, node in self._items.iteritems():
                if node.__class__ is tuple:
                    keys[node] = (prefix, None)
                else:
                    yield node, None
        elif len(key_filter) == 1:
            # Technically, this path could also be handled by the first check
            # in 'self._node_width' in length_filters. However, we can handle
            # this case without spending any time building up the
            # prefix_to_keys, etc state.

            # This is a bit ugly, but TIMEIT showed it to be by far the fastest
            # 0.626us   list(key_filter)[0]
            #       is a func() for list(), 2 mallocs, and a getitem
            # 0.489us   [k for k in key_filter][0]
            #       still has the mallocs, avoids the func() call
            # 0.350us   iter(key_filter).next()
            #       has a func() call, and mallocs an iterator
            # 0.125us   for key in key_filter: pass
            #       no func() overhead, might malloc an iterator
            # 0.105us   for key in key_filter: break
            #       no func() overhead, might malloc an iterator, probably
            #       avoids checking an 'else' clause as part of the for
            for key in key_filter:
                break
            search_prefix = self._search_prefix_filter(key)
            if len(search_prefix) == self._node_width:
                # This item will match exactly, so just do a dict lookup, and
                # see what we can return
                shortcut = True
                try:
                    node = self._items[search_prefix]
                except KeyError:
                    # A given key can only match 1 child node, if it isn't
                    # there, then we can just return nothing
                    return
                if node.__class__ is tuple:
                    keys[node] = (search_prefix, [key])
                else:
                    # This is loaded, and the only thing that can match,
                    # return
                    yield node, [key]
                    return
        if not shortcut:
            # First, convert all keys into a list of search prefixes
            # Aggregate common prefixes, and track the keys they come from
            prefix_to_keys = {}
            length_filters = {}
            for key in key_filter:
                search_prefix = self._search_prefix_filter(key)
                length_filter = length_filters.setdefault(
                                    len(search_prefix), set())
                length_filter.add(search_prefix)
                prefix_to_keys.setdefault(search_prefix, []).append(key)

            if (self._node_width in length_filters
                and len(length_filters) == 1):
                # all of the search prefixes match exactly _node_width. This
                # means that everything is an exact match, and we can do a
                # lookup into self._items, rather than iterating over the items
                # dict.
                search_prefixes = length_filters[self._node_width]
                for search_prefix in search_prefixes:
                    try:
                        node = self._items[search_prefix]
                    except KeyError:
                        # We can ignore this one
                        continue
                    node_key_filter = prefix_to_keys[search_prefix]
                    if node.__class__ is tuple:
                        keys[node] = (search_prefix, node_key_filter)
                    else:
                        yield node, node_key_filter
            else:
                # The slow way. We walk every item in self._items, and check to
                # see if there are any matches
                length_filters = length_filters.items()
                for prefix, node in self._items.iteritems():
                    node_key_filter = []
                    for length, length_filter in length_filters:
                        sub_prefix = prefix[:length]
                        if sub_prefix in length_filter:
                            node_key_filter.extend(prefix_to_keys[sub_prefix])
                    if node_key_filter: # this key matched something, yield it
                        if node.__class__ is tuple:
                            keys[node] = (prefix, node_key_filter)
                        else:
                            yield node, node_key_filter
        if keys:
            # Look in the page cache for some more bytes
            found_keys = set()
            for key in keys:
                try:
                    bytes = _page_cache[key]
                except KeyError:
                    continue
                else:
                    node = _deserialise(bytes, key,
                        search_key_func=self._search_key_func)
                    prefix, node_key_filter = keys[key]
                    # Remember the loaded node in place of its reference.
                    self._items[prefix] = node
                    found_keys.add(key)
                    yield node, node_key_filter
            for key in found_keys:
                del keys[key]
        if keys:
            # demand load some pages.
            if batch_size is None:
                # Read all the keys in
                batch_size = len(keys)
            key_order = list(keys)
            for batch_start in range(0, len(key_order), batch_size):
                batch = key_order[batch_start:batch_start + batch_size]
                # We have to fully consume the stream so there is no pending
                # I/O, so we buffer the nodes for now.
                stream = store.get_record_stream(batch, 'unordered', True)
                node_and_filters = []
                for record in stream:
                    bytes = record.get_bytes_as('fulltext')
                    node = _deserialise(bytes, record.key,
                        search_key_func=self._search_key_func)
                    prefix, node_key_filter = keys[record.key]
                    node_and_filters.append((node, node_key_filter))
                    self._items[prefix] = node
                    _page_cache.add(record.key, bytes)
                for info in node_and_filters:
                    yield info

    def map(self, store, key, value):
        """Map key to value.

        :param store: A store to use for reading child nodes.
        :param key: The key to map.
        :param value: The value to store for key.
        :return: A (search_prefix, [('', node)]) tuple where node is the
            node that should now be used in place of self (self, a new
            parent, or the result of a remap).
        :raises AssertionError: If this node has no children, or its width
            bookkeeping is inconsistent.
        """
        if not len(self._items):
            raise AssertionError("can't map in an empty InternalNode.")
        search_key = self._search_key(key)
        if self._node_width != len(self._search_prefix) + 1:
            raise AssertionError("node width mismatch: %d is not %d" %
                (self._node_width, len(self._search_prefix) + 1))
        if not search_key.startswith(self._search_prefix):
            # This key doesn't fit in this index, so we need to split at the
            # point where it would fit, insert self into that internal node,
            # and then map this key into that node.
            new_prefix = self.common_prefix(self._search_prefix,
                                            search_key)
            new_parent = InternalNode(new_prefix,
                search_key_func=self._search_key_func)
            new_parent.set_maximum_size(self._maximum_size)
            new_parent._key_width = self._key_width
            new_parent.add_node(self._search_prefix[:len(new_prefix)+1],
                                self)
            return new_parent.map(store, key, value)
        children = [node for node, _
                          in self._iter_nodes(store, key_filter=[key])]
        if children:
            child = children[0]
        else:
            # new child needed:
            child = self._new_child(search_key, LeafNode)
        old_len = len(child)
        if type(child) is LeafNode:
            old_size = child._current_size()
        else:
            old_size = None
        prefix, node_details = child.map(store, key, value)
        if len(node_details) == 1:
            # child may have shrunk, or might be a new node
            child = node_details[0][1]
            self._len = self._len - old_len + len(child)
            self._items[search_key] = child
            self._key = None
            new_node = self
            if type(child) is LeafNode:
                if old_size is None:
                    # The old node was an InternalNode which means it has now
                    # collapsed, so we need to check if it will chain to a
                    # collapse at this level.
                    trace.mutter("checking remap as InternalNode -> LeafNode")
                    new_node = self._check_remap(store)
                else:
                    # If the LeafNode has shrunk in size, we may want to run
                    # a remap check. Checking for a remap is expensive though
                    # and the frequency of a successful remap is very low.
                    # Shrinkage by small amounts is common, so we only do the
                    # remap check if the new_size is low or the shrinkage
                    # amount is over a configurable limit.
                    new_size = child._current_size()
                    shrinkage = old_size - new_size
                    if ((shrinkage > 0 and new_size < _INTERESTING_NEW_SIZE)
                        or shrinkage > _INTERESTING_SHRINKAGE_LIMIT):
                        trace.mutter(
                            "checking remap as size shrunk by %d to be %d",
                            shrinkage, new_size)
                        new_node = self._check_remap(store)
            if new_node._search_prefix is None:
                raise AssertionError("_search_prefix should not be None")
            return new_node._search_prefix, [('', new_node)]
        # child has overflown - create a new intermediate node.
        # XXX: This is where we might want to try and expand our depth
        # to refer to more bytes of every child (which would give us
        # multiple pointers to child nodes, but less intermediate nodes)
        child = self._new_child(search_key, InternalNode)
        child._search_prefix = prefix
        for split, node in node_details:
            child.add_node(split, node)
        self._len = self._len - old_len + len(child)
        self._key = None
        return self._search_prefix, [("", self)]

    def _new_child(self, search_key, klass):
        """Create a new child node of type klass.

        The child inherits this node's maximum size, key width and search
        key function, and is stored in self._items under search_key.

        :param search_key: The key in self._items to store the child at.
        :param klass: The class to instantiate (called with no arguments).
        :return: The new child.
        """
        child = klass()
        child.set_maximum_size(self._maximum_size)
        child._key_width = self._key_width
        child._search_key_func = self._search_key_func
        self._items[search_key] = child
        return child

    def serialise(self, store):
        """Serialise the node to store.

        Loaded children whose _key is None are serialised first, then this
        node itself.

        :param store: A VersionedFiles honouring the CHK extensions.
        :return: An iterable of the keys inserted by this operation.
        """
        for node in self._items.itervalues():
            if type(node) is tuple:
                # Never deserialised.
                continue
            if node._key is not None:
                # Never altered
                continue
            for key in node.serialise(store):
                yield key
        lines = ["chknode:\n"]
        lines.append("%d\n" % self._maximum_size)
        lines.append("%d\n" % self._key_width)
        lines.append("%d\n" % self._len)
        if self._search_prefix is None:
            raise AssertionError("_search_prefix should not be None")
        lines.append('%s\n' % (self._search_prefix,))
        prefix_len = len(self._search_prefix)
        for prefix, node in sorted(self._items.items()):
            if type(node) is tuple:
                key = node[0]
            else:
                key = node._key[0]
            serialised = "%s\x00%s\n" % (prefix, key)
            if not serialised.startswith(self._search_prefix):
                raise AssertionError("prefixes mismatch: %s must start with %s"
                    % (serialised, self._search_prefix))
            # The search prefix is stored once in the header, not per line.
            lines.append(serialised[prefix_len:])
        sha1, _, _ = store.add_lines((None,), (), lines)
        self._key = ("sha1:" + sha1,)
        _page_cache.add(self._key, ''.join(lines))
        yield self._key

    def _search_key(self, key):
        """Return the serialised key for key in this node."""
        # search keys are fixed width. All will be self._node_width wide, so we
        # pad as necessary.
        return (self._search_key_func(key) + '\x00'*self._node_width)[:self._node_width]

    def _search_prefix_filter(self, key):
        """Serialise key for use as a prefix filter in iteritems."""
        return self._search_key_func(key)[:self._node_width]

    def _split(self, offset):
        """Split this node into smaller nodes starting at offset.

        Only the case where offset is at or beyond this node's width is
        handled, by delegating to the children. For a smaller offset
        nothing is yielded.

        :param offset: The offset to start the new child nodes at.
        :return: An iterable of (prefix, node) tuples. prefix is a byte
            prefix for reaching node.
        """
        if offset >= self._node_width:
            for node in self._items.values():
                for result in node._split(offset):
                    yield result
            return
        # NOTE(review): splitting inside this node's own width was never
        # implemented; the original body here was a loop that did nothing.

    def refs(self):
        """Return the references to other CHK's held by this node.

        :raises AssertionError: If this node has not been serialised
            (self._key is None).
        """
        if self._key is None:
            raise AssertionError("unserialised nodes have no refs.")
        refs = []
        for value in self._items.itervalues():
            if type(value) is tuple:
                # Not loaded: the tuple is the reference itself.
                refs.append(value)
            else:
                refs.append(value.key())
        return refs

    def _compute_search_prefix(self, extra_key=None):
        """Recompute and cache the common prefix of this node's child prefixes.

        :param extra_key: Unused; kept for interface compatibility.
        :return: The new value of self._search_prefix, as computed by
            common_prefix_for_keys over the keys of self._items.
        """
        self._search_prefix = self.common_prefix_for_keys(self._items)
        return self._search_prefix

    def unmap(self, store, key, check_remap=True):
        """Remove key from this node and its children.

        :param store: A store to use for reading child nodes.
        :param key: The key to remove.
        :param check_remap: If True, check whether the remaining content
            could be collapsed into a single LeafNode.
        :return: The node that should now be used in place of self.
        :raises KeyError: If no child can contain key, or the child does
            not contain it.
        """
        if not len(self._items):
            raise AssertionError("can't unmap in an empty InternalNode.")
        children = [node for node, _
                          in self._iter_nodes(store, key_filter=[key])]
        if children:
            child = children[0]
        else:
            raise KeyError(key)
        # Only adjust our own item count once the child has really removed
        # the key: child.unmap raises KeyError for a missing key, and
        # decrementing first would leave self._len permanently off by one.
        unmapped = child.unmap(store, key)
        self._len -= 1
        self._key = None
        search_key = self._search_key(key)
        if len(unmapped) == 0:
            # All child nodes are gone, remove the child:
            del self._items[search_key]
            unmapped = None
        else:
            # Stash the returned node
            self._items[search_key] = unmapped
        if len(self._items) == 1:
            # this node is no longer needed:
            return self._items.values()[0]
        if type(unmapped) is InternalNode:
            return self
        if check_remap:
            return self._check_remap(store)
        else:
            return self

    def _check_remap(self, store):
        """Check if all keys contained by children fit in a single LeafNode.

        :param store: A store to use for reading more nodes
        :return: Either self, or a new LeafNode which should replace self.
        """
        # Logic for how we determine when we need to rebuild
        # 1) Implicitly unmap() is removing a key which means that the child
        #    nodes are going to be shrinking by some extent.
        # 2) If all children are LeafNodes, it is possible that they could be
        #    combined into a single LeafNode, which can then completely replace
        #    this internal node with a single LeafNode
        # 3) If *one* child is an InternalNode, we assume it has already done
        #    all the work to determine that its children cannot collapse, and
        #    we can then assume that those nodes *plus* the current nodes don't
        #    have a chance of collapsing either.
        #    So a very cheap check is to just say if 'unmapped' is an
        #    InternalNode, we don't have to check further.

        # TODO: Another alternative is to check the total size of all known
        #       LeafNodes. If there is some formula we can use to determine the
        #       final size without actually having to read in any more
        #       children, it would be nice to have. However, we have to be
        #       careful with stuff like nodes that pull out the common prefix
        #       of each key, as adding a new key can change the common prefix
        #       and cause size changes greater than the length of one key.
        #       So for now, we just add everything to a new Leaf until it
        #       splits, as we know that will give the right answer
        new_leaf = LeafNode(search_key_func=self._search_key_func)
        new_leaf.set_maximum_size(self._maximum_size)
        new_leaf._key_width = self._key_width
        # A batch_size of 16 was chosen because:
        #   a) In testing, a 4k page held 14 times. So if we have more than 16
        #      leaf nodes we are unlikely to hold them in a single new leaf
        #      node. This still allows for 1 round trip
        #   b) With 16-way fan out, we can still do a single round trip
        #   c) With 255-way fan out, we don't want to read all 255 and destroy
        #      the page cache, just to determine that we really don't need it.
        for node, _ in self._iter_nodes(store, batch_size=16):
            if type(node) is InternalNode:
                # Without looking at any leaf nodes, we are sure
                return self
            for key, value in node._items.iteritems():
                if new_leaf._map_no_split(key, value):
                    # The combined content would overflow one leaf.
                    return self
        trace.mutter("remap generated a new LeafNode")
        return new_leaf

1403

1404

1405

def _deserialise(bytes, key, search_key_func):

1406

"""Helper for repositorydetails - convert bytes to a node."""

1407

if bytes.startswith("chkleaf:\n"):

1408

node = LeafNode.deserialise(bytes, key, search_key_func=search_key_func)

1409

elif bytes.startswith("chknode:\n"):

1410

node = InternalNode.deserialise(bytes, key,

1411

search_key_func=search_key_func)

1412

else:

1413

raise AssertionError("Unknown node type.")

1414

return node

1415

1416

1417

class CHKMapDifference(object):

1418

"""Iterate the stored pages and key,value pairs for (new - old).

1419

1420

This class provides a generator over the stored CHK pages and the

1421

(key, value) pairs that are in any of the new maps and not in any of the

1422

old maps.

1423

1424

Note that it may yield chk pages that are common (especially root nodes),

1425

but it won't yield (key,value) pairs that are common.

1426

"""

1427

1428

def __init__(self, store, new_root_keys, old_root_keys,

1429

search_key_func, pb=None):

1430

self._store = store

1431

self._new_root_keys = new_root_keys

1432

self._old_root_keys = old_root_keys

1433

self._pb = pb

1434

# All uninteresting chks that we have seen. By the time they are added

1435

# here, they should be either fully ignored, or queued up for

1436

# processing

1437

self._all_old_chks = set(self._old_root_keys)

1438

# All items that we have seen from the old_root_keys

1439

self._all_old_items = set()

1440

# These are interesting items which were either read, or already in the

1441

# interesting queue (so we don't need to walk them again)

1442

self._processed_new_refs = set()

1443

self._search_key_func = search_key_func

1444

1445

# The uninteresting and interesting nodes to be searched

1446

self._old_queue = []

1447

self._new_queue = []

1448

# Holds the (key, value) items found when processing the root nodes,

1449

# waiting for the uninteresting nodes to be walked

1450

self._new_item_queue = []

1451

self._state = None

1452

1453

def _read_nodes_from_store(self, keys):
    """Read and deserialise the pages for keys, one record at a time.

    :param keys: The keys to request from self._store.
    :return: A generator of (record, node, prefix_refs, items) tuples.
        For an InternalNode prefix_refs holds the node's items and items
        is empty; for any other node it is the other way round.
    :raises errors.NoSuchRevision: If a record comes back as 'absent'.
    """
    # We chose not to use _page_cache, because we think in terms of records
    # to be yielded. Also, we expect to touch each page only 1 time during
    # this code. (We may want to evaluate saving the raw bytes into the
    # page cache, which would allow a working tree update after the fetch
    # to not have to read the bytes again.)
    for record in self._store.get_record_stream(keys, 'unordered', True):
        progress = self._pb
        if progress is not None:
            progress.tick()
        if record.storage_kind == 'absent':
            raise errors.NoSuchRevision(self._store, record.key)
        text = record.get_bytes_as('fulltext')
        node = _deserialise(text, record.key,
                            search_key_func=self._search_key_func)
        entries = node._items.items()
        if type(node) is InternalNode:
            # Note we don't have to do node.refs() because we know that
            # there are no children that have been pushed into this node
            yield record, node, entries, []
        else:
            yield record, node, [], entries

1477

1478

def _read_old_roots(self):

1479

old_chks_to_enqueue = []

1480

all_old_chks = self._all_old_chks

1481

for record, node, prefix_refs, items in \

1482

self._read_nodes_from_store(self._old_root_keys):

1483

# Uninteresting node

1484

prefix_refs = [p_r for p_r in prefix_refs

1485

if p_r[1] not in all_old_chks]

1486

new_refs = [p_r[1] for p_r in prefix_refs]

1487

all_old_chks.update(new_refs)

1488

self._all_old_items.update(items)

1489

# Queue up the uninteresting references

1490

# Don't actually put them in the 'to-read' queue until we have

1491

# finished checking the interesting references

1492

old_chks_to_enqueue.extend(prefix_refs)

1493

return old_chks_to_enqueue

1494

1495

def _enqueue_old(self, new_prefixes, old_chks_to_enqueue):

1496

# At this point, we have read all the uninteresting and interesting

1497

# items, so we can queue up the uninteresting stuff, knowing that we've

1498

# handled the interesting ones

1499

for prefix, ref in old_chks_to_enqueue:

1500

not_interesting = True

1501

for i in xrange(len(prefix), 0, -1):

1502

if prefix[:i] in new_prefixes:

1503

not_interesting = False

1504

break

1505

if not_interesting:

1506

# This prefix is not part of the remaining 'interesting set'

1507

continue

1508

self._old_queue.append(ref)

1509

1510

def _read_all_roots(self):

1511

"""Read the root pages.

1512

1513

This is structured as a generator, so that the root records can be

1514

yielded up to whoever needs them without any buffering.

1515

"""

1516

# This is the bootstrap phase

1517

if not self._old_root_keys:

1518

# With no old_root_keys we can just shortcut and be ready

1519

# for _flush_new_queue

1520

self._new_queue = list(self._new_root_keys)

1521

return

1522

old_chks_to_enqueue = self._read_old_roots()

1523

# filter out any root keys that are already known to be uninteresting

1524

new_keys = set(self._new_root_keys).difference(self._all_old_chks)

1525

# These are prefixes that are present in new_keys that we are

1526

# thinking to yield

1527

new_prefixes = set()

1528

# We are about to yield all of these, so we don't want them getting

1529

# added a second time

1530

processed_new_refs = self._processed_new_refs

1531

processed_new_refs.update(new_keys)

1532

for record, node, prefix_refs, items in \

1533

self._read_nodes_from_store(new_keys):

1534

# At this level, we now know all the uninteresting references

1535

# So we filter and queue up whatever is remaining

1536

prefix_refs = [p_r for p_r in prefix_refs

1537

if p_r[1] not in self._all_old_chks

1538

and p_r[1] not in processed_new_refs]

1539

refs = [p_r[1] for p_r in prefix_refs]

1540

new_prefixes.update([p_r[0] for p_r in prefix_refs])

1541

self._new_queue.extend(refs)

1542

# TODO: We can potentially get multiple items here, however the

1543

# current design allows for this, as callers will do the work

1544

# to make the results unique. We might profile whether we

1545

# gain anything by ensuring unique return values for items

1546

new_items = [item for item in items

1547

if item not in self._all_old_items]

1548

self._new_item_queue.extend(new_items)

1549

new_prefixes.update([self._search_key_func(item[0])

1550

for item in new_items])

1551

processed_new_refs.update(refs)

1552

yield record

1553

# For new_prefixes we have the full length prefixes queued up.

1554

# However, we also need possible prefixes. (If we have a known ref to

1555

# 'ab', then we also need to include 'a'.) So expand the

1556

# new_prefixes to include all shorter prefixes

1557

for prefix in list(new_prefixes):

1558

new_prefixes.update([prefix[:i] for i in xrange(1, len(prefix))])

1559

self._enqueue_old(new_prefixes, old_chks_to_enqueue)

1560

1561

def _flush_new_queue(self):

1562

# No need to maintain the heap invariant anymore, just pull things out

1563

# and process them

1564

refs = set(self._new_queue)

1565

self._new_queue = []

1566

# First pass, flush all interesting items and convert to using direct refs

1567

all_old_chks = self._all_old_chks

1568

processed_new_refs = self._processed_new_refs

1569

all_old_items = self._all_old_items

1570

new_items = [item for item in self._new_item_queue

1571

if item not in all_old_items]

1572

self._new_item_queue = []

1573

if new_items:

1574

yield None, new_items

1575

refs = refs.difference(all_old_chks)

1576

while refs:

1577

next_refs = set()

1578

next_refs_update = next_refs.update

1579

# Inlining _read_nodes_from_store improves 'bzr branch bzr.dev'

1580

# from 1m54s to 1m51s. Consider it.

1581

for record, _, p_refs, items in self._read_nodes_from_store(refs):

1582

items = [item for item in items

1583

if item not in all_old_items]

1584

yield record, items

1585

next_refs_update([p_r[1] for p_r in p_refs])

1586

next_refs = next_refs.difference(all_old_chks)

1587

next_refs = next_refs.difference(processed_new_refs)

1588

processed_new_refs.update(next_refs)

1589

refs = next_refs

1590

1591

def _process_next_old(self):
    """Read every node in the old queue and queue up its children.

    The items of each node read are added to self._all_old_items.  Child
    references that are not yet in self._all_old_chks are recorded there
    and appended to the fresh self._old_queue.
    """
    # Old references are not filtered any further than _read_all_roots
    # already did, so the whole queue is read in a single pass.
    batch = self._old_queue
    self._old_queue = []
    known_old_chks = self._all_old_chks
    for _record, _node, child_refs, leaf_items in \
            self._read_nodes_from_store(batch):
        self._all_old_items.update(leaf_items)
        unseen = [ref for _prefix, ref in child_refs
                  if ref not in known_old_chks]
        self._old_queue.extend(unseen)
        known_old_chks.update(unseen)

1602

1603

def _process_queues(self):
    """Exhaust the old queue, then hand back the new-queue generator.

    :return: Whatever self._flush_new_queue() returns.
    """
    # Keep calling _process_next_old() until the old queue is empty.
    while self._old_queue:
        self._process_next_old()
    new_nodes = self._flush_new_queue()
    return new_nodes

1607

1608

def process(self):
    """Yield (record, items) pairs for the interesting nodes.

    The records from self._read_all_roots() come first, each paired with
    an empty list.  After that every pair produced by
    self._process_queues() is passed through.
    """
    for root_record in self._read_all_roots():
        yield root_record, []
    for pair in self._process_queues():
        record, items = pair
        yield record, items

1613

1614

1615

def iter_interesting_nodes(store, interesting_root_keys,
                           uninteresting_root_keys, pb=None):
    """Given root keys, find the interesting nodes.

    Nodes referenced by interesting_root_keys are evaluated.  Those that
    are also referenced from uninteresting_root_keys are not considered
    interesting.

    :param store: Passed to CHKMapDifference; its _search_key_func
        attribute is used as the search key function.
    :param interesting_root_keys: keys which should be part of the
        "interesting" nodes (which will be yielded)
    :param uninteresting_root_keys: keys which should be filtered out of
        the result set.
    :param pb: Forwarded unchanged to CHKMapDifference (presumably a
        progress bar; may be None).
    :return: The iterator returned by CHKMapDifference.process().  It
        yields (record, items) pairs, where items is a list of the
        interesting (key, value) items and record may be None.
    """
    return CHKMapDifference(
        store,
        interesting_root_keys,
        uninteresting_root_keys,
        search_key_func=store._search_key_func,
        pb=pb,
        ).process()

1634

1635

1636

# Pick the implementation of the search-key and node deserialisation helpers.
# bzrlib._chk_map_pyx is tried first (presumably the compiled extension built
# from _chk_map_pyx.pyx); if importing it raises ImportError the same four
# names are taken from bzrlib._chk_map_py instead.
# NOTE(review): the bare integers between the statements look like line-number
# residue from the web viewer this text was captured from, not real code.
try:

1637

from bzrlib._chk_map_pyx import (

1638

_search_key_16,

1639

_search_key_255,

1640

_deserialise_leaf_node,

1641

_deserialise_internal_node,

1642

)

1643

except ImportError:

1644

from bzrlib._chk_map_py import (

1645

_search_key_16,

1646

_search_key_255,

1647

_deserialise_leaf_node,

1648

_deserialise_internal_node,

1649

)

1650

# Register whichever search-key functions were imported above under the names
# 'hash-16-way' and 'hash-255-way'.
search_key_registry.register('hash-16-way', _search_key_16)

1651

search_key_registry.register('hash-255-way', _search_key_255)

Older »