~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Canonical.com Patch Queue Manager
Date: 2010-09-01 08:02:42 UTC
mfrom: (5390.3.3 faster-revert-593560)
Revision ID: pqm@pqm.ubuntu.com-20100901080242-esg62ody4frwmy66

(spiv) Avoid repeatedly calling self.target.all_file_ids() in
InterTree.iter_changes. (Andrew Bennetts)

files added:
.testr.conf

MANIFEST.in

NEWS-template.txt

README_BDIST_RPM

apport

apport/README

apport/bzr-crashdb.conf

apport/source_bzr.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/api.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/cache_utf8.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cleanup.py

bzrlib/cmd_version_info.py

bzrlib/cmdline.py

bzrlib/controldir.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc_generate/builders

bzrlib/doc_generate/builders/__init__.py

bzrlib/doc_generate/builders/texinfo.py

bzrlib/doc_generate/conf.py

bzrlib/doc_generate/writers

bzrlib/doc_generate/writers/__init__.py

bzrlib/doc_generate/writers/texinfo.py

bzrlib/email_message.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/conflict-types.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/location-alias.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/help_topics/es

bzrlib/help_topics/es/conflict-types.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inventory_delta.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/library_state.py

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/pack.py

bzrlib/patiencediff.py

bzrlib/plugins/bash_completion

bzrlib/plugins/bash_completion/README.txt

bzrlib/plugins/bash_completion/__init__.py

bzrlib/plugins/bash_completion/bashcomp.py

bzrlib/plugins/bash_completion/tests

bzrlib/plugins/bash_completion/tests/__init__.py

bzrlib/plugins/bash_completion/tests/test_bashcomp.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/plugins/news_merge

bzrlib/plugins/news_merge/README

bzrlib/plugins/news_merge/__init__.py

bzrlib/plugins/news_merge/news_merge.py

bzrlib/plugins/news_merge/parser.py

bzrlib/plugins/news_merge/tests

bzrlib/plugins/news_merge/tests/__init__.py

bzrlib/plugins/news_merge/tests/test_news_merge.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconfigure.py

bzrlib/recordcounter.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/static_tuple.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/tag.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_deleted.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_lookup_revision.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_rmbranch.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_revert.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/doc_generate

bzrlib/tests/doc_generate/__init__.py

bzrlib/tests/doc_generate/builders

bzrlib/tests/doc_generate/builders/__init__.py

bzrlib/tests/doc_generate/builders/test_texinfo.py

bzrlib/tests/doc_generate/writers

bzrlib/tests/doc_generate/writers/__init__.py

bzrlib/tests/doc_generate/writers/test_texinfo.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/fixtures.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/https_server.py

bzrlib/tests/matchers.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_config.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_controldir/test_push.py

bzrlib/tests/per_controldir_colo

bzrlib/tests/per_controldir_colo/__init__.py

bzrlib/tests/per_controldir_colo/test_supported.py

bzrlib/tests/per_controldir_colo/test_unsupported.py

bzrlib/tests/per_foreign_vcs

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_foreign_vcs/test_repository.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_copy_content_into.py

bzrlib/tests/per_interbranch/test_get.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_locking.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_symlinks.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/test__annotator.py

bzrlib/tests/test__bencode.py

bzrlib/tests/test__btree_serializer.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_cleanup.py

bzrlib/tests/test_cmdline.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_fixtures.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_import_tariff.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_library_state.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_matchers.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patches_data/binary-after-normal.patch

bzrlib/tests/test_patches_data/binary.patch

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_script.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_server.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_test_server.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_treeshape.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/timestamp.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/ftp

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/gio_transport.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/log.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/transport/remote.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/views.py

bzrlib/workingtree_4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

contrib/bash/bzr

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/debian

contrib/debian/default

contrib/debian/init.d

contrib/zsh/README

doc/Bazaar-Logo-For-Manuals.png

doc/developers

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr-doc.css

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/code-review.txt

doc/developers/code-style.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/conf.py

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/contribution-quickstart.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/miscellaneous-notes.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/principles.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/transports.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/developers/win32_build_setup.txt

doc/en

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/advanced.txt

doc/en/admin-guide/backup.txt

doc/en/admin-guide/code-browsing.txt

doc/en/admin-guide/hooks-plugins.txt

doc/en/admin-guide/index-plain.txt

doc/en/admin-guide/index.txt

doc/en/admin-guide/integration.txt

doc/en/admin-guide/introduction.txt

doc/en/admin-guide/migration.txt

doc/en/admin-guide/other-setups.txt

doc/en/admin-guide/security.txt

doc/en/admin-guide/simple-setups.txt

doc/en/admin-guide/upgrade.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/en/whats-new

doc/en/whats-new/whats-new-in-2.1.txt

doc/en/whats-new/whats-new-in-2.2.txt

doc/en/whats-new/whats-new-in-2.3.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ja.txt

doc/index.ru.txt

doc/index.txt

doc/ja

doc/ja/_static

doc/ja/_static/bzr icon 16.png

doc/ja/_static/bzr.ico

doc/ja/_templates

doc/ja/conf.py

doc/ja/index.txt

doc/ja/mini-tutorial

doc/ja/mini-tutorial/index.txt

doc/ja/tutorials

doc/ja/tutorials/centralized_workflow.txt

doc/ja/tutorials/index.txt

doc/ja/tutorials/tutorial.txt

doc/ja/tutorials/using_bazaar_with_launchpad.txt

doc/ja/upgrade-guide

doc/ja/upgrade-guide/data_migration.txt

doc/ja/upgrade-guide/index.txt

doc/ja/upgrade-guide/overview.txt

doc/ja/upgrade-guide/tips_and_tricks.txt

doc/ja/user-guide

doc/ja/user-guide/adv_merging.txt

doc/ja/user-guide/annotating_changes.txt

doc/ja/user-guide/bazaar_workflows.txt

doc/ja/user-guide/branching_a_project.txt

doc/ja/user-guide/browsing_history.txt

doc/ja/user-guide/bug_trackers.txt

doc/ja/user-guide/bzrtools_plugin.txt

doc/ja/user-guide/central_intro.txt

doc/ja/user-guide/configuring_bazaar.txt

doc/ja/user-guide/controlling_registration.txt

doc/ja/user-guide/core_concepts.txt

doc/ja/user-guide/distributed_intro.txt

doc/ja/user-guide/entering_commands.txt

doc/ja/user-guide/filtered_views.txt

doc/ja/user-guide/getting_help.txt

doc/ja/user-guide/hooks.txt

doc/ja/user-guide/http_smart_server.txt

doc/ja/user-guide/images

doc/ja/user-guide/images/workflows_centralized.png

doc/ja/user-guide/images/workflows_centralized.svg

doc/ja/user-guide/images/workflows_gatekeeper.png

doc/ja/user-guide/images/workflows_gatekeeper.svg

doc/ja/user-guide/images/workflows_localcommit.png

doc/ja/user-guide/images/workflows_localcommit.svg

doc/ja/user-guide/images/workflows_peer.png

doc/ja/user-guide/images/workflows_peer.svg

doc/ja/user-guide/images/workflows_pqm.png

doc/ja/user-guide/images/workflows_pqm.svg

doc/ja/user-guide/images/workflows_shared.png

doc/ja/user-guide/images/workflows_shared.svg

doc/ja/user-guide/images/workflows_single.png

doc/ja/user-guide/images/workflows_single.svg

doc/ja/user-guide/index.txt

doc/ja/user-guide/installing_bazaar.txt

doc/ja/user-guide/introducing_bazaar.txt

doc/ja/user-guide/merging_changes.txt

doc/ja/user-guide/organizing_branches.txt

doc/ja/user-guide/organizing_your_workspace.txt

doc/ja/user-guide/part2_intro.txt

doc/ja/user-guide/partner_intro.txt

doc/ja/user-guide/plugins.txt

doc/ja/user-guide/publishing_a_branch.txt

doc/ja/user-guide/recording_changes.txt

doc/ja/user-guide/releasing_a_project.txt

doc/ja/user-guide/resolving_conflicts.txt

doc/ja/user-guide/reusing_a_checkout.txt

doc/ja/user-guide/reviewing_changes.txt

doc/ja/user-guide/sending_changes.txt

doc/ja/user-guide/server.txt

doc/ja/user-guide/setting_up_email.txt

doc/ja/user-guide/shared_repository_layouts.txt

doc/ja/user-guide/shelving_changes.txt

doc/ja/user-guide/solo_intro.txt

doc/ja/user-guide/specifying_revisions.txt

doc/ja/user-guide/stacked.txt

doc/ja/user-guide/starting_a_project.txt

doc/ja/user-guide/svn_plugin.txt

doc/ja/user-guide/undoing_mistakes.txt

doc/ja/user-guide/using_aliases.txt

doc/ja/user-guide/using_checkouts.txt

doc/ja/user-guide/using_gatekeepers.txt

doc/ja/user-guide/version_info.txt

doc/ja/user-guide/web_browsing.txt

doc/ja/user-guide/working_offline_central.txt

doc/ja/user-guide/writing_a_plugin.txt

doc/ja/user-guide/zen.txt

doc/ja/user-reference

doc/ja/user-reference/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/check-newsbugs.py

tools/generate_release_notes.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-control.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/py2exe_boot_common.py

tools/win32/run_script.py

files removed:
NEWS.developers

build-api

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_escaped_store.py

bzrlib/textui.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weave_commands.py

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/fortune

contrib/zsh/_bzr

doc/README.1st

doc/index.txt

tools/biobench.py

tools/history2revfiles.py

tools/win32/copy_docs.py

files renamed:
bzrlib/patiencediff.py => bzrlib/_patiencediff_py.py

bzrlib/graph.py => bzrlib/deprecated_graph.py

tools/doc_generate/ => bzrlib/doc_generate/

doc/configuration.txt => bzrlib/help_topics/en/configuration.txt

bzrlib/tests/blackbox/test_bundle.py => bzrlib/tests/blackbox/test_send.py

bzrlib/tests/HTTPTestUtil.py => bzrlib/tests/http_utils.py

bzrlib/tests/branch_implementations/ => bzrlib/tests/per_branch/

bzrlib/tests/bzrdir_implementations/ => bzrlib/tests/per_controldir/

bzrlib/tests/bzrdir_implementations/test_bzrdir.py => bzrlib/tests/per_controldir/test_controldir.py

bzrlib/tests/interrepository_implementations/ => bzrlib/tests/per_interrepository/

bzrlib/tests/intertree_implementations/ => bzrlib/tests/per_intertree/

bzrlib/tests/repository_implementations/ => bzrlib/tests/per_repository/

bzrlib/tests/test_revprops.py => bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/test_transport_implementations.py => bzrlib/tests/per_transport.py

bzrlib/tests/tree_implementations/ => bzrlib/tests/per_tree/

bzrlib/tests/test_versionedfile.py => bzrlib/tests/per_versionedfile.py

bzrlib/tests/workingtree_implementations/ => bzrlib/tests/per_workingtree/

bzrlib/tests/test_command.py => bzrlib/tests/test_commands.py

bzrlib/tests/test_graph.py => bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/tests/test_revisionspec.py

bzrlib/transport/ftp.py => bzrlib/transport/ftp/__init__.py

bzrlib/win32console.py => bzrlib/win32utils.py

bzrlib/xml5.py => bzrlib/xml8.py

HACKING => doc/developers/HACKING.txt

doc/tutorial.txt => doc/en/tutorials/tutorial.txt

doc/plugins.txt => doc/en/user-guide/plugins.txt

doc/setting_up_email.txt => doc/en/user-guide/setting_up_email.txt

doc/specifying_revisions.txt => doc/en/user-guide/specifying_revisions.txt

doc/using_aliases.txt => doc/en/user-guide/using_aliases.txt

generate_docs.py => tools/generate_docs.py

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_controldir/__init__.py

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml_serializer.py

contrib/newinventory.py

contrib/pwclient.full

doc/default.css

profile_imports.py

setup.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/http_client.py

tools/trace-revisions

tools/weavebench.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/start_bzr.bat

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

)

from bzrlib.static_tuple import StaticTuple

_HEADER_READV = (0, 200)

_OPTION_KEY_ELEMENTS = "key_elements="

_OPTION_LEN = "len="

_OPTION_NODE_REFS = "node_ref_lists="

_SIGNATURE = "Bazaar Graph Index 1\n"

_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

_newline_null_re = re.compile('[\n\0]')

def _has_key_from_parent_map(self, key):

"""Check if this index has one key.

If it's possible to check for multiple keys at once through

calling get_parent_map that should be faster.

"""

return (key in self.get_parent_map([key]))

def _missing_keys_from_parent_map(self, keys):

return set(keys) - set(self.get_parent_map(keys))

class GraphIndexBuilder(object):

"""A builder that can build a GraphIndex.

The resulting graph has the structure:

_SIGNATURE OPTIONS NODES NEWLINE

_SIGNATURE := 'Bazaar Graph Index 1' NEWLINE

OPTIONS := 'node_ref_lists=' DIGITS NEWLINE

NODES := NODE*

NODE := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

KEY := Not-whitespace-utf8

ABSENT := 'a'

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

REFERENCE := DIGITS ; digits is the byte offset in the index of the

; referenced key.

VALUE := no-newline-no-null-bytes

"""

def __init__(self, reference_lists=0, key_elements=1):

"""Create a GraphIndex builder.

:param reference_lists: The number of node references lists for each

entry.

:param key_elements: The number of bytestrings in each key.

"""

self.reference_lists = reference_lists

# A dict of {key: (absent, ref_lists, value)}

self._nodes = {}

# Keys that are referenced but not actually present in this index

self._absent_keys = set()

100

self._nodes_by_key = None

101

self._key_length = key_elements

102

self._optimize_for_size = False

103

self._combine_backing_indices = True

104

105

def _check_key(self, key):

106

"""Raise BadIndexKey if key is not a valid key for this index."""

107

if type(key) not in (tuple, StaticTuple):

108

raise errors.BadIndexKey(key)

109

if self._key_length != len(key):

110

raise errors.BadIndexKey(key)

111

for element in key:

112

if not element or _whitespace_re.search(element) is not None:

113

raise errors.BadIndexKey(element)

114

115

def _external_references(self):

116

"""Return references that are not present in this index.

117

"""

118

keys = set()

119

refs = set()

120

# TODO: JAM 2008-11-21 This makes an assumption about how the reference

121

# lists are used. It is currently correct for pack-0.92 through

122

# 1.9, which use the node references (3rd column) second

123

# reference list as the compression parent. Perhaps this should

124

# be moved into something higher up the stack, since it

125

# makes assumptions about how the index is used.

126

if self.reference_lists > 1:

127

for node in self.iter_all_entries():

128

keys.add(node[1])

129

refs.update(node[3][1])

130

return refs - keys

131

else:

132

# If reference_lists == 0 there can be no external references, and

133

# if reference_lists == 1, then there isn't a place to store the

134

# compression parent

135

return set()

136

137

def _get_nodes_by_key(self):

138

if self._nodes_by_key is None:

139

nodes_by_key = {}

140

if self.reference_lists:

141

for key, (absent, references, value) in self._nodes.iteritems():

142

if absent:

143

continue

144

key_dict = nodes_by_key

145

for subkey in key[:-1]:

146

key_dict = key_dict.setdefault(subkey, {})

147

key_dict[key[-1]] = key, value, references

148

else:

149

for key, (absent, references, value) in self._nodes.iteritems():

150

if absent:

151

continue

152

key_dict = nodes_by_key

153

for subkey in key[:-1]:

154

key_dict = key_dict.setdefault(subkey, {})

155

key_dict[key[-1]] = key, value

156

self._nodes_by_key = nodes_by_key

157

return self._nodes_by_key

158

159

def _update_nodes_by_key(self, key, value, node_refs):

160

"""Update the _nodes_by_key dict with a new key.

161

162

For a key of (foo, bar, baz) create

163

_nodes_by_key[foo][bar][baz] = key_value

164

"""

165

if self._nodes_by_key is None:

166

return

167

key_dict = self._nodes_by_key

168

if self.reference_lists:

169

key_value = StaticTuple(key, value, node_refs)

170

else:

171

key_value = StaticTuple(key, value)

172

for subkey in key[:-1]:

173

key_dict = key_dict.setdefault(subkey, {})

174

key_dict[key[-1]] = key_value

175

176

def _check_key_ref_value(self, key, references, value):

177

"""Check that 'key' and 'references' are all valid.

178

179

:param key: A key tuple. Must conform to the key interface (be a tuple,

180

be of the right length, not have any whitespace or nulls in any key

181

element.)

182

:param references: An iterable of reference lists. Something like

183

[[(ref, key)], [(ref, key), (other, key)]]

184

:param value: The value associate with this key. Must not contain

185

newlines or null characters.

186

:return: (node_refs, absent_references)

187

node_refs basically a packed form of 'references' where all

188

iterables are tuples

189

absent_references reference keys that are not in self._nodes.

190

This may contain duplicates if the same key is

191

referenced in multiple lists.

192

"""

193

as_st = StaticTuple.from_sequence

194

self._check_key(key)

195

if _newline_null_re.search(value) is not None:

196

raise errors.BadIndexValue(value)

197

if len(references) != self.reference_lists:

198

raise errors.BadIndexValue(references)

199

node_refs = []

200

absent_references = []

201

for reference_list in references:

202

for reference in reference_list:

203

# If reference *is* in self._nodes, then we know it has already

204

# been checked.

205

if reference not in self._nodes:

206

self._check_key(reference)

207

absent_references.append(reference)

208

reference_list = as_st([as_st(ref).intern()

209

for ref in reference_list])

210

node_refs.append(reference_list)

211

return as_st(node_refs), absent_references

212

213

def add_node(self, key, value, references=()):

214

"""Add a node to the index.

215

216

:param key: The key. keys are non-empty tuples containing

217

as many whitespace-free utf8 bytestrings as the key length

218

defined for this index.

219

:param references: An iterable of iterables of keys. Each is a

220

reference to another key.

221

:param value: The value to associate with the key. It may be any

222

bytes as long as it does not contain \0 or \n.

223

"""

224

(node_refs,

225

absent_references) = self._check_key_ref_value(key, references, value)

226

if key in self._nodes and self._nodes[key][0] != 'a':

227

raise errors.BadIndexDuplicateKey(key, self)

228

for reference in absent_references:

229

# There may be duplicates, but I don't think it is worth worrying

230

# about

231

self._nodes[reference] = ('a', (), '')

232

self._absent_keys.update(absent_references)

233

self._absent_keys.discard(key)

234

self._nodes[key] = ('', node_refs, value)

235

if self._nodes_by_key is not None and self._key_length > 1:

236

self._update_nodes_by_key(key, value, node_refs)

237

238

def clear_cache(self):

239

"""See GraphIndex.clear_cache()

240

241

This is a no-op, but we need the api to conform to a generic 'Index'

242

abstraction.

243

"""

244

245

def finish(self):

246

lines = [_SIGNATURE]

247

lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')

248

lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')

249

key_count = len(self._nodes) - len(self._absent_keys)

250

lines.append(_OPTION_LEN + str(key_count) + '\n')

251

prefix_length = sum(len(x) for x in lines)

252

# references are byte offsets. To avoid having to do nasty

253

# polynomial work to resolve offsets (references to later in the

254

# file cannot be determined until all the inbetween references have

255

# been calculated too) we pad the offsets with 0's to make them be

256

# of consistent length. Using binary offsets would break the trivial

257

# file parsing.

258

# to calculate the width of zero's needed we do three passes:

259

# one to gather all the non-reference data and the number of references.

260

# one to pad all the data with reference-length and determine entry

261

# addresses.

262

# One to serialise.

263

264

# forward sorted by key. In future we may consider topological sorting,

265

# at the cost of table scans for direct lookup, or a second index for

266

# direct lookup

267

nodes = sorted(self._nodes.items())

268

# if we do not prepass, we don't know how long it will be up front.

269

expected_bytes = None

270

# we only need to pre-pass if we have reference lists at all.

271

if self.reference_lists:

272

key_offset_info = []

273

non_ref_bytes = prefix_length

274

total_references = 0

275

# TODO use simple multiplication for the constants in this loop.

276

for key, (absent, references, value) in nodes:

277

# record the offset known *so far* for this key:

278

# the non reference bytes to date, and the total references to

279

# date - saves reaccumulating on the second pass

280

key_offset_info.append((key, non_ref_bytes, total_references))

281

# key is literal, value is literal, there are 3 null's, 1 NL

282

# key is variable length tuple, \x00 between elements

283

non_ref_bytes += sum(len(element) for element in key)

284

if self._key_length > 1:

285

non_ref_bytes += self._key_length - 1

286

# value is literal bytes, there are 3 null's, 1 NL.

287

non_ref_bytes += len(value) + 3 + 1

288

# one byte for absent if set.

289

if absent:

290

non_ref_bytes += 1

291

elif self.reference_lists:

292

# (ref_lists -1) tabs

293

non_ref_bytes += self.reference_lists - 1

294

# (ref-1 cr's per ref_list)

295

for ref_list in references:

296

# how many references across the whole file?

297

total_references += len(ref_list)

298

# accrue reference separators

299

if ref_list:

300

non_ref_bytes += len(ref_list) - 1

301

# how many digits are needed to represent the total byte count?

302

digits = 1

303

possible_total_bytes = non_ref_bytes + total_references*digits

304

while 10 ** digits < possible_total_bytes:

305

digits += 1

306

possible_total_bytes = non_ref_bytes + total_references*digits

307

expected_bytes = possible_total_bytes + 1 # terminating newline

308

# resolve key addresses.

309

key_addresses = {}

310

for key, non_ref_bytes, total_references in key_offset_info:

311

key_addresses[key] = non_ref_bytes + total_references*digits

312

# serialise

313

format_string = '%%0%sd' % digits

314

for key, (absent, references, value) in nodes:

315

flattened_references = []

316

for ref_list in references:

317

ref_addresses = []

318

for reference in ref_list:

319

ref_addresses.append(format_string % key_addresses[reference])

320

flattened_references.append('\r'.join(ref_addresses))

321

string_key = '\x00'.join(key)

322

lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,

323

'\t'.join(flattened_references), value))

324

lines.append('\n')

325

result = StringIO(''.join(lines))

326

if expected_bytes and len(result.getvalue()) != expected_bytes:

327

raise errors.BzrError('Failed index creation. Internal error:'

328

' mismatched output length and expected length: %d %d' %

329

(len(result.getvalue()), expected_bytes))

330

return result

331

332

def set_optimize(self, for_size=None, combine_backing_indices=None):

333

"""Change how the builder tries to optimize the result.

334

335

:param for_size: Tell the builder to try and make the index as small as

336

possible.

337

:param combine_backing_indices: If the builder spills to disk to save

338

memory, should the on-disk indices be combined. Set to True if you

339

are going to be probing the index, but to False if you are not. (If

340

you are not querying, then the time spent combining is wasted.)

341

:return: None

342

"""

343

# GraphIndexBuilder itself doesn't pay attention to the flag yet, but

344

# other builders do.

345

if for_size is not None:

346

self._optimize_for_size = for_size

347

if combine_backing_indices is not None:

348

self._combine_backing_indices = combine_backing_indices

349

350

def find_ancestry(self, keys, ref_list_num):

351

"""See CombinedGraphIndex.find_ancestry()"""

352

pending = set(keys)

353

parent_map = {}

354

missing_keys = set()

355

while pending:

356

next_pending = set()

357

for _, key, value, ref_lists in self.iter_entries(pending):

358

parent_keys = ref_lists[ref_list_num]

359

parent_map[key] = parent_keys

360

next_pending.update([p for p in parent_keys if p not in

361

parent_map])

362

missing_keys.update(pending.difference(parent_map))

363

pending = next_pending

364

return parent_map, missing_keys

365

366

367

class GraphIndex(object):

368

"""An index for data with embedded graphs.

369

370

The index maps keys to a list of key reference lists, and a value.

371

Each node has the same number of key reference lists. Each key reference

372

list can be empty or an arbitrary length. The value is an opaque NULL

373

terminated string without any newlines. The storage of the index is

374

hidden in the interface: keys and key references are always tuples of

375

bytestrings, never the internal representation (e.g. dictionary offsets).

376

377

It is presumed that the index will not be mutated - it is static data.

378

379

Successive iter_all_entries calls will read the entire index each time.

380

Additionally, iter_entries calls will read the index linearly until the

381

desired keys are found. XXX: This must be fixed before the index is

382

suitable for production use. :XXX

383

"""

384

385

def __init__(self, transport, name, size, unlimited_cache=False, offset=0):

386

"""Open an index called name on transport.

387

388

:param transport: A bzrlib.transport.Transport.

389

:param name: A path to provide to transport API calls.

390

:param size: The size of the index in bytes. This is used for bisection

391

logic to perform partial index reads. While the size could be

392

obtained by statting the file this introduced an additional round

393

trip as well as requiring stat'able transports, both of which are

394

avoided by having it supplied. If size is None, then bisection

395

support will be disabled and accessing the index will just stream

396

all the data.

397

:param offset: Instead of starting the index data at offset 0, start it

398

at an arbitrary offset.

399

"""

400

self._transport = transport

401

self._name = name

402

# Becomes a dict of key:(value, reference-list-byte-locations) used by

403

# the bisection interface to store parsed but not resolved keys.

404

self._bisect_nodes = None

405

# Becomes a dict of key:(value, reference-list-keys) which are ready to

406

# be returned directly to callers.

407

self._nodes = None

408

# a sorted list of slice-addresses for the parsed bytes of the file.

409

# e.g. (0,1) would mean that byte 0 is parsed.

410

self._parsed_byte_map = []

411

# a sorted list of keys matching each slice address for parsed bytes

412

# e.g. (None, 'foo@bar') would mean that the first byte contained no

413

# key, and the end byte of the slice is the of the data for 'foo@bar'

414

self._parsed_key_map = []

415

self._key_count = None

416

self._keys_by_offset = None

417

self._nodes_by_key = None

418

self._size = size

419

# The number of bytes we've read so far in trying to process this file

420

self._bytes_read = 0

421

self._base_offset = offset

422

423

def __eq__(self, other):

424

"""Equal when self and other were created with the same parameters."""

425

return (

426

type(self) == type(other) and

427

self._transport == other._transport and

428

self._name == other._name and

429

self._size == other._size)

430

431

def __ne__(self, other):

432

return not self.__eq__(other)

433

434

def __repr__(self):

435

return "%s(%r)" % (self.__class__.__name__,

436

self._transport.abspath(self._name))

437

438

def _buffer_all(self, stream=None):

439

"""Buffer all the index data.

440

441

Mutates self._nodes and self.keys_by_offset.

442

"""

443

if self._nodes is not None:

444

# We already did this

445

return

446

if 'index' in debug.debug_flags:

447

mutter('Reading entire index %s', self._transport.abspath(self._name))

448

if stream is None:

449

stream = self._transport.get(self._name)

450

if self._base_offset != 0:

451

# This is wasteful, but it is better than dealing with

452

# adjusting all the offsets, etc.

453

stream = StringIO(stream.read()[self._base_offset:])

454

self._read_prefix(stream)

455

self._expected_elements = 3 + self._key_length

456

line_count = 0

457

# raw data keyed by offset

458

self._keys_by_offset = {}

459

# ready-to-return key:value or key:value, node_ref_lists

460

self._nodes = {}

461

self._nodes_by_key = None

462

trailers = 0

463

pos = stream.tell()

464

lines = stream.read().split('\n')

465

# GZ 2009-09-20: Should really use a try/finally block to ensure close

466

stream.close()

467

del lines[-1]

468

_, _, _, trailers = self._parse_lines(lines, pos)

469

for key, absent, references, value in self._keys_by_offset.itervalues():

470

if absent:

471

continue

472

# resolve references:

473

if self.node_ref_lists:

474

node_value = (value, self._resolve_references(references))

475

else:

476

node_value = value

477

self._nodes[key] = node_value

478

# cache the keys for quick set intersections

479

if trailers != 1:

480

# there must be one line - the empty trailer line.

481

raise errors.BadIndexData(self)

482

483

def clear_cache(self):

484

"""Clear out any cached/memoized values.

485

486

This can be called at any time, but generally it is used when we have

487

extracted some information, but don't expect to be requesting any more

488

from this index.

489

"""

490

491

def external_references(self, ref_list_num):

492

"""Return references that are not present in this index.

493

"""

494

self._buffer_all()

495

if ref_list_num + 1 > self.node_ref_lists:

496

raise ValueError('No ref list %d, index has %d ref lists'

497

% (ref_list_num, self.node_ref_lists))

498

refs = set()

499

nodes = self._nodes

500

for key, (value, ref_lists) in nodes.iteritems():

501

ref_list = ref_lists[ref_list_num]

502

refs.update([ref for ref in ref_list if ref not in nodes])

503

return refs

504

505

def _get_nodes_by_key(self):

506

if self._nodes_by_key is None:

507

nodes_by_key = {}

508

if self.node_ref_lists:

509

for key, (value, references) in self._nodes.iteritems():

510

key_dict = nodes_by_key

511

for subkey in key[:-1]:

512

key_dict = key_dict.setdefault(subkey, {})

513

key_dict[key[-1]] = key, value, references

514

else:

515

for key, value in self._nodes.iteritems():

516

key_dict = nodes_by_key

517

for subkey in key[:-1]:

518

key_dict = key_dict.setdefault(subkey, {})

519

key_dict[key[-1]] = key, value

520

self._nodes_by_key = nodes_by_key

521

return self._nodes_by_key

522

523

def iter_all_entries(self):

524

"""Iterate over all keys within the index.

525

526

:return: An iterable of (index, key, value) or (index, key, value, reference_lists).

527

The former tuple is used when there are no reference lists in the

528

index, making the API compatible with simple key:value index types.

529

There is no defined order for the result iteration - it will be in

530

the most efficient order for the index.

531

"""

532

if 'evil' in debug.debug_flags:

533

trace.mutter_callsite(3,

534

"iter_all_entries scales with size of history.")

535

if self._nodes is None:

536

self._buffer_all()

537

if self.node_ref_lists:

538

for key, (value, node_ref_lists) in self._nodes.iteritems():

539

yield self, key, value, node_ref_lists

540

else:

541

for key, value in self._nodes.iteritems():

542

yield self, key, value

543

544

def _read_prefix(self, stream):

545

signature = stream.read(len(self._signature()))

546

if not signature == self._signature():

547

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

548

options_line = stream.readline()

549

if not options_line.startswith(_OPTION_NODE_REFS):

550

raise errors.BadIndexOptions(self)

551

try:

552

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):-1])

553

except ValueError:

554

raise errors.BadIndexOptions(self)

555

options_line = stream.readline()

556

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

557

raise errors.BadIndexOptions(self)

558

try:

559

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):-1])

560

except ValueError:

561

raise errors.BadIndexOptions(self)

562

options_line = stream.readline()

563

if not options_line.startswith(_OPTION_LEN):

564

raise errors.BadIndexOptions(self)

565

try:

566

self._key_count = int(options_line[len(_OPTION_LEN):-1])

567

except ValueError:

568

raise errors.BadIndexOptions(self)

569

570

def _resolve_references(self, references):

571

"""Return the resolved key references for references.

572

573

References are resolved by looking up the location of the key in the

574

_keys_by_offset map and substituting the key name, preserving ordering.

575

576

:param references: An iterable of iterables of key locations. e.g.

577

[[123, 456], [123]]

578

:return: A tuple of tuples of keys.

579

"""

580

node_refs = []

581

for ref_list in references:

582

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

583

return tuple(node_refs)

584

585

def _find_index(self, range_map, key):

586

"""Helper for the _parsed_*_index calls.

587

588

Given a range map - [(start, end), ...], finds the index of the range

589

in the map for key if it is in the map, and if it is not there, the

590

immediately preceeding range in the map.

591

"""

592

result = bisect_right(range_map, key) - 1

593

if result + 1 < len(range_map):

594

# check the border condition, it may be in result + 1

595

if range_map[result + 1][0] == key[0]:

596

return result + 1

597

return result

598

599

def _parsed_byte_index(self, offset):

600

"""Return the index of the entry immediately before offset.

601

602

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

603

there is one unparsed byte (the 11th, addressed as[10]). then:

604

asking for 0 will return 0

605

asking for 10 will return 0

606

asking for 11 will return 1

607

asking for 12 will return 1

608

"""

609

key = (offset, 0)

610

return self._find_index(self._parsed_byte_map, key)

611

612

def _parsed_key_index(self, key):

613

"""Return the index of the entry immediately before key.

614

615

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

616

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

617

have been parsed, then:

618

asking for '' will return 0

619

asking for 'a' will return 0

620

asking for 'b' will return 1

621

asking for 'e' will return 1

622

"""

623

search_key = (key, None)

624

return self._find_index(self._parsed_key_map, search_key)

625

626

def _is_parsed(self, offset):

627

"""Returns True if offset has been parsed."""

628

index = self._parsed_byte_index(offset)

629

if index == len(self._parsed_byte_map):

630

return offset < self._parsed_byte_map[index - 1][1]

631

start, end = self._parsed_byte_map[index]

632

return offset >= start and offset < end

633

634

def _iter_entries_from_total_buffer(self, keys):

635

"""Iterate over keys when the entire index is parsed."""

636

# Note: See the note in BTreeBuilder.iter_entries for why we don't use

637

# .intersection() here

638

nodes = self._nodes

639

keys = [key for key in keys if key in nodes]

640

if self.node_ref_lists:

641

for key in keys:

642

value, node_refs = nodes[key]

643

yield self, key, value, node_refs

644

else:

645

for key in keys:

646

yield self, key, nodes[key]

647

648

def iter_entries(self, keys):

649

"""Iterate over keys within the index.

650

651

:param keys: An iterable providing the keys to be retrieved.

652

:return: An iterable as per iter_all_entries, but restricted to the

653

keys supplied. No additional keys will be returned, and every

654

key supplied that is in the index will be returned.

655

"""

656

keys = set(keys)

657

if not keys:

658

return []

659

if self._size is None and self._nodes is None:

660

self._buffer_all()

661

662

# We fit about 20 keys per minimum-read (4K), so if we are looking for

663

# more than 1/20th of the index its likely (assuming homogenous key

664

# spread) that we'll read the entire index. If we're going to do that,

665

# buffer the whole thing. A better analysis might take key spread into

666

# account - but B+Tree indices are better anyway.

667

# We could look at all data read, and use a threshold there, which will

668

# trigger on ancestry walks, but that is not yet fully mapped out.

669

if self._nodes is None and len(keys) * 20 > self.key_count():

670

self._buffer_all()

671

if self._nodes is not None:

672

return self._iter_entries_from_total_buffer(keys)

673

else:

674

return (result[1] for result in bisect_multi_bytes(

675

self._lookup_keys_via_location, self._size, keys))

676

677

def iter_entries_prefix(self, keys):

678

"""Iterate over keys within the index using prefix matching.

679

680

Prefix matching is applied within the tuple of a key, not to within

681

the bytestring of each key element. e.g. if you have the keys ('foo',

682

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

683

only the former key is returned.

684

685

WARNING: Note that this method currently causes a full index parse

686

unconditionally (which is reasonably appropriate as it is a means for

687

thunking many small indices into one larger one and still supplies

688

iter_all_entries at the thunk layer).

689

690

:param keys: An iterable providing the key prefixes to be retrieved.

691

Each key prefix takes the form of a tuple the length of a key, but

692

with the last N elements 'None' rather than a regular bytestring.

693

The first element cannot be 'None'.

694

:return: An iterable as per iter_all_entries, but restricted to the

695

keys with a matching prefix to those supplied. No additional keys

696

will be returned, and every match that is in the index will be

697

returned.

698

"""

699

keys = set(keys)

700

if not keys:

701

return

702

# load data - also finds key lengths

703

if self._nodes is None:

704

self._buffer_all()

705

if self._key_length == 1:

706

for key in keys:

707

# sanity check

708

if key[0] is None:

709

raise errors.BadIndexKey(key)

710

if len(key) != self._key_length:

711

raise errors.BadIndexKey(key)

712

if self.node_ref_lists:

713

value, node_refs = self._nodes[key]

714

yield self, key, value, node_refs

715

else:

716

yield self, key, self._nodes[key]

717

return

718

nodes_by_key = self._get_nodes_by_key()

719

for key in keys:

720

# sanity check

721

if key[0] is None:

722

raise errors.BadIndexKey(key)

723

if len(key) != self._key_length:

724

raise errors.BadIndexKey(key)

725

# find what it refers to:

726

key_dict = nodes_by_key

727

elements = list(key)

728

# find the subdict whose contents should be returned.

729

try:

730

while len(elements) and elements[0] is not None:

731

key_dict = key_dict[elements[0]]

732

elements.pop(0)

733

except KeyError:

734

# a non-existant lookup.

735

continue

736

if len(elements):

737

dicts = [key_dict]

738

while dicts:

739

key_dict = dicts.pop(-1)

740

# can't be empty or would not exist

741

item, value = key_dict.iteritems().next()

742

if type(value) == dict:

743

# push keys

744

dicts.extend(key_dict.itervalues())

745

else:

746

# yield keys

747

for value in key_dict.itervalues():

748

# each value is the key:value:node refs tuple

749

# ready to yield.

750

yield (self, ) + value

751

else:

752

# the last thing looked up was a terminal element

753

yield (self, ) + key_dict

754

755

def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):

756

"""See BTreeIndex._find_ancestors."""

757

# The api can be implemented as a trivial overlay on top of

758

# iter_entries, it is not an efficient implementation, but it at least

759

# gets the job done.

760

found_keys = set()

761

search_keys = set()

762

for index, key, value, refs in self.iter_entries(keys):

763

parent_keys = refs[ref_list_num]

764

found_keys.add(key)

765

parent_map[key] = parent_keys

766

search_keys.update(parent_keys)

767

# Figure out what, if anything, was missing

768

missing_keys.update(set(keys).difference(found_keys))

769

search_keys = search_keys.difference(parent_map)

770

return search_keys

771

772

def key_count(self):

773

"""Return an estimate of the number of keys in this index.

774

775

For GraphIndex the estimate is exact.

776

"""

777

if self._key_count is None:

778

self._read_and_parse([_HEADER_READV])

779

return self._key_count

780

781

def _lookup_keys_via_location(self, location_keys):

782

"""Public interface for implementing bisection.

783

784

If _buffer_all has been called, then all the data for the index is in

785

memory, and this method should not be called, as it uses a separate

786

cache because it cannot pre-resolve all indices, which buffer_all does

787

for performance.

788

789

:param location_keys: A list of location(byte offset), key tuples.

790

:return: A list of (location_key, result) tuples as expected by

791

bzrlib.bisect_multi.bisect_multi_bytes.

792

"""

793

# Possible improvements:

794

# - only bisect lookup each key once

795

# - sort the keys first, and use that to reduce the bisection window

796

# -----

797

# this progresses in three parts:

798

# read data

799

# parse it

800

# attempt to answer the question from the now in memory data.

801

# build the readv request

802

# for each location, ask for 800 bytes - much more than rows we've seen

803

# anywhere.

804

readv_ranges = []

805

for location, key in location_keys:

806

# can we answer from cache?

807

if self._bisect_nodes and key in self._bisect_nodes:

808

# We have the key parsed.

809

continue

810

index = self._parsed_key_index(key)

811

if (len(self._parsed_key_map) and

812

self._parsed_key_map[index][0] <= key and

813

(self._parsed_key_map[index][1] >= key or

814

# end of the file has been parsed

815

self._parsed_byte_map[index][1] == self._size)):

816

# the key has been parsed, so no lookup is needed even if its

817

# not present.

818

continue

819

# - if we have examined this part of the file already - yes

820

index = self._parsed_byte_index(location)

821

if (len(self._parsed_byte_map) and

822

self._parsed_byte_map[index][0] <= location and

823

self._parsed_byte_map[index][1] > location):

824

# the byte region has been parsed, so no read is needed.

825

continue

826

length = 800

827

if location + length > self._size:

828

length = self._size - location

829

# todo, trim out parsed locations.

830

if length > 0:

831

readv_ranges.append((location, length))

832

# read the header if needed

833

if self._bisect_nodes is None:

834

readv_ranges.append(_HEADER_READV)

835

self._read_and_parse(readv_ranges)

836

result = []

837

if self._nodes is not None:

838

# _read_and_parse triggered a _buffer_all because we requested the

839

# whole data range

840

for location, key in location_keys:

841

if key not in self._nodes: # not present

842

result.append(((location, key), False))

843

elif self.node_ref_lists:

844

value, refs = self._nodes[key]

845

result.append(((location, key),

846

(self, key, value, refs)))

847

else:

848

result.append(((location, key),

849

(self, key, self._nodes[key])))

850

return result

851

# generate results:

852

# - figure out <, >, missing, present

853

# - result present references so we can return them.

854

# keys that we cannot answer until we resolve references

855

pending_references = []

856

pending_locations = set()

857

for location, key in location_keys:

858

# can we answer from cache?

859

if key in self._bisect_nodes:

860

# the key has been parsed, so no lookup is needed

861

if self.node_ref_lists:

862

# the references may not have been all parsed.

863

value, refs = self._bisect_nodes[key]

864

wanted_locations = []

865

for ref_list in refs:

866

for ref in ref_list:

867

if ref not in self._keys_by_offset:

868

wanted_locations.append(ref)

869

if wanted_locations:

870

pending_locations.update(wanted_locations)

871

pending_references.append((location, key))

872

continue

873

result.append(((location, key), (self, key,

874

value, self._resolve_references(refs))))

875

else:

876

result.append(((location, key),

877

(self, key, self._bisect_nodes[key])))

878

continue

879

else:

880

# has the region the key should be in, been parsed?

881

index = self._parsed_key_index(key)

882

if (self._parsed_key_map[index][0] <= key and

883

(self._parsed_key_map[index][1] >= key or

884

# end of the file has been parsed

885

self._parsed_byte_map[index][1] == self._size)):

886

result.append(((location, key), False))

887

continue

888

# no, is the key above or below the probed location:

889

# get the range of the probed & parsed location

890

index = self._parsed_byte_index(location)

891

# if the key is below the start of the range, its below

892

if key < self._parsed_key_map[index][0]:

893

direction = -1

894

else:

895

direction = +1

896

result.append(((location, key), direction))

897

readv_ranges = []

898

# lookup data to resolve references

899

for location in pending_locations:

900

length = 800

901

if location + length > self._size:

902

length = self._size - location

903

# TODO: trim out parsed locations (e.g. if the 800 is into the

904

# parsed region trim it, and dont use the adjust_for_latency

905

# facility)

906

if length > 0:

907

readv_ranges.append((location, length))

908

self._read_and_parse(readv_ranges)

909

if self._nodes is not None:

910

# The _read_and_parse triggered a _buffer_all, grab the data and

911

# return it

912

for location, key in pending_references:

913

value, refs = self._nodes[key]

914

result.append(((location, key), (self, key, value, refs)))

915

return result

916

for location, key in pending_references:

917

# answer key references we had to look-up-late.

918

value, refs = self._bisect_nodes[key]

919

result.append(((location, key), (self, key,

920

value, self._resolve_references(refs))))

921

return result

922

923

def _parse_header_from_bytes(self, bytes):

924

"""Parse the header from a region of bytes.

925

926

:param bytes: The data to parse.

927

:return: An offset, data tuple such as readv yields, for the unparsed

928

data. (which may length 0).

929

"""

930

signature = bytes[0:len(self._signature())]

931

if not signature == self._signature():

932

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

933

lines = bytes[len(self._signature()):].splitlines()

934

options_line = lines[0]

935

if not options_line.startswith(_OPTION_NODE_REFS):

936

raise errors.BadIndexOptions(self)

937

try:

938

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):])

939

except ValueError:

940

raise errors.BadIndexOptions(self)

941

options_line = lines[1]

942

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

943

raise errors.BadIndexOptions(self)

944

try:

945

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):])

946

except ValueError:

947

raise errors.BadIndexOptions(self)

948

options_line = lines[2]

949

if not options_line.startswith(_OPTION_LEN):

950

raise errors.BadIndexOptions(self)

951

try:

952

self._key_count = int(options_line[len(_OPTION_LEN):])

953

except ValueError:

954

raise errors.BadIndexOptions(self)

955

# calculate the bytes we have processed

956

header_end = (len(signature) + len(lines[0]) + len(lines[1]) +

957

len(lines[2]) + 3)

958

self._parsed_bytes(0, None, header_end, None)

959

# setup parsing state

960

self._expected_elements = 3 + self._key_length

961

# raw data keyed by offset

962

self._keys_by_offset = {}

963

# keys with the value and node references

964

self._bisect_nodes = {}

965

return header_end, bytes[header_end:]

966

967

def _parse_region(self, offset, data):

968

"""Parse node data returned from a readv operation.

969

970

:param offset: The byte offset the data starts at.

971

:param data: The data to parse.

972

"""

973

# trim the data.

974

# end first:

975

end = offset + len(data)

976

high_parsed = offset

977

while True:

978

# Trivial test - if the current index's end is within the

979

# low-matching parsed range, we're done.

980

index = self._parsed_byte_index(high_parsed)

981

if end < self._parsed_byte_map[index][1]:

982

return

983

# print "[%d:%d]" % (offset, end), \

984

# self._parsed_byte_map[index:index + 2]

985

high_parsed, last_segment = self._parse_segment(

986

offset, data, end, index)

987

if last_segment:

988

return

989

990

def _parse_segment(self, offset, data, end, index):

991

"""Parse one segment of data.

992

993

:param offset: Where 'data' begins in the file.

994

:param data: Some data to parse a segment of.

995

:param end: Where data ends

996

:param index: The current index into the parsed bytes map.

997

:return: True if the parsed segment is the last possible one in the

998

range of data.

999

:return: high_parsed_byte, last_segment.

1000

high_parsed_byte is the location of the highest parsed byte in this

1001

segment, last_segment is True if the parsed segment is the last

1002

possible one in the data block.

1003

"""

1004

# default is to use all data

1005

trim_end = None

1006

# accomodate overlap with data before this.

1007

if offset < self._parsed_byte_map[index][1]:

1008

# overlaps the lower parsed region

1009

# skip the parsed data

1010

trim_start = self._parsed_byte_map[index][1] - offset

1011

# don't trim the start for \n

1012

start_adjacent = True

1013

elif offset == self._parsed_byte_map[index][1]:

1014

# abuts the lower parsed region

1015

# use all data

1016

trim_start = None

1017

# do not trim anything

1018

start_adjacent = True

1019

else:

1020

# does not overlap the lower parsed region

1021

# use all data

1022

trim_start = None

1023

# but trim the leading \n

1024

start_adjacent = False

1025

if end == self._size:

1026

# lines up to the end of all data:

1027

# use it all

1028

trim_end = None

1029

# do not strip to the last \n

1030

end_adjacent = True

1031

last_segment = True

1032

elif index + 1 == len(self._parsed_byte_map):

1033

# at the end of the parsed data

1034

# use it all

1035

trim_end = None

1036

# but strip to the last \n

1037

end_adjacent = False

1038

last_segment = True

1039

elif end == self._parsed_byte_map[index + 1][0]:

1040

# buts up against the next parsed region

1041

# use it all

1042

trim_end = None

1043

# do not strip to the last \n

1044

end_adjacent = True

1045

last_segment = True

1046

elif end > self._parsed_byte_map[index + 1][0]:

1047

# overlaps into the next parsed region

1048

# only consider the unparsed data

1049

trim_end = self._parsed_byte_map[index + 1][0] - offset

1050

# do not strip to the last \n as we know its an entire record

1051

end_adjacent = True

1052

last_segment = end < self._parsed_byte_map[index + 1][1]

1053

else:

1054

# does not overlap into the next region

1055

# use it all

1056

trim_end = None

1057

# but strip to the last \n

1058

end_adjacent = False

1059

last_segment = True

1060

# now find bytes to discard if needed

1061

if not start_adjacent:

1062

# work around python bug in rfind

1063

if trim_start is None:

1064

trim_start = data.find('\n') + 1

1065

else:

1066

trim_start = data.find('\n', trim_start) + 1

1067

if not (trim_start != 0):

1068

raise AssertionError('no \n was present')

1069

# print 'removing start', offset, trim_start, repr(data[:trim_start])

1070

if not end_adjacent:

1071

# work around python bug in rfind

1072

if trim_end is None:

1073

trim_end = data.rfind('\n') + 1

1074

else:

1075

trim_end = data.rfind('\n', None, trim_end) + 1

1076

if not (trim_end != 0):

1077

raise AssertionError('no \n was present')

1078

# print 'removing end', offset, trim_end, repr(data[trim_end:])

1079

# adjust offset and data to the parseable data.

1080

trimmed_data = data[trim_start:trim_end]

1081

if not (trimmed_data):

1082

raise AssertionError('read unneeded data [%d:%d] from [%d:%d]'

1083

% (trim_start, trim_end, offset, offset + len(data)))

1084

if trim_start:

1085

offset += trim_start

1086

# print "parsing", repr(trimmed_data)

1087

# splitlines mangles the \r delimiters.. don't use it.

1088

lines = trimmed_data.split('\n')

1089

del lines[-1]

1090

pos = offset

1091

first_key, last_key, nodes, _ = self._parse_lines(lines, pos)

1092

for key, value in nodes:

1093

self._bisect_nodes[key] = value

1094

self._parsed_bytes(offset, first_key,

1095

offset + len(trimmed_data), last_key)

1096

return offset + len(trimmed_data), last_segment

1097

1098

def _parse_lines(self, lines, pos):

1099

key = None

1100

first_key = None

1101

trailers = 0

1102

nodes = []

1103

for line in lines:

1104

if line == '':

1105

# must be at the end

1106

if self._size:

1107

if not (self._size == pos + 1):

1108

raise AssertionError("%s %s" % (self._size, pos))

1109

trailers += 1

1110

continue

1111

elements = line.split('\0')

1112

if len(elements) != self._expected_elements:

1113

raise errors.BadIndexData(self)

1114

# keys are tuples. Each element is a string that may occur many

1115

# times, so we intern them to save space. AB, RC, 200807

1116

key = tuple([intern(element) for element in elements[:self._key_length]])

1117

if first_key is None:

1118

first_key = key

1119

absent, references, value = elements[-3:]

1120

ref_lists = []

1121

for ref_string in references.split('\t'):

1122

ref_lists.append(tuple([

1123

int(ref) for ref in ref_string.split('\r') if ref

1124

]))

1125

ref_lists = tuple(ref_lists)

1126

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

1127

pos += len(line) + 1 # +1 for the \n

1128

if absent:

1129

continue

1130

if self.node_ref_lists:

1131

node_value = (value, ref_lists)

1132

else:

1133

node_value = value

1134

nodes.append((key, node_value))

1135

# print "parsed ", key

1136

return first_key, key, nodes, trailers

1137

1138

def _parsed_bytes(self, start, start_key, end, end_key):

1139

"""Mark the bytes from start to end as parsed.

1140

1141

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

1142

1) as parsed.

1143

1144

:param start: The start of the parsed region.

1145

:param end: The end of the parsed region.

1146

"""

1147

index = self._parsed_byte_index(start)

1148

new_value = (start, end)

1149

new_key = (start_key, end_key)

1150

if index == -1:

1151

# first range parsed is always the beginning.

1152

self._parsed_byte_map.insert(index, new_value)

1153

self._parsed_key_map.insert(index, new_key)

1154

return

1155

# four cases:

1156

# new region

1157

# extend lower region

1158

# extend higher region

1159

# combine two regions

1160

if (index + 1 < len(self._parsed_byte_map) and

1161

self._parsed_byte_map[index][1] == start and

1162

self._parsed_byte_map[index + 1][0] == end):

1163

# combine two regions

1164

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

1165

self._parsed_byte_map[index + 1][1])

1166

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

1167

self._parsed_key_map[index + 1][1])

1168

del self._parsed_byte_map[index + 1]

1169

del self._parsed_key_map[index + 1]

1170

elif self._parsed_byte_map[index][1] == start:

1171

# extend the lower entry

1172

self._parsed_byte_map[index] = (

1173

self._parsed_byte_map[index][0], end)

1174

self._parsed_key_map[index] = (

1175

self._parsed_key_map[index][0], end_key)

1176

elif (index + 1 < len(self._parsed_byte_map) and

1177

self._parsed_byte_map[index + 1][0] == end):

1178

# extend the higher entry

1179

self._parsed_byte_map[index + 1] = (

1180

start, self._parsed_byte_map[index + 1][1])

1181

self._parsed_key_map[index + 1] = (

1182

start_key, self._parsed_key_map[index + 1][1])

1183

else:

1184

# new entry

1185

self._parsed_byte_map.insert(index + 1, new_value)

1186

self._parsed_key_map.insert(index + 1, new_key)

1187

1188

def _read_and_parse(self, readv_ranges):

1189

"""Read the ranges and parse the resulting data.

1190

1191

:param readv_ranges: A prepared readv range list.

1192

"""

1193

if not readv_ranges:

1194

return

1195

if self._nodes is None and self._bytes_read * 2 >= self._size:

1196

# We've already read more than 50% of the file and we are about to

1197

# request more data, just _buffer_all() and be done

1198

self._buffer_all()

1199

return

1200

1201

base_offset = self._base_offset

1202

if base_offset != 0:

1203

# Rewrite the ranges for the offset

1204

readv_ranges = [(start+base_offset, size)

1205

for start, size in readv_ranges]

1206

readv_data = self._transport.readv(self._name, readv_ranges, True,

1207

self._size + self._base_offset)

1208

# parse

1209

for offset, data in readv_data:

1210

offset -= base_offset

1211

self._bytes_read += len(data)

1212

if offset < 0:

1213

# transport.readv() expanded to extra data which isn't part of

1214

# this index

1215

data = data[-offset:]

1216

offset = 0

1217

if offset == 0 and len(data) == self._size:

1218

# We read the whole range, most likely because the

1219

# Transport upcast our readv ranges into one long request

1220

# for enough total data to grab the whole index.

1221

self._buffer_all(StringIO(data))

1222

return

1223

if self._bisect_nodes is None:

1224

# this must be the start

1225

if not (offset == 0):

1226

raise AssertionError()

1227

offset, data = self._parse_header_from_bytes(data)

1228

# print readv_ranges, "[%d:%d]" % (offset, offset + len(data))

1229

self._parse_region(offset, data)

1230

1231

def _signature(self):

1232

"""The file signature for this index type."""

1233

return _SIGNATURE

1234

1235

def validate(self):

1236

"""Validate that everything in the index can be accessed."""

1237

# iter_all validates completely at the moment, so just do that.

1238

for node in self.iter_all_entries():

1239

pass

1240

1241

1242

class CombinedGraphIndex(object):

1243

"""A GraphIndex made up from smaller GraphIndices.

1244

1245

The backing indices must implement GraphIndex, and are presumed to be

1246

static data.

1247

1248

Queries against the combined index will be made against the first index,

1249

and then the second and so on. The order of indices can thus influence

1250

performance significantly. For example, if one index is on local disk and a

1251

second on a remote server, the local disk index should be before the other

1252

in the index list.

1253

1254

Also, queries tend to need results from the same indices as previous

1255

queries. So the indices will be reordered after every query to put the

1256

indices that had the result(s) of that query first (while otherwise

1257

preserving the relative ordering).

1258

"""

1259

1260

def __init__(self, indices, reload_func=None):

1261

"""Create a CombinedGraphIndex backed by indices.

1262

1263

:param indices: An ordered list of indices to query for data.

1264

:param reload_func: A function to call if we find we are missing an

1265

index. Should have the form reload_func() => True/False to indicate

1266

if reloading actually changed anything.

1267

"""

1268

self._indices = indices

1269

self._reload_func = reload_func

1270

# Sibling indices are other CombinedGraphIndex that we should call

1271

# _move_to_front_by_name on when we auto-reorder ourself.

1272

self._sibling_indices = []

1273

# A list of names that corresponds to the instances in self._indices,

1274

# so _index_names[0] is always the name for _indices[0], etc. Sibling

1275

# indices must all use the same set of names as each other.

1276

self._index_names = [None] * len(self._indices)

1277

1278

def __repr__(self):

1279

return "%s(%s)" % (

1280

self.__class__.__name__,

1281

', '.join(map(repr, self._indices)))

1282

1283

def clear_cache(self):

1284

"""See GraphIndex.clear_cache()"""

1285

for index in self._indices:

1286

index.clear_cache()

1287

1288

def get_parent_map(self, keys):

1289

"""See graph.StackedParentsProvider.get_parent_map"""

1290

search_keys = set(keys)

1291

if NULL_REVISION in search_keys:

1292

search_keys.discard(NULL_REVISION)

1293

found_parents = {NULL_REVISION:[]}

1294

else:

1295

found_parents = {}

1296

for index, key, value, refs in self.iter_entries(search_keys):

1297

parents = refs[0]

1298

if not parents:

1299

parents = (NULL_REVISION,)

1300

found_parents[key] = parents

1301

return found_parents

1302

1303

has_key = _has_key_from_parent_map

1304

1305

def insert_index(self, pos, index, name=None):

1306

"""Insert a new index in the list of indices to query.

1307

1308

:param pos: The position to insert the index.

1309

:param index: The index to insert.

1310

:param name: a name for this index, e.g. a pack name. These names can

1311

be used to reflect index reorderings to related CombinedGraphIndex

1312

instances that use the same names. (see set_sibling_indices)

1313

"""

1314

self._indices.insert(pos, index)

1315

self._index_names.insert(pos, name)

1316

1317

def iter_all_entries(self):

1318

"""Iterate over all keys within the index

1319

1320

Duplicate keys across child indices are presumed to have the same

1321

value and are only reported once.

1322

1323

:return: An iterable of (index, key, reference_lists, value).

1324

There is no defined order for the result iteration - it will be in

1325

the most efficient order for the index.

1326

"""

1327

seen_keys = set()

1328

while True:

1329

try:

1330

for index in self._indices:

1331

for node in index.iter_all_entries():

1332

if node[1] not in seen_keys:

1333

yield node

1334

seen_keys.add(node[1])

1335

return

1336

except errors.NoSuchFile:

1337

self._reload_or_raise()

1338

1339

def iter_entries(self, keys):

1340

"""Iterate over keys within the index.

1341

1342

Duplicate keys across child indices are presumed to have the same

1343

value and are only reported once.

1344

1345

:param keys: An iterable providing the keys to be retrieved.

1346

:return: An iterable of (index, key, reference_lists, value). There is

1347

no defined order for the result iteration - it will be in the most

1348

efficient order for the index.

1349

"""

1350

keys = set(keys)

1351

hit_indices = []

1352

while True:

1353

try:

1354

for index in self._indices:

1355

if not keys:

1356

break

1357

index_hit = False

1358

for node in index.iter_entries(keys):

1359

keys.remove(node[1])

1360

yield node

1361

index_hit = True

1362

if index_hit:

1363

hit_indices.append(index)

1364

break

1365

except errors.NoSuchFile:

1366

self._reload_or_raise()

1367

self._move_to_front(hit_indices)

1368

1369

def iter_entries_prefix(self, keys):

1370

"""Iterate over keys within the index using prefix matching.

1371

1372

Duplicate keys across child indices are presumed to have the same

1373

value and are only reported once.

1374

1375

Prefix matching is applied within the tuple of a key, not to within

1376

the bytestring of each key element. e.g. if you have the keys ('foo',

1377

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1378

only the former key is returned.

1379

1380

:param keys: An iterable providing the key prefixes to be retrieved.

1381

Each key prefix takes the form of a tuple the length of a key, but

1382

with the last N elements 'None' rather than a regular bytestring.

1383

The first element cannot be 'None'.

1384

:return: An iterable as per iter_all_entries, but restricted to the

1385

keys with a matching prefix to those supplied. No additional keys

1386

will be returned, and every match that is in the index will be

1387

returned.

1388

"""

1389

keys = set(keys)

1390

if not keys:

1391

return

1392

seen_keys = set()

1393

hit_indices = []

1394

while True:

1395

try:

1396

for index in self._indices:

1397

index_hit = False

1398

for node in index.iter_entries_prefix(keys):

1399

if node[1] in seen_keys:

1400

continue

1401

seen_keys.add(node[1])

1402

yield node

1403

index_hit = True

1404

if index_hit:

1405

hit_indices.append(index)

1406

break

1407

except errors.NoSuchFile:

1408

self._reload_or_raise()

1409

self._move_to_front(hit_indices)

1410

1411

def _move_to_front(self, hit_indices):

1412

"""Rearrange self._indices so that hit_indices are first.

1413

1414

Order is maintained as much as possible, e.g. the first unhit index

1415

will be the first index in _indices after the hit_indices, and the

1416

hit_indices will be present in exactly the order they are passed to

1417

_move_to_front.

1418

1419

_move_to_front propagates to all objects in self._sibling_indices by

1420

calling _move_to_front_by_name.

1421

"""

1422

if self._indices[:len(hit_indices)] == hit_indices:

1423

# The 'hit_indices' are already at the front (and in the same

1424

# order), no need to re-order

1425

return

1426

hit_names = self._move_to_front_by_index(hit_indices)

1427

for sibling_idx in self._sibling_indices:

1428

sibling_idx._move_to_front_by_name(hit_names)

1429

1430

def _move_to_front_by_index(self, hit_indices):

1431

"""Core logic for _move_to_front.

1432

1433

Returns a list of names corresponding to the hit_indices param.

1434

"""

1435

indices_info = zip(self._index_names, self._indices)

1436

if 'index' in debug.debug_flags:

1437

mutter('CombinedGraphIndex reordering: currently %r, promoting %r',

1438

indices_info, hit_indices)

1439

hit_names = []

1440

unhit_names = []

1441

new_hit_indices = []

1442

unhit_indices = []

1443

1444

for offset, (name, idx) in enumerate(indices_info):

1445

if idx in hit_indices:

1446

hit_names.append(name)

1447

new_hit_indices.append(idx)

1448

if len(new_hit_indices) == len(hit_indices):

1449

# We've found all of the hit entries, everything else is

1450

# unhit

1451

unhit_names.extend(self._index_names[offset+1:])

1452

unhit_indices.extend(self._indices[offset+1:])

1453

break

1454

else:

1455

unhit_names.append(name)

1456

unhit_indices.append(idx)

1457

1458

self._indices = new_hit_indices + unhit_indices

1459

self._index_names = hit_names + unhit_names

1460

if 'index' in debug.debug_flags:

1461

mutter('CombinedGraphIndex reordered: %r', self._indices)

1462

return hit_names

1463

1464

def _move_to_front_by_name(self, hit_names):

1465

"""Moves indices named by 'hit_names' to front of the search order, as

1466

described in _move_to_front.

1467

"""

1468

# Translate names to index instances, and then call

1469

# _move_to_front_by_index.

1470

indices_info = zip(self._index_names, self._indices)

1471

hit_indices = []

1472

for name, idx in indices_info:

1473

if name in hit_names:

1474

hit_indices.append(idx)

1475

self._move_to_front_by_index(hit_indices)

1476

1477

def find_ancestry(self, keys, ref_list_num):

1478

"""Find the complete ancestry for the given set of keys.

1479

1480

Note that this is a whole-ancestry request, so it should be used

1481

sparingly.

1482

1483

:param keys: An iterable of keys to look for

1484

:param ref_list_num: The reference list which references the parents

1485

we care about.

1486

:return: (parent_map, missing_keys)

1487

"""

1488

# XXX: make this call _move_to_front?

1489

missing_keys = set()

1490

parent_map = {}

1491

keys_to_lookup = set(keys)

1492

generation = 0

1493

while keys_to_lookup:

1494

# keys that *all* indexes claim are missing, stop searching them

1495

generation += 1

1496

all_index_missing = None

1497

# print 'gen\tidx\tsub\tn_keys\tn_pmap\tn_miss'

1498

# print '%4d\t\t\t%4d\t%5d\t%5d' % (generation, len(keys_to_lookup),

1499

# len(parent_map),

1500

# len(missing_keys))

1501

for index_idx, index in enumerate(self._indices):

1502

# TODO: we should probably be doing something with

1503

# 'missing_keys' since we've already determined that

1504

# those revisions have not been found anywhere

1505

index_missing_keys = set()

1506

# Find all of the ancestry we can from this index

1507

# keep looking until the search_keys set is empty, which means

1508

# things we didn't find should be in index_missing_keys

1509

search_keys = keys_to_lookup

1510

sub_generation = 0

1511

# print ' \t%2d\t\t%4d\t%5d\t%5d' % (

1512

# index_idx, len(search_keys),

1513

# len(parent_map), len(index_missing_keys))

1514

while search_keys:

1515

sub_generation += 1

1516

# TODO: ref_list_num should really be a parameter, since

1517

# CombinedGraphIndex does not know what the ref lists

1518

# mean.

1519

search_keys = index._find_ancestors(search_keys,

1520

ref_list_num, parent_map, index_missing_keys)

1521

# print ' \t \t%2d\t%4d\t%5d\t%5d' % (

1522

# sub_generation, len(search_keys),

1523

# len(parent_map), len(index_missing_keys))

1524

# Now set whatever was missing to be searched in the next index

1525

keys_to_lookup = index_missing_keys

1526

if all_index_missing is None:

1527

all_index_missing = set(index_missing_keys)

1528

else:

1529

all_index_missing.intersection_update(index_missing_keys)

1530

if not keys_to_lookup:

1531

break

1532

if all_index_missing is None:

1533

# There were no indexes, so all search keys are 'missing'

1534

missing_keys.update(keys_to_lookup)

1535

keys_to_lookup = None

1536

else:

1537

missing_keys.update(all_index_missing)

1538

keys_to_lookup.difference_update(all_index_missing)

1539

return parent_map, missing_keys

1540

1541

def key_count(self):

1542

"""Return an estimate of the number of keys in this index.

1543

1544

For CombinedGraphIndex this is approximated by the sum of the keys of

1545

the child indices. As child indices may have duplicate keys this can

1546

have a maximum error of the number of child indices * largest number of

1547

keys in any index.

1548

"""

1549

while True:

1550

try:

1551

return sum((index.key_count() for index in self._indices), 0)

1552

except errors.NoSuchFile:

1553

self._reload_or_raise()

1554

1555

missing_keys = _missing_keys_from_parent_map

1556

1557

def _reload_or_raise(self):

1558

"""We just got a NoSuchFile exception.

1559

1560

Try to reload the indices, if it fails, just raise the current

1561

exception.

1562

"""

1563

if self._reload_func is None:

1564

raise

1565

exc_type, exc_value, exc_traceback = sys.exc_info()

1566

trace.mutter('Trying to reload after getting exception: %s',

1567

exc_value)

1568

if not self._reload_func():

1569

# We tried to reload, but nothing changed, so we fail anyway

1570

trace.mutter('_reload_func indicated nothing has changed.'

1571

' Raising original exception.')

1572

raise exc_type, exc_value, exc_traceback

1573

1574

def set_sibling_indices(self, sibling_combined_graph_indices):

1575

"""Set the CombinedGraphIndex objects to reorder after reordering self.

1576

"""

1577

self._sibling_indices = sibling_combined_graph_indices

1578

1579

def validate(self):

1580

"""Validate that everything in the index can be accessed."""

1581

while True:

1582

try:

1583

for index in self._indices:

1584

index.validate()

1585

return

1586

except errors.NoSuchFile:

1587

self._reload_or_raise()

1588

1589

1590

class InMemoryGraphIndex(GraphIndexBuilder):

1591

"""A GraphIndex which operates entirely out of memory and is mutable.

1592

1593

This is designed to allow the accumulation of GraphIndex entries during a

1594

single write operation, where the accumulated entries need to be immediately

1595

available - for example via a CombinedGraphIndex.

1596

"""

1597

1598

def add_nodes(self, nodes):

1599

"""Add nodes to the index.

1600

1601

:param nodes: An iterable of (key, node_refs, value) entries to add.

1602

"""

1603

if self.reference_lists:

1604

for (key, value, node_refs) in nodes:

1605

self.add_node(key, value, node_refs)

1606

else:

1607

for (key, value) in nodes:

1608

self.add_node(key, value)

1609

1610

def iter_all_entries(self):

1611

"""Iterate over all keys within the index

1612

1613

:return: An iterable of (index, key, reference_lists, value). There is no

1614

defined order for the result iteration - it will be in the most

1615

efficient order for the index (in this case dictionary hash order).

1616

"""

1617

if 'evil' in debug.debug_flags:

1618

trace.mutter_callsite(3,

1619

"iter_all_entries scales with size of history.")

1620

if self.reference_lists:

1621

for key, (absent, references, value) in self._nodes.iteritems():

1622

if not absent:

1623

yield self, key, value, references

1624

else:

1625

for key, (absent, references, value) in self._nodes.iteritems():

1626

if not absent:

1627

yield self, key, value

1628

1629

def iter_entries(self, keys):

1630

"""Iterate over keys within the index.

1631

1632

:param keys: An iterable providing the keys to be retrieved.

1633

:return: An iterable of (index, key, value, reference_lists). There is no

1634

defined order for the result iteration - it will be in the most

1635

efficient order for the index (keys iteration order in this case).

1636

"""

1637

# Note: See BTreeBuilder.iter_entries for an explanation of why we

1638

# aren't using set().intersection() here

1639

nodes = self._nodes

1640

keys = [key for key in keys if key in nodes]

1641

if self.reference_lists:

1642

for key in keys:

1643

node = nodes[key]

1644

if not node[0]:

1645

yield self, key, node[2], node[1]

1646

else:

1647

for key in keys:

1648

node = nodes[key]

1649

if not node[0]:

1650

yield self, key, node[2]

1651

1652

def iter_entries_prefix(self, keys):

1653

"""Iterate over keys within the index using prefix matching.

1654

1655

Prefix matching is applied within the tuple of a key, not to within

1656

the bytestring of each key element. e.g. if you have the keys ('foo',

1657

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1658

only the former key is returned.

1659

1660

:param keys: An iterable providing the key prefixes to be retrieved.

1661

Each key prefix takes the form of a tuple the length of a key, but

1662

with the last N elements 'None' rather than a regular bytestring.

1663

The first element cannot be 'None'.

1664

:return: An iterable as per iter_all_entries, but restricted to the

1665

keys with a matching prefix to those supplied. No additional keys

1666

will be returned, and every match that is in the index will be

1667

returned.

1668

"""

1669

# XXX: To much duplication with the GraphIndex class; consider finding

1670

# a good place to pull out the actual common logic.

1671

keys = set(keys)

1672

if not keys:

1673

return

1674

if self._key_length == 1:

1675

for key in keys:

1676

# sanity check

1677

if key[0] is None:

1678

raise errors.BadIndexKey(key)

1679

if len(key) != self._key_length:

1680

raise errors.BadIndexKey(key)

1681

node = self._nodes[key]

1682

if node[0]:

1683

continue

1684

if self.reference_lists:

1685

yield self, key, node[2], node[1]

1686

else:

1687

yield self, key, node[2]

1688

return

1689

nodes_by_key = self._get_nodes_by_key()

1690

for key in keys:

1691

# sanity check

1692

if key[0] is None:

1693

raise errors.BadIndexKey(key)

1694

if len(key) != self._key_length:

1695

raise errors.BadIndexKey(key)

1696

# find what it refers to:

1697

key_dict = nodes_by_key

1698

elements = list(key)

1699

# find the subdict to return

1700

try:

1701

while len(elements) and elements[0] is not None:

1702

key_dict = key_dict[elements[0]]

1703

elements.pop(0)

1704

except KeyError:

1705

# a non-existant lookup.

1706

continue

1707

if len(elements):

1708

dicts = [key_dict]

1709

while dicts:

1710

key_dict = dicts.pop(-1)

1711

# can't be empty or would not exist

1712

item, value = key_dict.iteritems().next()

1713

if type(value) == dict:

1714

# push keys

1715

dicts.extend(key_dict.itervalues())

1716

else:

1717

# yield keys

1718

for value in key_dict.itervalues():

1719

yield (self, ) + value

1720

else:

1721

yield (self, ) + key_dict

1722

1723

def key_count(self):

1724

"""Return an estimate of the number of keys in this index.

1725

1726

For InMemoryGraphIndex the estimate is exact.

1727

"""

1728

return len(self._nodes) - len(self._absent_keys)

1729

1730

def validate(self):

1731

"""In memory index's have no known corruption at the moment."""

1732

1733

1734

class GraphIndexPrefixAdapter(object):

1735

"""An adapter between GraphIndex with different key lengths.

1736

1737

Queries against this will emit queries against the adapted Graph with the

1738

prefix added, queries for all items use iter_entries_prefix. The returned

1739

nodes will have their keys and node references adjusted to remove the

1740

prefix. Finally, an add_nodes_callback can be supplied - when called the

1741

nodes and references being added will have prefix prepended.

1742

"""

1743

1744

def __init__(self, adapted, prefix, missing_key_length,

1745

add_nodes_callback=None):

1746

"""Construct an adapter against adapted with prefix."""

1747

self.adapted = adapted

1748

self.prefix_key = prefix + (None,)*missing_key_length

1749

self.prefix = prefix

1750

self.prefix_len = len(prefix)

1751

self.add_nodes_callback = add_nodes_callback

1752

1753

def add_nodes(self, nodes):

1754

"""Add nodes to the index.

1755

1756

:param nodes: An iterable of (key, node_refs, value) entries to add.

1757

"""

1758

# save nodes in case its an iterator

1759

nodes = tuple(nodes)

1760

translated_nodes = []

1761

try:

1762

# Add prefix_key to each reference node_refs is a tuple of tuples,

1763

# so split it apart, and add prefix_key to the internal reference

1764

for (key, value, node_refs) in nodes:

1765

adjusted_references = (

1766

tuple(tuple(self.prefix + ref_node for ref_node in ref_list)

1767

for ref_list in node_refs))

1768

translated_nodes.append((self.prefix + key, value,

1769

adjusted_references))

1770

except ValueError:

1771

# XXX: TODO add an explicit interface for getting the reference list

1772

# status, to handle this bit of user-friendliness in the API more

1773

# explicitly.

1774

for (key, value) in nodes:

1775

translated_nodes.append((self.prefix + key, value))

1776

self.add_nodes_callback(translated_nodes)

1777

1778

def add_node(self, key, value, references=()):

1779

"""Add a node to the index.

1780

1781

:param key: The key. keys are non-empty tuples containing

1782

as many whitespace-free utf8 bytestrings as the key length

1783

defined for this index.

1784

:param references: An iterable of iterables of keys. Each is a

1785

reference to another key.

1786

:param value: The value to associate with the key. It may be any

1787

bytes as long as it does not contain \0 or \n.

1788

"""

1789

self.add_nodes(((key, value, references), ))

1790

1791

def _strip_prefix(self, an_iter):

1792

"""Strip prefix data from nodes and return it."""

1793

for node in an_iter:

1794

# cross checks

1795

if node[1][:self.prefix_len] != self.prefix:

1796

raise errors.BadIndexData(self)

1797

for ref_list in node[3]:

1798

for ref_node in ref_list:

1799

if ref_node[:self.prefix_len] != self.prefix:

1800

raise errors.BadIndexData(self)

1801

yield node[0], node[1][self.prefix_len:], node[2], (

1802

tuple(tuple(ref_node[self.prefix_len:] for ref_node in ref_list)

1803

for ref_list in node[3]))

1804

1805

def iter_all_entries(self):

1806

"""Iterate over all keys within the index

1807

1808

iter_all_entries is implemented against the adapted index using

1809

iter_entries_prefix.

1810

1811

:return: An iterable of (index, key, reference_lists, value). There is no

1812

defined order for the result iteration - it will be in the most

1813

efficient order for the index (in this case dictionary hash order).

1814

"""

1815

return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

1816

1817

def iter_entries(self, keys):

1818

"""Iterate over keys within the index.

1819

1820

:param keys: An iterable providing the keys to be retrieved.

1821

:return: An iterable of (index, key, value, reference_lists). There is no

1822

defined order for the result iteration - it will be in the most

1823

efficient order for the index (keys iteration order in this case).

1824

"""

1825

return self._strip_prefix(self.adapted.iter_entries(

1826

self.prefix + key for key in keys))

1827

1828

def iter_entries_prefix(self, keys):

1829

"""Iterate over keys within the index using prefix matching.

1830

1831

Prefix matching is applied within the tuple of a key, not to within

1832

the bytestring of each key element. e.g. if you have the keys ('foo',

1833

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1834

only the former key is returned.

1835

1836

:param keys: An iterable providing the key prefixes to be retrieved.

1837

Each key prefix takes the form of a tuple the length of a key, but

1838

with the last N elements 'None' rather than a regular bytestring.

1839

The first element cannot be 'None'.

1840

:return: An iterable as per iter_all_entries, but restricted to the

1841

keys with a matching prefix to those supplied. No additional keys

1842

will be returned, and every match that is in the index will be

1843

returned.

1844

"""

1845

return self._strip_prefix(self.adapted.iter_entries_prefix(

1846

self.prefix + key for key in keys))

1847

1848

def key_count(self):

1849

"""Return an estimate of the number of keys in this index.

1850

1851

For GraphIndexPrefixAdapter this is relatively expensive - key

1852

iteration with the prefix is done.

1853

"""

1854

return len(list(self.iter_all_entries()))

1855

1856

def validate(self):

1857

"""Call the adapted's validate."""

1858

self.adapted.validate()

Older »