~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Canonical.com Patch Queue Manager
Date: 2009-08-17 22:43:26 UTC
mfrom: (4617.1.2 integration)
Revision ID: pqm@pqm.ubuntu.com-20090817224326-uhljmr5me5x3xyda

(robertc) Multiple 2a-as-default fixes. (Robert Collins)

files added:
.bzrignore

.rsyncexclude

BRANCH.TODO

COPYING.txt

INSTALL

Makefile

NEWS

README

TODO

bzr.ico

bzrlib

bzrlib/__init__.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_groupcompress_py.py

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store

bzrlib/store/__init__.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/BUILD-NOTES

doc/Makefile

doc/_static

doc/_static/bzr icon 16.png

doc/_static/bzr.ico

doc/_static/en

doc/_static/en/quick-reference

doc/_static/en/quick-reference/Makefile

doc/_static/en/quick-reference/bzr-quick-reference.pdf

doc/_static/en/quick-reference/bzr-quick-reference.png

doc/_static/en/quick-reference/bzr-quick-reference.svg

doc/_templates

doc/_templates/index.html

doc/_templates/layout.html

doc/bazaar-vcs.org.kid

doc/conf.py

doc/contents.txt

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/developer-guide/HACKING.txt

doc/en/migration

doc/en/migration/index.txt

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-for-2x.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/developer-guide

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/Makefile

doc/es/quick-reference/quick-start-summary.pdf

doc/es/quick-reference/quick-start-summary.png

doc/es/quick-reference/quick-start-summary.svg

doc/es/release-notes

doc/es/user-guide

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/es/user-reference

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/make.bat

doc/news-template.txt

doc/ru

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/Makefile

doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/quick-reference/quick-start-summary.png

doc/ru/quick-reference/quick-start-summary.svg

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

setup.py

tools

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/convertfile.py

tools/convertinv.py

tools/generate_docs.py

tools/history2revfiles.py

tools/http_client.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
.bzrignore

COPYING

NEWS

README

TODO

__init__.py

equivalence_table.py

errors.py

setup.py

tests

tests/__init__.py

tests/test_equivalence_table.py

tests/test_errors.py

tests/test_repofmt.py

files renamed:
_groupcompress_c.pyx => bzrlib/_groupcompress_pyx.pyx

groupcompress.py => bzrlib/groupcompress.py

repofmt.py => bzrlib/repofmt/groupcompress_repo.py

tests/test__groupcompress_c.py => bzrlib/tests/test__groupcompress.py

tests/test_groupcompress.py => bzrlib/tests/test_groupcompress.py

DESIGN => doc/developers/groupcompress-design.txt

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

)

_HEADER_READV = (0, 200)

_OPTION_KEY_ELEMENTS = "key_elements="

_OPTION_LEN = "len="

_OPTION_NODE_REFS = "node_ref_lists="

_SIGNATURE = "Bazaar Graph Index 1\n"

_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

_newline_null_re = re.compile('[\n\0]')

def _has_key_from_parent_map(self, key):

"""Check if this index has one key.

If it's possible to check for multiple keys at once through

calling get_parent_map that should be faster.

"""

return (key in self.get_parent_map([key]))

def _missing_keys_from_parent_map(self, keys):

return set(keys) - set(self.get_parent_map(keys))

class GraphIndexBuilder(object):

"""A builder that can build a GraphIndex.

The resulting graph has the structure:

_SIGNATURE OPTIONS NODES NEWLINE

_SIGNATURE := 'Bazaar Graph Index 1' NEWLINE

OPTIONS := 'node_ref_lists=' DIGITS NEWLINE

NODES := NODE*

NODE := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

KEY := Not-whitespace-utf8

ABSENT := 'a'

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

REFERENCE := DIGITS ; digits is the byte offset in the index of the

; referenced key.

VALUE := no-newline-no-null-bytes

"""

def __init__(self, reference_lists=0, key_elements=1):

"""Create a GraphIndex builder.

:param reference_lists: The number of node references lists for each

entry.

:param key_elements: The number of bytestrings in each key.

"""

self.reference_lists = reference_lists

self._keys = set()

# A dict of {key: (absent, ref_lists, value)}

self._nodes = {}

self._nodes_by_key = None

self._key_length = key_elements

100

self._optimize_for_size = False

101

self._combine_backing_indices = True

102

103

def _check_key(self, key):

104

"""Raise BadIndexKey if key is not a valid key for this index."""

105

if type(key) != tuple:

106

raise errors.BadIndexKey(key)

107

if self._key_length != len(key):

108

raise errors.BadIndexKey(key)

109

for element in key:

110

if not element or _whitespace_re.search(element) is not None:

111

raise errors.BadIndexKey(element)

112

113

def _external_references(self):

114

"""Return references that are not present in this index.

115

"""

116

keys = set()

117

refs = set()

118

# TODO: JAM 2008-11-21 This makes an assumption about how the reference

119

# lists are used. It is currently correct for pack-0.92 through

120

# 1.9, which use the node references (3rd column) second

121

# reference list as the compression parent. Perhaps this should

122

# be moved into something higher up the stack, since it

123

# makes assumptions about how the index is used.

124

if self.reference_lists > 1:

125

for node in self.iter_all_entries():

126

keys.add(node[1])

127

refs.update(node[3][1])

128

return refs - keys

129

else:

130

# If reference_lists == 0 there can be no external references, and

131

# if reference_lists == 1, then there isn't a place to store the

132

# compression parent

133

return set()

134

135

def _get_nodes_by_key(self):

136

if self._nodes_by_key is None:

137

nodes_by_key = {}

138

if self.reference_lists:

139

for key, (absent, references, value) in self._nodes.iteritems():

140

if absent:

141

continue

142

key_dict = nodes_by_key

143

for subkey in key[:-1]:

144

key_dict = key_dict.setdefault(subkey, {})

145

key_dict[key[-1]] = key, value, references

146

else:

147

for key, (absent, references, value) in self._nodes.iteritems():

148

if absent:

149

continue

150

key_dict = nodes_by_key

151

for subkey in key[:-1]:

152

key_dict = key_dict.setdefault(subkey, {})

153

key_dict[key[-1]] = key, value

154

self._nodes_by_key = nodes_by_key

155

return self._nodes_by_key

156

157

def _update_nodes_by_key(self, key, value, node_refs):

158

"""Update the _nodes_by_key dict with a new key.

159

160

For a key of (foo, bar, baz) create

161

_nodes_by_key[foo][bar][baz] = key_value

162

"""

163

if self._nodes_by_key is None:

164

return

165

key_dict = self._nodes_by_key

166

if self.reference_lists:

167

key_value = key, value, node_refs

168

else:

169

key_value = key, value

170

for subkey in key[:-1]:

171

key_dict = key_dict.setdefault(subkey, {})

172

key_dict[key[-1]] = key_value

173

174

def _check_key_ref_value(self, key, references, value):

175

"""Check that 'key' and 'references' are all valid.

176

177

:param key: A key tuple. Must conform to the key interface (be a tuple,

178

be of the right length, not have any whitespace or nulls in any key

179

element.)

180

:param references: An iterable of reference lists. Something like

181

[[(ref, key)], [(ref, key), (other, key)]]

182

:param value: The value associate with this key. Must not contain

183

newlines or null characters.

184

:return: (node_refs, absent_references)

185

node_refs basically a packed form of 'references' where all

186

iterables are tuples

187

absent_references reference keys that are not in self._nodes.

188

This may contain duplicates if the same key is

189

referenced in multiple lists.

190

"""

191

self._check_key(key)

192

if _newline_null_re.search(value) is not None:

193

raise errors.BadIndexValue(value)

194

if len(references) != self.reference_lists:

195

raise errors.BadIndexValue(references)

196

node_refs = []

197

absent_references = []

198

for reference_list in references:

199

for reference in reference_list:

200

# If reference *is* in self._nodes, then we know it has already

201

# been checked.

202

if reference not in self._nodes:

203

self._check_key(reference)

204

absent_references.append(reference)

205

node_refs.append(tuple(reference_list))

206

return tuple(node_refs), absent_references

207

208

def add_node(self, key, value, references=()):

209

"""Add a node to the index.

210

211

:param key: The key. keys are non-empty tuples containing

212

as many whitespace-free utf8 bytestrings as the key length

213

defined for this index.

214

:param references: An iterable of iterables of keys. Each is a

215

reference to another key.

216

:param value: The value to associate with the key. It may be any

217

bytes as long as it does not contain \0 or \n.

218

"""

219

(node_refs,

220

absent_references) = self._check_key_ref_value(key, references, value)

221

if key in self._nodes and self._nodes[key][0] != 'a':

222

raise errors.BadIndexDuplicateKey(key, self)

223

for reference in absent_references:

224

# There may be duplicates, but I don't think it is worth worrying

225

# about

226

self._nodes[reference] = ('a', (), '')

227

self._nodes[key] = ('', node_refs, value)

228

self._keys.add(key)

229

if self._nodes_by_key is not None and self._key_length > 1:

230

self._update_nodes_by_key(key, value, node_refs)

231

232

def finish(self):

233

lines = [_SIGNATURE]

234

lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')

235

lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')

236

lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')

237

prefix_length = sum(len(x) for x in lines)

238

# references are byte offsets. To avoid having to do nasty

239

# polynomial work to resolve offsets (references to later in the

240

# file cannot be determined until all the inbetween references have

241

# been calculated too) we pad the offsets with 0's to make them be

242

# of consistent length. Using binary offsets would break the trivial

243

# file parsing.

244

# to calculate the width of zero's needed we do three passes:

245

# one to gather all the non-reference data and the number of references.

246

# one to pad all the data with reference-length and determine entry

247

# addresses.

248

# One to serialise.

249

250

# forward sorted by key. In future we may consider topological sorting,

251

# at the cost of table scans for direct lookup, or a second index for

252

# direct lookup

253

nodes = sorted(self._nodes.items())

254

# if we do not prepass, we don't know how long it will be up front.

255

expected_bytes = None

256

# we only need to pre-pass if we have reference lists at all.

257

if self.reference_lists:

258

key_offset_info = []

259

non_ref_bytes = prefix_length

260

total_references = 0

261

# TODO use simple multiplication for the constants in this loop.

262

for key, (absent, references, value) in nodes:

263

# record the offset known *so far* for this key:

264

# the non reference bytes to date, and the total references to

265

# date - saves reaccumulating on the second pass

266

key_offset_info.append((key, non_ref_bytes, total_references))

267

# key is literal, value is literal, there are 3 null's, 1 NL

268

# key is variable length tuple, \x00 between elements

269

non_ref_bytes += sum(len(element) for element in key)

270

if self._key_length > 1:

271

non_ref_bytes += self._key_length - 1

272

# value is literal bytes, there are 3 null's, 1 NL.

273

non_ref_bytes += len(value) + 3 + 1

274

# one byte for absent if set.

275

if absent:

276

non_ref_bytes += 1

277

elif self.reference_lists:

278

# (ref_lists -1) tabs

279

non_ref_bytes += self.reference_lists - 1

280

# (ref-1 cr's per ref_list)

281

for ref_list in references:

282

# how many references across the whole file?

283

total_references += len(ref_list)

284

# accrue reference separators

285

if ref_list:

286

non_ref_bytes += len(ref_list) - 1

287

# how many digits are needed to represent the total byte count?

288

digits = 1

289

possible_total_bytes = non_ref_bytes + total_references*digits

290

while 10 ** digits < possible_total_bytes:

291

digits += 1

292

possible_total_bytes = non_ref_bytes + total_references*digits

293

expected_bytes = possible_total_bytes + 1 # terminating newline

294

# resolve key addresses.

295

key_addresses = {}

296

for key, non_ref_bytes, total_references in key_offset_info:

297

key_addresses[key] = non_ref_bytes + total_references*digits

298

# serialise

299

format_string = '%%0%sd' % digits

300

for key, (absent, references, value) in nodes:

301

flattened_references = []

302

for ref_list in references:

303

ref_addresses = []

304

for reference in ref_list:

305

ref_addresses.append(format_string % key_addresses[reference])

306

flattened_references.append('\r'.join(ref_addresses))

307

string_key = '\x00'.join(key)

308

lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,

309

'\t'.join(flattened_references), value))

310

lines.append('\n')

311

result = StringIO(''.join(lines))

312

if expected_bytes and len(result.getvalue()) != expected_bytes:

313

raise errors.BzrError('Failed index creation. Internal error:'

314

' mismatched output length and expected length: %d %d' %

315

(len(result.getvalue()), expected_bytes))

316

return result

317

318

def set_optimize(self, for_size=None, combine_backing_indices=None):

319

"""Change how the builder tries to optimize the result.

320

321

:param for_size: Tell the builder to try and make the index as small as

322

possible.

323

:param combine_backing_indices: If the builder spills to disk to save

324

memory, should the on-disk indices be combined. Set to True if you

325

are going to be probing the index, but to False if you are not. (If

326

you are not querying, then the time spent combining is wasted.)

327

:return: None

328

"""

329

# GraphIndexBuilder itself doesn't pay attention to the flag yet, but

330

# other builders do.

331

if for_size is not None:

332

self._optimize_for_size = for_size

333

if combine_backing_indices is not None:

334

self._combine_backing_indices = combine_backing_indices

335

336

337

class GraphIndex(object):

338

"""An index for data with embedded graphs.

339

340

The index maps keys to a list of key reference lists, and a value.

341

Each node has the same number of key reference lists. Each key reference

342

list can be empty or an arbitrary length. The value is an opaque NULL

343

terminated string without any newlines. The storage of the index is

344

hidden in the interface: keys and key references are always tuples of

345

bytestrings, never the internal representation (e.g. dictionary offsets).

346

347

It is presumed that the index will not be mutated - it is static data.

348

349

Successive iter_all_entries calls will read the entire index each time.

350

Additionally, iter_entries calls will read the index linearly until the

351

desired keys are found. XXX: This must be fixed before the index is

352

suitable for production use. :XXX

353

"""

354

355

def __init__(self, transport, name, size):

356

"""Open an index called name on transport.

357

358

:param transport: A bzrlib.transport.Transport.

359

:param name: A path to provide to transport API calls.

360

:param size: The size of the index in bytes. This is used for bisection

361

logic to perform partial index reads. While the size could be

362

obtained by statting the file this introduced an additional round

363

trip as well as requiring stat'able transports, both of which are

364

avoided by having it supplied. If size is None, then bisection

365

support will be disabled and accessing the index will just stream

366

all the data.

367

"""

368

self._transport = transport

369

self._name = name

370

# Becomes a dict of key:(value, reference-list-byte-locations) used by

371

# the bisection interface to store parsed but not resolved keys.

372

self._bisect_nodes = None

373

# Becomes a dict of key:(value, reference-list-keys) which are ready to

374

# be returned directly to callers.

375

self._nodes = None

376

# a sorted list of slice-addresses for the parsed bytes of the file.

377

# e.g. (0,1) would mean that byte 0 is parsed.

378

self._parsed_byte_map = []

379

# a sorted list of keys matching each slice address for parsed bytes

380

# e.g. (None, 'foo@bar') would mean that the first byte contained no

381

# key, and the end byte of the slice is the of the data for 'foo@bar'

382

self._parsed_key_map = []

383

self._key_count = None

384

self._keys_by_offset = None

385

self._nodes_by_key = None

386

self._size = size

387

# The number of bytes we've read so far in trying to process this file

388

self._bytes_read = 0

389

390

def __eq__(self, other):

391

"""Equal when self and other were created with the same parameters."""

392

return (

393

type(self) == type(other) and

394

self._transport == other._transport and

395

self._name == other._name and

396

self._size == other._size)

397

398

def __ne__(self, other):

399

return not self.__eq__(other)

400

401

def __repr__(self):

402

return "%s(%r)" % (self.__class__.__name__,

403

self._transport.abspath(self._name))

404

405

def _buffer_all(self, stream=None):

406

"""Buffer all the index data.

407

408

Mutates self._nodes and self.keys_by_offset.

409

"""

410

if self._nodes is not None:

411

# We already did this

412

return

413

if 'index' in debug.debug_flags:

414

mutter('Reading entire index %s', self._transport.abspath(self._name))

415

if stream is None:

416

stream = self._transport.get(self._name)

417

self._read_prefix(stream)

418

self._expected_elements = 3 + self._key_length

419

line_count = 0

420

# raw data keyed by offset

421

self._keys_by_offset = {}

422

# ready-to-return key:value or key:value, node_ref_lists

423

self._nodes = {}

424

self._nodes_by_key = None

425

trailers = 0

426

pos = stream.tell()

427

lines = stream.read().split('\n')

428

del lines[-1]

429

_, _, _, trailers = self._parse_lines(lines, pos)

430

for key, absent, references, value in self._keys_by_offset.itervalues():

431

if absent:

432

continue

433

# resolve references:

434

if self.node_ref_lists:

435

node_value = (value, self._resolve_references(references))

436

else:

437

node_value = value

438

self._nodes[key] = node_value

439

# cache the keys for quick set intersections

440

self._keys = set(self._nodes)

441

if trailers != 1:

442

# there must be one line - the empty trailer line.

443

raise errors.BadIndexData(self)

444

445

def external_references(self, ref_list_num):

446

"""Return references that are not present in this index.

447

"""

448

self._buffer_all()

449

if ref_list_num + 1 > self.node_ref_lists:

450

raise ValueError('No ref list %d, index has %d ref lists'

451

% (ref_list_num, self.node_ref_lists))

452

refs = set()

453

for key, (value, ref_lists) in self._nodes.iteritems():

454

ref_list = ref_lists[ref_list_num]

455

refs.update(ref_list)

456

return refs - self._keys

457

458

def _get_nodes_by_key(self):

459

if self._nodes_by_key is None:

460

nodes_by_key = {}

461

if self.node_ref_lists:

462

for key, (value, references) in self._nodes.iteritems():

463

key_dict = nodes_by_key

464

for subkey in key[:-1]:

465

key_dict = key_dict.setdefault(subkey, {})

466

key_dict[key[-1]] = key, value, references

467

else:

468

for key, value in self._nodes.iteritems():

469

key_dict = nodes_by_key

470

for subkey in key[:-1]:

471

key_dict = key_dict.setdefault(subkey, {})

472

key_dict[key[-1]] = key, value

473

self._nodes_by_key = nodes_by_key

474

return self._nodes_by_key

475

476

def iter_all_entries(self):

477

"""Iterate over all keys within the index.

478

479

:return: An iterable of (index, key, value) or (index, key, value, reference_lists).

480

The former tuple is used when there are no reference lists in the

481

index, making the API compatible with simple key:value index types.

482

There is no defined order for the result iteration - it will be in

483

the most efficient order for the index.

484

"""

485

if 'evil' in debug.debug_flags:

486

trace.mutter_callsite(3,

487

"iter_all_entries scales with size of history.")

488

if self._nodes is None:

489

self._buffer_all()

490

if self.node_ref_lists:

491

for key, (value, node_ref_lists) in self._nodes.iteritems():

492

yield self, key, value, node_ref_lists

493

else:

494

for key, value in self._nodes.iteritems():

495

yield self, key, value

496

497

def _read_prefix(self, stream):

498

signature = stream.read(len(self._signature()))

499

if not signature == self._signature():

500

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

501

options_line = stream.readline()

502

if not options_line.startswith(_OPTION_NODE_REFS):

503

raise errors.BadIndexOptions(self)

504

try:

505

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):-1])

506

except ValueError:

507

raise errors.BadIndexOptions(self)

508

options_line = stream.readline()

509

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

510

raise errors.BadIndexOptions(self)

511

try:

512

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):-1])

513

except ValueError:

514

raise errors.BadIndexOptions(self)

515

options_line = stream.readline()

516

if not options_line.startswith(_OPTION_LEN):

517

raise errors.BadIndexOptions(self)

518

try:

519

self._key_count = int(options_line[len(_OPTION_LEN):-1])

520

except ValueError:

521

raise errors.BadIndexOptions(self)

522

523

def _resolve_references(self, references):

524

"""Return the resolved key references for references.

525

526

References are resolved by looking up the location of the key in the

527

_keys_by_offset map and substituting the key name, preserving ordering.

528

529

:param references: An iterable of iterables of key locations. e.g.

530

[[123, 456], [123]]

531

:return: A tuple of tuples of keys.

532

"""

533

node_refs = []

534

for ref_list in references:

535

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

536

return tuple(node_refs)

537

538

def _find_index(self, range_map, key):

539

"""Helper for the _parsed_*_index calls.

540

541

Given a range map - [(start, end), ...], finds the index of the range

542

in the map for key if it is in the map, and if it is not there, the

543

immediately preceeding range in the map.

544

"""

545

result = bisect_right(range_map, key) - 1

546

if result + 1 < len(range_map):

547

# check the border condition, it may be in result + 1

548

if range_map[result + 1][0] == key[0]:

549

return result + 1

550

return result

551

552

def _parsed_byte_index(self, offset):

553

"""Return the index of the entry immediately before offset.

554

555

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

556

there is one unparsed byte (the 11th, addressed as[10]). then:

557

asking for 0 will return 0

558

asking for 10 will return 0

559

asking for 11 will return 1

560

asking for 12 will return 1

561

"""

562

key = (offset, 0)

563

return self._find_index(self._parsed_byte_map, key)

564

565

def _parsed_key_index(self, key):

566

"""Return the index of the entry immediately before key.

567

568

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

569

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

570

have been parsed, then:

571

asking for '' will return 0

572

asking for 'a' will return 0

573

asking for 'b' will return 1

574

asking for 'e' will return 1

575

"""

576

search_key = (key, None)

577

return self._find_index(self._parsed_key_map, search_key)

578

579

def _is_parsed(self, offset):

580

"""Returns True if offset has been parsed."""

581

index = self._parsed_byte_index(offset)

582

if index == len(self._parsed_byte_map):

583

return offset < self._parsed_byte_map[index - 1][1]

584

start, end = self._parsed_byte_map[index]

585

return offset >= start and offset < end

586

587

def _iter_entries_from_total_buffer(self, keys):

588

"""Iterate over keys when the entire index is parsed."""

589

keys = keys.intersection(self._keys)

590

if self.node_ref_lists:

591

for key in keys:

592

value, node_refs = self._nodes[key]

593

yield self, key, value, node_refs

594

else:

595

for key in keys:

596

yield self, key, self._nodes[key]

597

598

def iter_entries(self, keys):

599

"""Iterate over keys within the index.

600

601

:param keys: An iterable providing the keys to be retrieved.

602

:return: An iterable as per iter_all_entries, but restricted to the

603

keys supplied. No additional keys will be returned, and every

604

key supplied that is in the index will be returned.

605

"""

606

keys = set(keys)

607

if not keys:

608

return []

609

if self._size is None and self._nodes is None:

610

self._buffer_all()

611

612

# We fit about 20 keys per minimum-read (4K), so if we are looking for

613

# more than 1/20th of the index its likely (assuming homogenous key

614

# spread) that we'll read the entire index. If we're going to do that,

615

# buffer the whole thing. A better analysis might take key spread into

616

# account - but B+Tree indices are better anyway.

617

# We could look at all data read, and use a threshold there, which will

618

# trigger on ancestry walks, but that is not yet fully mapped out.

619

if self._nodes is None and len(keys) * 20 > self.key_count():

620

self._buffer_all()

621

if self._nodes is not None:

622

return self._iter_entries_from_total_buffer(keys)

623

else:

624

return (result[1] for result in bisect_multi_bytes(

625

self._lookup_keys_via_location, self._size, keys))

626

627

def iter_entries_prefix(self, keys):

628

"""Iterate over keys within the index using prefix matching.

629

630

Prefix matching is applied within the tuple of a key, not to within

631

the bytestring of each key element. e.g. if you have the keys ('foo',

632

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

633

only the former key is returned.

634

635

WARNING: Note that this method currently causes a full index parse

636

unconditionally (which is reasonably appropriate as it is a means for

637

thunking many small indices into one larger one and still supplies

638

iter_all_entries at the thunk layer).

639

640

:param keys: An iterable providing the key prefixes to be retrieved.

641

Each key prefix takes the form of a tuple the length of a key, but

642

with the last N elements 'None' rather than a regular bytestring.

643

The first element cannot be 'None'.

644

:return: An iterable as per iter_all_entries, but restricted to the

645

keys with a matching prefix to those supplied. No additional keys

646

will be returned, and every match that is in the index will be

647

returned.

648

"""

649

keys = set(keys)

650

if not keys:

651

return

652

# load data - also finds key lengths

653

if self._nodes is None:

654

self._buffer_all()

655

if self._key_length == 1:

656

for key in keys:

657

# sanity check

658

if key[0] is None:

659

raise errors.BadIndexKey(key)

660

if len(key) != self._key_length:

661

raise errors.BadIndexKey(key)

662

if self.node_ref_lists:

663

value, node_refs = self._nodes[key]

664

yield self, key, value, node_refs

665

else:

666

yield self, key, self._nodes[key]

667

return

668

nodes_by_key = self._get_nodes_by_key()

669

for key in keys:

670

# sanity check

671

if key[0] is None:

672

raise errors.BadIndexKey(key)

673

if len(key) != self._key_length:

674

raise errors.BadIndexKey(key)

675

# find what it refers to:

676

key_dict = nodes_by_key

677

elements = list(key)

678

# find the subdict whose contents should be returned.

679

try:

680

while len(elements) and elements[0] is not None:

681

key_dict = key_dict[elements[0]]

682

elements.pop(0)

683

except KeyError:

684

# a non-existant lookup.

685

continue

686

if len(elements):

687

dicts = [key_dict]

688

while dicts:

689

key_dict = dicts.pop(-1)

690

# can't be empty or would not exist

691

item, value = key_dict.iteritems().next()

692

if type(value) == dict:

693

# push keys

694

dicts.extend(key_dict.itervalues())

695

else:

696

# yield keys

697

for value in key_dict.itervalues():

698

# each value is the key:value:node refs tuple

699

# ready to yield.

700

yield (self, ) + value

701

else:

702

# the last thing looked up was a terminal element

703

yield (self, ) + key_dict

704

705

def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):

706

"""See BTreeIndex._find_ancestors."""

707

# The api can be implemented as a trivial overlay on top of

708

# iter_entries, it is not an efficient implementation, but it at least

709

# gets the job done.

710

found_keys = set()

711

search_keys = set()

712

for index, key, value, refs in self.iter_entries(keys):

713

parent_keys = refs[ref_list_num]

714

found_keys.add(key)

715

parent_map[key] = parent_keys

716

search_keys.update(parent_keys)

717

# Figure out what, if anything, was missing

718

missing_keys.update(set(keys).difference(found_keys))

719

search_keys = search_keys.difference(parent_map)

720

return search_keys

721

722

def key_count(self):

723

"""Return an estimate of the number of keys in this index.

724

725

For GraphIndex the estimate is exact.

726

"""

727

if self._key_count is None:

728

self._read_and_parse([_HEADER_READV])

729

return self._key_count

730

731

def _lookup_keys_via_location(self, location_keys):

732

"""Public interface for implementing bisection.

733

734

If _buffer_all has been called, then all the data for the index is in

735

memory, and this method should not be called, as it uses a separate

736

cache because it cannot pre-resolve all indices, which buffer_all does

737

for performance.

738

739

:param location_keys: A list of location(byte offset), key tuples.

740

:return: A list of (location_key, result) tuples as expected by

741

bzrlib.bisect_multi.bisect_multi_bytes.

742

"""

743

# Possible improvements:

744

# - only bisect lookup each key once

745

# - sort the keys first, and use that to reduce the bisection window

746

# -----

747

# this progresses in three parts:

748

# read data

749

# parse it

750

# attempt to answer the question from the now in memory data.

751

# build the readv request

752

# for each location, ask for 800 bytes - much more than rows we've seen

753

# anywhere.

754

readv_ranges = []

755

for location, key in location_keys:

756

# can we answer from cache?

757

if self._bisect_nodes and key in self._bisect_nodes:

758

# We have the key parsed.

759

continue

760

index = self._parsed_key_index(key)

761

if (len(self._parsed_key_map) and

762

self._parsed_key_map[index][0] <= key and

763

(self._parsed_key_map[index][1] >= key or

764

# end of the file has been parsed

765

self._parsed_byte_map[index][1] == self._size)):

766

# the key has been parsed, so no lookup is needed even if its

767

# not present.

768

continue

769

# - if we have examined this part of the file already - yes

770

index = self._parsed_byte_index(location)

771

if (len(self._parsed_byte_map) and

772

self._parsed_byte_map[index][0] <= location and

773

self._parsed_byte_map[index][1] > location):

774

# the byte region has been parsed, so no read is needed.

775

continue

776

length = 800

777

if location + length > self._size:

778

length = self._size - location

779

# todo, trim out parsed locations.

780

if length > 0:

781

readv_ranges.append((location, length))

782

# read the header if needed

783

if self._bisect_nodes is None:

784

readv_ranges.append(_HEADER_READV)

785

self._read_and_parse(readv_ranges)

786

result = []

787

if self._nodes is not None:

788

# _read_and_parse triggered a _buffer_all because we requested the

789

# whole data range

790

for location, key in location_keys:

791

if key not in self._nodes: # not present

792

result.append(((location, key), False))

793

elif self.node_ref_lists:

794

value, refs = self._nodes[key]

795

result.append(((location, key),

796

(self, key, value, refs)))

797

else:

798

result.append(((location, key),

799

(self, key, self._nodes[key])))

800

return result

801

# generate results:

802

# - figure out <, >, missing, present

803

# - result present references so we can return them.

804

# keys that we cannot answer until we resolve references

805

pending_references = []

806

pending_locations = set()

807

for location, key in location_keys:

808

# can we answer from cache?

809

if key in self._bisect_nodes:

810

# the key has been parsed, so no lookup is needed

811

if self.node_ref_lists:

812

# the references may not have been all parsed.

813

value, refs = self._bisect_nodes[key]

814

wanted_locations = []

815

for ref_list in refs:

816

for ref in ref_list:

817

if ref not in self._keys_by_offset:

818

wanted_locations.append(ref)

819

if wanted_locations:

820

pending_locations.update(wanted_locations)

821

pending_references.append((location, key))

822

continue

823

result.append(((location, key), (self, key,

824

value, self._resolve_references(refs))))

825

else:

826

result.append(((location, key),

827

(self, key, self._bisect_nodes[key])))

828

continue

829

else:

830

# has the region the key should be in, been parsed?

831

index = self._parsed_key_index(key)

832

if (self._parsed_key_map[index][0] <= key and

833

(self._parsed_key_map[index][1] >= key or

834

# end of the file has been parsed

835

self._parsed_byte_map[index][1] == self._size)):

836

result.append(((location, key), False))

837

continue

838

# no, is the key above or below the probed location:

839

# get the range of the probed & parsed location

840

index = self._parsed_byte_index(location)

841

# if the key is below the start of the range, its below

842

if key < self._parsed_key_map[index][0]:

843

direction = -1

844

else:

845

direction = +1

846

result.append(((location, key), direction))

847

readv_ranges = []

848

# lookup data to resolve references

849

for location in pending_locations:

850

length = 800

851

if location + length > self._size:

852

length = self._size - location

853

# TODO: trim out parsed locations (e.g. if the 800 is into the

854

# parsed region trim it, and dont use the adjust_for_latency

855

# facility)

856

if length > 0:

857

readv_ranges.append((location, length))

858

self._read_and_parse(readv_ranges)

859

if self._nodes is not None:

860

# The _read_and_parse triggered a _buffer_all, grab the data and

861

# return it

862

for location, key in pending_references:

863

value, refs = self._nodes[key]

864

result.append(((location, key), (self, key, value, refs)))

865

return result

866

for location, key in pending_references:

867

# answer key references we had to look-up-late.

868

value, refs = self._bisect_nodes[key]

869

result.append(((location, key), (self, key,

870

value, self._resolve_references(refs))))

871

return result

872

873

def _parse_header_from_bytes(self, bytes):

874

"""Parse the header from a region of bytes.

875

876

:param bytes: The data to parse.

877

:return: An offset, data tuple such as readv yields, for the unparsed

878

data. (which may length 0).

879

"""

880

signature = bytes[0:len(self._signature())]

881

if not signature == self._signature():

882

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

883

lines = bytes[len(self._signature()):].splitlines()

884

options_line = lines[0]

885

if not options_line.startswith(_OPTION_NODE_REFS):

886

raise errors.BadIndexOptions(self)

887

try:

888

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):])

889

except ValueError:

890

raise errors.BadIndexOptions(self)

891

options_line = lines[1]

892

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

893

raise errors.BadIndexOptions(self)

894

try:

895

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):])

896

except ValueError:

897

raise errors.BadIndexOptions(self)

898

options_line = lines[2]

899

if not options_line.startswith(_OPTION_LEN):

900

raise errors.BadIndexOptions(self)

901

try:

902

self._key_count = int(options_line[len(_OPTION_LEN):])

903

except ValueError:

904

raise errors.BadIndexOptions(self)

905

# calculate the bytes we have processed

906

header_end = (len(signature) + len(lines[0]) + len(lines[1]) +

907

len(lines[2]) + 3)

908

self._parsed_bytes(0, None, header_end, None)

909

# setup parsing state

910

self._expected_elements = 3 + self._key_length

911

# raw data keyed by offset

912

self._keys_by_offset = {}

913

# keys with the value and node references

914

self._bisect_nodes = {}

915

return header_end, bytes[header_end:]

916

917

def _parse_region(self, offset, data):

918

"""Parse node data returned from a readv operation.

919

920

:param offset: The byte offset the data starts at.

921

:param data: The data to parse.

922

"""

923

# trim the data.

924

# end first:

925

end = offset + len(data)

926

high_parsed = offset

927

while True:

928

# Trivial test - if the current index's end is within the

929

# low-matching parsed range, we're done.

930

index = self._parsed_byte_index(high_parsed)

931

if end < self._parsed_byte_map[index][1]:

932

return

933

# print "[%d:%d]" % (offset, end), \

934

# self._parsed_byte_map[index:index + 2]

935

high_parsed, last_segment = self._parse_segment(

936

offset, data, end, index)

937

if last_segment:

938

return

939

940

def _parse_segment(self, offset, data, end, index):

941

"""Parse one segment of data.

942

943

:param offset: Where 'data' begins in the file.

944

:param data: Some data to parse a segment of.

945

:param end: Where data ends

946

:param index: The current index into the parsed bytes map.

947

:return: True if the parsed segment is the last possible one in the

948

range of data.

949

:return: high_parsed_byte, last_segment.

950

high_parsed_byte is the location of the highest parsed byte in this

951

segment, last_segment is True if the parsed segment is the last

952

possible one in the data block.

953

"""

954

# default is to use all data

955

trim_end = None

956

# accomodate overlap with data before this.

957

if offset < self._parsed_byte_map[index][1]:

958

# overlaps the lower parsed region

959

# skip the parsed data

960

trim_start = self._parsed_byte_map[index][1] - offset

961

# don't trim the start for \n

962

start_adjacent = True

963

elif offset == self._parsed_byte_map[index][1]:

964

# abuts the lower parsed region

965

# use all data

966

trim_start = None

967

# do not trim anything

968

start_adjacent = True

969

else:

970

# does not overlap the lower parsed region

971

# use all data

972

trim_start = None

973

# but trim the leading \n

974

start_adjacent = False

975

if end == self._size:

976

# lines up to the end of all data:

977

# use it all

978

trim_end = None

979

# do not strip to the last \n

980

end_adjacent = True

981

last_segment = True

982

elif index + 1 == len(self._parsed_byte_map):

983

# at the end of the parsed data

984

# use it all

985

trim_end = None

986

# but strip to the last \n

987

end_adjacent = False

988

last_segment = True

989

elif end == self._parsed_byte_map[index + 1][0]:

990

# buts up against the next parsed region

991

# use it all

992

trim_end = None

993

# do not strip to the last \n

994

end_adjacent = True

995

last_segment = True

996

elif end > self._parsed_byte_map[index + 1][0]:

997

# overlaps into the next parsed region

998

# only consider the unparsed data

999

trim_end = self._parsed_byte_map[index + 1][0] - offset

1000

# do not strip to the last \n as we know its an entire record

1001

end_adjacent = True

1002

last_segment = end < self._parsed_byte_map[index + 1][1]

1003

else:

1004

# does not overlap into the next region

1005

# use it all

1006

trim_end = None

1007

# but strip to the last \n

1008

end_adjacent = False

1009

last_segment = True

1010

# now find bytes to discard if needed

1011

if not start_adjacent:

1012

# work around python bug in rfind

1013

if trim_start is None:

1014

trim_start = data.find('\n') + 1

1015

else:

1016

trim_start = data.find('\n', trim_start) + 1

1017

if not (trim_start != 0):

1018

raise AssertionError('no \n was present')

1019

# print 'removing start', offset, trim_start, repr(data[:trim_start])

1020

if not end_adjacent:

1021

# work around python bug in rfind

1022

if trim_end is None:

1023

trim_end = data.rfind('\n') + 1

1024

else:

1025

trim_end = data.rfind('\n', None, trim_end) + 1

1026

if not (trim_end != 0):

1027

raise AssertionError('no \n was present')

1028

# print 'removing end', offset, trim_end, repr(data[trim_end:])

1029

# adjust offset and data to the parseable data.

1030

trimmed_data = data[trim_start:trim_end]

1031

if not (trimmed_data):

1032

raise AssertionError('read unneeded data [%d:%d] from [%d:%d]'

1033

% (trim_start, trim_end, offset, offset + len(data)))

1034

if trim_start:

1035

offset += trim_start

1036

# print "parsing", repr(trimmed_data)

1037

# splitlines mangles the \r delimiters.. don't use it.

1038

lines = trimmed_data.split('\n')

1039

del lines[-1]

1040

pos = offset

1041

first_key, last_key, nodes, _ = self._parse_lines(lines, pos)

1042

for key, value in nodes:

1043

self._bisect_nodes[key] = value

1044

self._parsed_bytes(offset, first_key,

1045

offset + len(trimmed_data), last_key)

1046

return offset + len(trimmed_data), last_segment

1047

1048

def _parse_lines(self, lines, pos):

1049

key = None

1050

first_key = None

1051

trailers = 0

1052

nodes = []

1053

for line in lines:

1054

if line == '':

1055

# must be at the end

1056

if self._size:

1057

if not (self._size == pos + 1):

1058

raise AssertionError("%s %s" % (self._size, pos))

1059

trailers += 1

1060

continue

1061

elements = line.split('\0')

1062

if len(elements) != self._expected_elements:

1063

raise errors.BadIndexData(self)

1064

# keys are tuples. Each element is a string that may occur many

1065

# times, so we intern them to save space. AB, RC, 200807

1066

key = tuple([intern(element) for element in elements[:self._key_length]])

1067

if first_key is None:

1068

first_key = key

1069

absent, references, value = elements[-3:]

1070

ref_lists = []

1071

for ref_string in references.split('\t'):

1072

ref_lists.append(tuple([

1073

int(ref) for ref in ref_string.split('\r') if ref

1074

]))

1075

ref_lists = tuple(ref_lists)

1076

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

1077

pos += len(line) + 1 # +1 for the \n

1078

if absent:

1079

continue

1080

if self.node_ref_lists:

1081

node_value = (value, ref_lists)

1082

else:

1083

node_value = value

1084

nodes.append((key, node_value))

1085

# print "parsed ", key

1086

return first_key, key, nodes, trailers

1087

1088

def _parsed_bytes(self, start, start_key, end, end_key):

1089

"""Mark the bytes from start to end as parsed.

1090

1091

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

1092

1) as parsed.

1093

1094

:param start: The start of the parsed region.

1095

:param end: The end of the parsed region.

1096

"""

1097

index = self._parsed_byte_index(start)

1098

new_value = (start, end)

1099

new_key = (start_key, end_key)

1100

if index == -1:

1101

# first range parsed is always the beginning.

1102

self._parsed_byte_map.insert(index, new_value)

1103

self._parsed_key_map.insert(index, new_key)

1104

return

1105

# four cases:

1106

# new region

1107

# extend lower region

1108

# extend higher region

1109

# combine two regions

1110

if (index + 1 < len(self._parsed_byte_map) and

1111

self._parsed_byte_map[index][1] == start and

1112

self._parsed_byte_map[index + 1][0] == end):

1113

# combine two regions

1114

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

1115

self._parsed_byte_map[index + 1][1])

1116

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

1117

self._parsed_key_map[index + 1][1])

1118

del self._parsed_byte_map[index + 1]

1119

del self._parsed_key_map[index + 1]

1120

elif self._parsed_byte_map[index][1] == start:

1121

# extend the lower entry

1122

self._parsed_byte_map[index] = (

1123

self._parsed_byte_map[index][0], end)

1124

self._parsed_key_map[index] = (

1125

self._parsed_key_map[index][0], end_key)

1126

elif (index + 1 < len(self._parsed_byte_map) and

1127

self._parsed_byte_map[index + 1][0] == end):

1128

# extend the higher entry

1129

self._parsed_byte_map[index + 1] = (

1130

start, self._parsed_byte_map[index + 1][1])

1131

self._parsed_key_map[index + 1] = (

1132

start_key, self._parsed_key_map[index + 1][1])

1133

else:

1134

# new entry

1135

self._parsed_byte_map.insert(index + 1, new_value)

1136

self._parsed_key_map.insert(index + 1, new_key)

1137

1138

def _read_and_parse(self, readv_ranges):

1139

"""Read the the ranges and parse the resulting data.

1140

1141

:param readv_ranges: A prepared readv range list.

1142

"""

1143

if not readv_ranges:

1144

return

1145

if self._nodes is None and self._bytes_read * 2 >= self._size:

1146

# We've already read more than 50% of the file and we are about to

1147

# request more data, just _buffer_all() and be done

1148

self._buffer_all()

1149

return

1150

1151

readv_data = self._transport.readv(self._name, readv_ranges, True,

1152

self._size)

1153

# parse

1154

for offset, data in readv_data:

1155

self._bytes_read += len(data)

1156

if offset == 0 and len(data) == self._size:

1157

# We read the whole range, most likely because the

1158

# Transport upcast our readv ranges into one long request

1159

# for enough total data to grab the whole index.

1160

self._buffer_all(StringIO(data))

1161

return

1162

if self._bisect_nodes is None:

1163

# this must be the start

1164

if not (offset == 0):

1165

raise AssertionError()

1166

offset, data = self._parse_header_from_bytes(data)

1167

# print readv_ranges, "[%d:%d]" % (offset, offset + len(data))

1168

self._parse_region(offset, data)

1169

1170

def _signature(self):

1171

"""The file signature for this index type."""

1172

return _SIGNATURE

1173

1174

def validate(self):

1175

"""Validate that everything in the index can be accessed."""

1176

# iter_all validates completely at the moment, so just do that.

1177

for node in self.iter_all_entries():

1178

pass

1179

1180

1181

class CombinedGraphIndex(object):

1182

"""A GraphIndex made up from smaller GraphIndices.

1183

1184

The backing indices must implement GraphIndex, and are presumed to be

1185

static data.

1186

1187

Queries against the combined index will be made against the first index,

1188

and then the second and so on. The order of index's can thus influence

1189

performance significantly. For example, if one index is on local disk and a

1190

second on a remote server, the local disk index should be before the other

1191

in the index list.

1192

"""

1193

1194

def __init__(self, indices, reload_func=None):

1195

"""Create a CombinedGraphIndex backed by indices.

1196

1197

:param indices: An ordered list of indices to query for data.

1198

:param reload_func: A function to call if we find we are missing an

1199

index. Should have the form reload_func() => True/False to indicate

1200

if reloading actually changed anything.

1201

"""

1202

self._indices = indices

1203

self._reload_func = reload_func

1204

1205

def __repr__(self):

1206

return "%s(%s)" % (

1207

self.__class__.__name__,

1208

', '.join(map(repr, self._indices)))

1209

1210

def get_parent_map(self, keys):

1211

"""See graph.StackedParentsProvider.get_parent_map"""

1212

search_keys = set(keys)

1213

if NULL_REVISION in search_keys:

1214

search_keys.discard(NULL_REVISION)

1215

found_parents = {NULL_REVISION:[]}

1216

else:

1217

found_parents = {}

1218

for index, key, value, refs in self.iter_entries(search_keys):

1219

parents = refs[0]

1220

if not parents:

1221

parents = (NULL_REVISION,)

1222

found_parents[key] = parents

1223

return found_parents

1224

1225

has_key = _has_key_from_parent_map

1226

1227

def insert_index(self, pos, index):

1228

"""Insert a new index in the list of indices to query.

1229

1230

:param pos: The position to insert the index.

1231

:param index: The index to insert.

1232

"""

1233

self._indices.insert(pos, index)

1234

1235

def iter_all_entries(self):

1236

"""Iterate over all keys within the index

1237

1238

Duplicate keys across child indices are presumed to have the same

1239

value and are only reported once.

1240

1241

:return: An iterable of (index, key, reference_lists, value).

1242

There is no defined order for the result iteration - it will be in

1243

the most efficient order for the index.

1244

"""

1245

seen_keys = set()

1246

while True:

1247

try:

1248

for index in self._indices:

1249

for node in index.iter_all_entries():

1250

if node[1] not in seen_keys:

1251

yield node

1252

seen_keys.add(node[1])

1253

return

1254

except errors.NoSuchFile:

1255

self._reload_or_raise()

1256

1257

def iter_entries(self, keys):

1258

"""Iterate over keys within the index.

1259

1260

Duplicate keys across child indices are presumed to have the same

1261

value and are only reported once.

1262

1263

:param keys: An iterable providing the keys to be retrieved.

1264

:return: An iterable of (index, key, reference_lists, value). There is no

1265

defined order for the result iteration - it will be in the most

1266

efficient order for the index.

1267

"""

1268

keys = set(keys)

1269

while True:

1270

try:

1271

for index in self._indices:

1272

if not keys:

1273

return

1274

for node in index.iter_entries(keys):

1275

keys.remove(node[1])

1276

yield node

1277

return

1278

except errors.NoSuchFile:

1279

self._reload_or_raise()

1280

1281

def iter_entries_prefix(self, keys):

1282

"""Iterate over keys within the index using prefix matching.

1283

1284

Duplicate keys across child indices are presumed to have the same

1285

value and are only reported once.

1286

1287

Prefix matching is applied within the tuple of a key, not to within

1288

the bytestring of each key element. e.g. if you have the keys ('foo',

1289

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1290

only the former key is returned.

1291

1292

:param keys: An iterable providing the key prefixes to be retrieved.

1293

Each key prefix takes the form of a tuple the length of a key, but

1294

with the last N elements 'None' rather than a regular bytestring.

1295

The first element cannot be 'None'.

1296

:return: An iterable as per iter_all_entries, but restricted to the

1297

keys with a matching prefix to those supplied. No additional keys

1298

will be returned, and every match that is in the index will be

1299

returned.

1300

"""

1301

keys = set(keys)

1302

if not keys:

1303

return

1304

seen_keys = set()

1305

while True:

1306

try:

1307

for index in self._indices:

1308

for node in index.iter_entries_prefix(keys):

1309

if node[1] in seen_keys:

1310

continue

1311

seen_keys.add(node[1])

1312

yield node

1313

return

1314

except errors.NoSuchFile:

1315

self._reload_or_raise()

1316

1317

def find_ancestry(self, keys, ref_list_num):

1318

"""Find the complete ancestry for the given set of keys.

1319

1320

Note that this is a whole-ancestry request, so it should be used

1321

sparingly.

1322

1323

:param keys: An iterable of keys to look for

1324

:param ref_list_num: The reference list which references the parents

1325

we care about.

1326

:return: (parent_map, missing_keys)

1327

"""

1328

missing_keys = set()

1329

parent_map = {}

1330

keys_to_lookup = set(keys)

1331

generation = 0

1332

while keys_to_lookup:

1333

# keys that *all* indexes claim are missing, stop searching them

1334

generation += 1

1335

all_index_missing = None

1336

# print 'gen\tidx\tsub\tn_keys\tn_pmap\tn_miss'

1337

# print '%4d\t\t\t%4d\t%5d\t%5d' % (generation, len(keys_to_lookup),

1338

# len(parent_map),

1339

# len(missing_keys))

1340

for index_idx, index in enumerate(self._indices):

1341

# TODO: we should probably be doing something with

1342

# 'missing_keys' since we've already determined that

1343

# those revisions have not been found anywhere

1344

index_missing_keys = set()

1345

# Find all of the ancestry we can from this index

1346

# keep looking until the search_keys set is empty, which means

1347

# things we didn't find should be in index_missing_keys

1348

search_keys = keys_to_lookup

1349

sub_generation = 0

1350

# print ' \t%2d\t\t%4d\t%5d\t%5d' % (

1351

# index_idx, len(search_keys),

1352

# len(parent_map), len(index_missing_keys))

1353

while search_keys:

1354

sub_generation += 1

1355

# TODO: ref_list_num should really be a parameter, since

1356

# CombinedGraphIndex does not know what the ref lists

1357

# mean.

1358

search_keys = index._find_ancestors(search_keys,

1359

ref_list_num, parent_map, index_missing_keys)

1360

# print ' \t \t%2d\t%4d\t%5d\t%5d' % (

1361

# sub_generation, len(search_keys),

1362

# len(parent_map), len(index_missing_keys))

1363

# Now set whatever was missing to be searched in the next index

1364

keys_to_lookup = index_missing_keys

1365

if all_index_missing is None:

1366

all_index_missing = set(index_missing_keys)

1367

else:

1368

all_index_missing.intersection_update(index_missing_keys)

1369

if not keys_to_lookup:

1370

break

1371

if all_index_missing is None:

1372

# There were no indexes, so all search keys are 'missing'

1373

missing_keys.update(keys_to_lookup)

1374

keys_to_lookup = None

1375

else:

1376

missing_keys.update(all_index_missing)

1377

keys_to_lookup.difference_update(all_index_missing)

1378

return parent_map, missing_keys

1379

1380

def key_count(self):

1381

"""Return an estimate of the number of keys in this index.

1382

1383

For CombinedGraphIndex this is approximated by the sum of the keys of

1384

the child indices. As child indices may have duplicate keys this can

1385

have a maximum error of the number of child indices * largest number of

1386

keys in any index.

1387

"""

1388

while True:

1389

try:

1390

return sum((index.key_count() for index in self._indices), 0)

1391

except errors.NoSuchFile:

1392

self._reload_or_raise()

1393

1394

missing_keys = _missing_keys_from_parent_map

1395

1396

def _reload_or_raise(self):

1397

"""We just got a NoSuchFile exception.

1398

1399

Try to reload the indices, if it fails, just raise the current

1400

exception.

1401

"""

1402

if self._reload_func is None:

1403

raise

1404

exc_type, exc_value, exc_traceback = sys.exc_info()

1405

trace.mutter('Trying to reload after getting exception: %s',

1406

exc_value)

1407

if not self._reload_func():

1408

# We tried to reload, but nothing changed, so we fail anyway

1409

trace.mutter('_reload_func indicated nothing has changed.'

1410

' Raising original exception.')

1411

raise exc_type, exc_value, exc_traceback

1412

1413

def validate(self):

1414

"""Validate that everything in the index can be accessed."""

1415

while True:

1416

try:

1417

for index in self._indices:

1418

index.validate()

1419

return

1420

except errors.NoSuchFile:

1421

self._reload_or_raise()

1422

1423

1424

class InMemoryGraphIndex(GraphIndexBuilder):

1425

"""A GraphIndex which operates entirely out of memory and is mutable.

1426

1427

This is designed to allow the accumulation of GraphIndex entries during a

1428

single write operation, where the accumulated entries need to be immediately

1429

available - for example via a CombinedGraphIndex.

1430

"""

1431

1432

def add_nodes(self, nodes):

1433

"""Add nodes to the index.

1434

1435

:param nodes: An iterable of (key, node_refs, value) entries to add.

1436

"""

1437

if self.reference_lists:

1438

for (key, value, node_refs) in nodes:

1439

self.add_node(key, value, node_refs)

1440

else:

1441

for (key, value) in nodes:

1442

self.add_node(key, value)

1443

1444

def iter_all_entries(self):

1445

"""Iterate over all keys within the index

1446

1447

:return: An iterable of (index, key, reference_lists, value). There is no

1448

defined order for the result iteration - it will be in the most

1449

efficient order for the index (in this case dictionary hash order).

1450

"""

1451

if 'evil' in debug.debug_flags:

1452

trace.mutter_callsite(3,

1453

"iter_all_entries scales with size of history.")

1454

if self.reference_lists:

1455

for key, (absent, references, value) in self._nodes.iteritems():

1456

if not absent:

1457

yield self, key, value, references

1458

else:

1459

for key, (absent, references, value) in self._nodes.iteritems():

1460

if not absent:

1461

yield self, key, value

1462

1463

def iter_entries(self, keys):

1464

"""Iterate over keys within the index.

1465

1466

:param keys: An iterable providing the keys to be retrieved.

1467

:return: An iterable of (index, key, value, reference_lists). There is no

1468

defined order for the result iteration - it will be in the most

1469

efficient order for the index (keys iteration order in this case).

1470

"""

1471

keys = set(keys)

1472

if self.reference_lists:

1473

for key in keys.intersection(self._keys):

1474

node = self._nodes[key]

1475

if not node[0]:

1476

yield self, key, node[2], node[1]

1477

else:

1478

for key in keys.intersection(self._keys):

1479

node = self._nodes[key]

1480

if not node[0]:

1481

yield self, key, node[2]

1482

1483

def iter_entries_prefix(self, keys):

1484

"""Iterate over keys within the index using prefix matching.

1485

1486

Prefix matching is applied within the tuple of a key, not to within

1487

the bytestring of each key element. e.g. if you have the keys ('foo',

1488

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1489

only the former key is returned.

1490

1491

:param keys: An iterable providing the key prefixes to be retrieved.

1492

Each key prefix takes the form of a tuple the length of a key, but

1493

with the last N elements 'None' rather than a regular bytestring.

1494

The first element cannot be 'None'.

1495

:return: An iterable as per iter_all_entries, but restricted to the

1496

keys with a matching prefix to those supplied. No additional keys

1497

will be returned, and every match that is in the index will be

1498

returned.

1499

"""

1500

# XXX: To much duplication with the GraphIndex class; consider finding

1501

# a good place to pull out the actual common logic.

1502

keys = set(keys)

1503

if not keys:

1504

return

1505

if self._key_length == 1:

1506

for key in keys:

1507

# sanity check

1508

if key[0] is None:

1509

raise errors.BadIndexKey(key)

1510

if len(key) != self._key_length:

1511

raise errors.BadIndexKey(key)

1512

node = self._nodes[key]

1513

if node[0]:

1514

continue

1515

if self.reference_lists:

1516

yield self, key, node[2], node[1]

1517

else:

1518

yield self, key, node[2]

1519

return

1520

nodes_by_key = self._get_nodes_by_key()

1521

for key in keys:

1522

# sanity check

1523

if key[0] is None:

1524

raise errors.BadIndexKey(key)

1525

if len(key) != self._key_length:

1526

raise errors.BadIndexKey(key)

1527

# find what it refers to:

1528

key_dict = nodes_by_key

1529

elements = list(key)

1530

# find the subdict to return

1531

try:

1532

while len(elements) and elements[0] is not None:

1533

key_dict = key_dict[elements[0]]

1534

elements.pop(0)

1535

except KeyError:

1536

# a non-existant lookup.

1537

continue

1538

if len(elements):

1539

dicts = [key_dict]

1540

while dicts:

1541

key_dict = dicts.pop(-1)

1542

# can't be empty or would not exist

1543

item, value = key_dict.iteritems().next()

1544

if type(value) == dict:

1545

# push keys

1546

dicts.extend(key_dict.itervalues())

1547

else:

1548

# yield keys

1549

for value in key_dict.itervalues():

1550

yield (self, ) + value

1551

else:

1552

yield (self, ) + key_dict

1553

1554

def key_count(self):

1555

"""Return an estimate of the number of keys in this index.

1556

1557

For InMemoryGraphIndex the estimate is exact.

1558

"""

1559

return len(self._keys)

1560

1561

def validate(self):

1562

"""In memory index's have no known corruption at the moment."""

1563

1564

1565

class GraphIndexPrefixAdapter(object):

1566

"""An adapter between GraphIndex with different key lengths.

1567

1568

Queries against this will emit queries against the adapted Graph with the

1569

prefix added, queries for all items use iter_entries_prefix. The returned

1570

nodes will have their keys and node references adjusted to remove the

1571

prefix. Finally, an add_nodes_callback can be supplied - when called the

1572

nodes and references being added will have prefix prepended.

1573

"""

1574

1575

def __init__(self, adapted, prefix, missing_key_length,

1576

add_nodes_callback=None):

1577

"""Construct an adapter against adapted with prefix."""

1578

self.adapted = adapted

1579

self.prefix_key = prefix + (None,)*missing_key_length

1580

self.prefix = prefix

1581

self.prefix_len = len(prefix)

1582

self.add_nodes_callback = add_nodes_callback

1583

1584

def add_nodes(self, nodes):

1585

"""Add nodes to the index.

1586

1587

:param nodes: An iterable of (key, node_refs, value) entries to add.

1588

"""

1589

# save nodes in case its an iterator

1590

nodes = tuple(nodes)

1591

translated_nodes = []

1592

try:

1593

# Add prefix_key to each reference node_refs is a tuple of tuples,

1594

# so split it apart, and add prefix_key to the internal reference

1595

for (key, value, node_refs) in nodes:

1596

adjusted_references = (

1597

tuple(tuple(self.prefix + ref_node for ref_node in ref_list)

1598

for ref_list in node_refs))

1599

translated_nodes.append((self.prefix + key, value,

1600

adjusted_references))

1601

except ValueError:

1602

# XXX: TODO add an explicit interface for getting the reference list

1603

# status, to handle this bit of user-friendliness in the API more

1604

# explicitly.

1605

for (key, value) in nodes:

1606

translated_nodes.append((self.prefix + key, value))

1607

self.add_nodes_callback(translated_nodes)

1608

1609

def add_node(self, key, value, references=()):

1610

"""Add a node to the index.

1611

1612

:param key: The key. keys are non-empty tuples containing

1613

as many whitespace-free utf8 bytestrings as the key length

1614

defined for this index.

1615

:param references: An iterable of iterables of keys. Each is a

1616

reference to another key.

1617

:param value: The value to associate with the key. It may be any

1618

bytes as long as it does not contain \0 or \n.

1619

"""

1620

self.add_nodes(((key, value, references), ))

1621

1622

def _strip_prefix(self, an_iter):

1623

"""Strip prefix data from nodes and return it."""

1624

for node in an_iter:

1625

# cross checks

1626

if node[1][:self.prefix_len] != self.prefix:

1627

raise errors.BadIndexData(self)

1628

for ref_list in node[3]:

1629

for ref_node in ref_list:

1630

if ref_node[:self.prefix_len] != self.prefix:

1631

raise errors.BadIndexData(self)

1632

yield node[0], node[1][self.prefix_len:], node[2], (

1633

tuple(tuple(ref_node[self.prefix_len:] for ref_node in ref_list)

1634

for ref_list in node[3]))

1635

1636

def iter_all_entries(self):

1637

"""Iterate over all keys within the index

1638

1639

iter_all_entries is implemented against the adapted index using

1640

iter_entries_prefix.

1641

1642

:return: An iterable of (index, key, reference_lists, value). There is no

1643

defined order for the result iteration - it will be in the most

1644

efficient order for the index (in this case dictionary hash order).

1645

"""

1646

return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

1647

1648

def iter_entries(self, keys):

1649

"""Iterate over keys within the index.

1650

1651

:param keys: An iterable providing the keys to be retrieved.

1652

:return: An iterable of (index, key, value, reference_lists). There is no

1653

defined order for the result iteration - it will be in the most

1654

efficient order for the index (keys iteration order in this case).

1655

"""

1656

return self._strip_prefix(self.adapted.iter_entries(

1657

self.prefix + key for key in keys))

1658

1659

def iter_entries_prefix(self, keys):

1660

"""Iterate over keys within the index using prefix matching.

1661

1662

Prefix matching is applied within the tuple of a key, not to within

1663

the bytestring of each key element. e.g. if you have the keys ('foo',

1664

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1665

only the former key is returned.

1666

1667

:param keys: An iterable providing the key prefixes to be retrieved.

1668

Each key prefix takes the form of a tuple the length of a key, but

1669

with the last N elements 'None' rather than a regular bytestring.

1670

The first element cannot be 'None'.

1671

:return: An iterable as per iter_all_entries, but restricted to the

1672

keys with a matching prefix to those supplied. No additional keys

1673

will be returned, and every match that is in the index will be

1674

returned.

1675

"""

1676

return self._strip_prefix(self.adapted.iter_entries_prefix(

1677

self.prefix + key for key in keys))

1678

1679

def key_count(self):

1680

"""Return an estimate of the number of keys in this index.

1681

1682

For GraphIndexPrefixAdapter this is relatively expensive - key

1683

iteration with the prefix is done.

1684

"""

1685

return len(list(self.iter_all_entries()))

1686

1687

def validate(self):

1688

"""Call the adapted's validate."""

1689

self.adapted.validate()

Older »