~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Aaron Bentley
Date: 2006-06-21 14:30:57 UTC
mfrom: (1801.1.1 bzr.dev)
mto: This revision was merged to the branch mainline in revision 1803.
Revision ID: abentley@panoramicfeedback.com-20060621143057-776e4b8d707e430e

Install benchmarks. (Jelmer Vernooij)

files added:
NEWS.developers

build-api

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_emptytree.py

bzrlib/tests/test_escaped_store.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/README.1st

files removed:
COPYING.txt

bzr.ico

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_export_c_api.h

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_import_c_api.h

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_interned_pyx.pxd

bzrlib/_static_tuple_interned_pyx.pyx

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/api.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/cache_utf8.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/email_message.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inventory_delta.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/pack.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/revisiontree.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/tag.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__static_tuple_interned.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/timestamp.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/ftp

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/log.py

bzrlib/transport/nosmart.py

bzrlib/transport/remote.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/views.py

bzrlib/workingtree_4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

doc/BUILD-NOTES

doc/Makefile

doc/_static

doc/_static/bzr icon 16.png

doc/_static/bzr.ico

doc/_static/en

doc/_static/en/quick-reference

doc/_static/en/quick-reference/Makefile

doc/_static/en/quick-reference/bzr-quick-reference.pdf

doc/_static/en/quick-reference/bzr-quick-reference.png

doc/_static/en/quick-reference/bzr-quick-reference.svg

doc/_templates

doc/_templates/index.html

doc/_templates/layout.html

doc/bazaar-vcs.org.kid

doc/conf.py

doc/contents.txt

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-for-2x.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/developer-guide

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/Makefile

doc/es/quick-reference/quick-start-summary.pdf

doc/es/quick-reference/quick-start-summary.png

doc/es/quick-reference/quick-start-summary.svg

doc/es/release-notes

doc/es/user-guide

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/es/user-reference

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/make.bat

doc/news-template.txt

doc/ru

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/Makefile

doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/quick-reference/quick-start-summary.png

doc/ru/quick-reference/quick-start-summary.svg

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/check-newsbugs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files renamed:
doc/en/developer-guide/HACKING.txt => HACKING

bzrlib/bundle/serializer/v08.py => bzrlib/bundle/serializer/v07.py

bzrlib/deprecated_graph.py => bzrlib/graph.py

bzrlib/_patiencediff_py.py => bzrlib/patiencediff.py

bzrlib/tests/http_utils.py => bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/blackbox/test_send.py => bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/per_branch/ => bzrlib/tests/branch_implementations/

bzrlib/tests/per_bzrdir/ => bzrlib/tests/bzrdir_implementations/

bzrlib/tests/per_interrepository/ => bzrlib/tests/interrepository_implementations/

bzrlib/tests/per_repository/ => bzrlib/tests/repository_implementations/

bzrlib/tests/test_commands.py => bzrlib/tests/test_command.py

bzrlib/tests/test_deprecated_graph.py => bzrlib/tests/test_graph.py

bzrlib/tests/test_revisionspec.py => bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/per_repository/test_revision.py => bzrlib/tests/test_revprops.py

bzrlib/tests/per_transport.py => bzrlib/tests/test_transport_implementations.py

bzrlib/tests/per_versionedfile.py => bzrlib/tests/test_versionedfile.py

bzrlib/tests/per_workingtree/ => bzrlib/tests/workingtree_implementations/

bzrlib/transport/ftp/__init__.py => bzrlib/transport/ftp.py

bzrlib/win32utils.py => bzrlib/win32console.py

bzrlib/xml8.py => bzrlib/xml5.py

bzrlib/help_topics/en/configuration.txt => doc/configuration.txt

doc/en/user-guide/plugins.txt => doc/plugins.txt

doc/en/user-guide/setting_up_email.txt => doc/setting_up_email.txt

doc/en/user-guide/specifying_revisions.txt => doc/specifying_revisions.txt

doc/en/tutorials/tutorial.txt => doc/tutorial.txt

doc/en/user-guide/using_aliases.txt => doc/using_aliases.txt

tools/generate_docs.py => generate_docs.py

bzrlib/doc_generate/ => tools/doc_generate/

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml_serializer.py

contrib/bash/bzr.simple

contrib/newinventory.py

contrib/pwclient.full

profile_imports.py

setup.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/trace-revisions

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

)

# NOTE(review): presumably the (offset, length) range requested to read the
# index header; it is not used in the code visible here - confirm.
_HEADER_READV = (0, 200)
# Prefixes of the three option lines that follow the signature. They are
# written by GraphIndexBuilder.finish() and checked, in the order
# node_ref_lists / key_elements / len, by GraphIndex._read_prefix().
_OPTION_KEY_ELEMENTS = "key_elements="
_OPTION_LEN = "len="
_OPTION_NODE_REFS = "node_ref_lists="
# First line of a serialised index, emitted by GraphIndexBuilder.finish().
_SIGNATURE = "Bazaar Graph Index 1\n"

# Matches any byte that may not appear in a key element (tab, newline,
# vertical tab, form feed, carriage return, NUL or space); used by
# GraphIndexBuilder._check_key().
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')
# Matches a newline or a NUL, neither of which may appear in a value; used by
# GraphIndexBuilder._check_key_ref_value().
_newline_null_re = re.compile('[\n\0]')

def _has_key_from_parent_map(self, key):

"""Check if this index has one key.

If it's possible to check for multiple keys at once through

calling get_parent_map that should be faster.

"""

return (key in self.get_parent_map([key]))

def _missing_keys_from_parent_map(self, keys):

return set(keys) - set(self.get_parent_map(keys))

class GraphIndexBuilder(object):
    """A builder that can build a GraphIndex.

    The resulting graph has the structure::

      _SIGNATURE OPTIONS NODES NEWLINE
      _SIGNATURE     := 'Bazaar Graph Index 1' NEWLINE
      OPTIONS        := NODE_REF_LISTS KEY_ELEMENTS LEN
      NODE_REF_LISTS := 'node_ref_lists=' DIGITS NEWLINE
      KEY_ELEMENTS   := 'key_elements=' DIGITS NEWLINE
      LEN            := 'len=' DIGITS NEWLINE
      NODES          := NODE*
      NODE           := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
      KEY            := KEY_ELEMENT (NULL KEY_ELEMENT){key_elements - 1}
      KEY_ELEMENT    := Not-whitespace-utf8
      ABSENT         := 'a'
      REFERENCES     := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
      REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?
      REFERENCE      := DIGITS  ; digits is the byte offset in the index of the
                                ; referenced key.
      VALUE          := no-newline-no-null-bytes

    NOTE(review): _external_references() and find_ancestry() call
    iter_all_entries() and iter_entries(), which are not defined in this
    class as shown; presumably a subclass supplies them - confirm.
    """

    def __init__(self, reference_lists=0, key_elements=1):
        """Create a GraphIndex builder.

        :param reference_lists: The number of node references lists for each
            entry.
        :param key_elements: The number of bytestrings in each key.
        """
        self.reference_lists = reference_lists
        # Keys added through add_node (absent placeholders are not included).
        self._keys = set()
        # A dict of {key: (absent, ref_lists, value)}
        self._nodes = {}
        # Nested-dict view of _nodes, built on demand by _get_nodes_by_key.
        self._nodes_by_key = None
        self._key_length = key_elements
        self._optimize_for_size = False
        self._combine_backing_indices = True

    def _check_key(self, key):
        """Raise BadIndexKey if key is not a valid key for this index.

        A valid key is a tuple (subclasses included) of exactly
        self._key_length elements, each of them non-empty and free of the
        bytes matched by _whitespace_re.
        """
        if not isinstance(key, tuple):
            raise errors.BadIndexKey(key)
        if self._key_length != len(key):
            raise errors.BadIndexKey(key)
        for element in key:
            if not element or _whitespace_re.search(element) is not None:
                raise errors.BadIndexKey(element)

    def _external_references(self):
        """Return references that are not present in this index.

        :return: A set of keys found in the second reference list of some
            node but not themselves returned by iter_all_entries(). Always
            empty when there are fewer than two reference lists.
        """
        keys = set()
        refs = set()
        # TODO: JAM 2008-11-21 This makes an assumption about how the reference
        #       lists are used. It is currently correct for pack-0.92 through
        #       1.9, which use the node references (3rd column) second
        #       reference list as the compression parent. Perhaps this should
        #       be moved into something higher up the stack, since it
        #       makes assumptions about how the index is used.
        if self.reference_lists > 1:
            for node in self.iter_all_entries():
                keys.add(node[1])
                refs.update(node[3][1])
            return refs - keys
        else:
            # If reference_lists == 0 there can be no external references, and
            # if reference_lists == 1, then there isn't a place to store the
            # compression parent
            return set()

    def _get_nodes_by_key(self):
        """Return the nested-dict view of the present nodes, building it once.

        For a key of (foo, bar, baz) the leaf is found at
        result[foo][bar][baz] and holds (key, value, references) when the
        index has reference lists, or (key, value) otherwise. Absent nodes
        are left out.
        """
        if self._nodes_by_key is None:
            nodes_by_key = {}
            for key, (absent, references, value) in self._nodes.iteritems():
                if absent:
                    continue
                if self.reference_lists:
                    key_value = key, value, references
                else:
                    key_value = key, value
                key_dict = nodes_by_key
                for subkey in key[:-1]:
                    key_dict = key_dict.setdefault(subkey, {})
                key_dict[key[-1]] = key_value
            self._nodes_by_key = nodes_by_key
        return self._nodes_by_key

    def _update_nodes_by_key(self, key, value, node_refs):
        """Update the _nodes_by_key dict with a new key.

        For a key of (foo, bar, baz) create
        _nodes_by_key[foo][bar][baz] = key_value

        Does nothing when the nested view has not been built yet.
        """
        if self._nodes_by_key is None:
            return
        key_dict = self._nodes_by_key
        if self.reference_lists:
            key_value = key, value, node_refs
        else:
            key_value = key, value
        for subkey in key[:-1]:
            key_dict = key_dict.setdefault(subkey, {})
        key_dict[key[-1]] = key_value

    def _check_key_ref_value(self, key, references, value):
        """Check that 'key' and 'references' are all valid.

        :param key: A key tuple. Must conform to the key interface (be a tuple,
            be of the right length, not have any whitespace or nulls in any key
            element.)
        :param references: A sized collection of reference lists. Something
            like [[(ref, key)], [(ref, key), (other, key)]]
        :param value: The value associated with this key. Must not contain
            newlines or null characters.
        :return: (node_refs, absent_references)
            node_refs   basically a packed form of 'references' where all
                        iterables are tuples
            absent_references   reference keys that are not in self._nodes.
                                This may contain duplicates if the same key is
                                referenced in multiple lists.
        :raises BadIndexKey: if the key or an unknown reference is invalid.
        :raises BadIndexValue: if the value contains a newline or null, or if
            the number of reference lists is not self.reference_lists.
        """
        self._check_key(key)
        if _newline_null_re.search(value) is not None:
            raise errors.BadIndexValue(value)
        if len(references) != self.reference_lists:
            raise errors.BadIndexValue(references)
        node_refs = []
        absent_references = []
        for reference_list in references:
            # Materialise once so that a one-shot iterator is not exhausted by
            # the validation loop before it is stored.
            reference_list = tuple(reference_list)
            for reference in reference_list:
                # If reference *is* in self._nodes, then we know it has already
                # been checked.
                if reference not in self._nodes:
                    self._check_key(reference)
                    absent_references.append(reference)
            node_refs.append(reference_list)
        return tuple(node_refs), absent_references

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        :raises BadIndexDuplicateKey: if key was already added (a key that is
            only known as an absent reference may still be added).
        """
        (node_refs,
         absent_references) = self._check_key_ref_value(key, references, value)
        if key in self._nodes and self._nodes[key][0] != 'a':
            raise errors.BadIndexDuplicateKey(key, self)
        for reference in absent_references:
            # There may be duplicates, but I don't think it is worth worrying
            # about
            self._nodes[reference] = ('a', (), '')
        self._nodes[key] = ('', node_refs, value)
        self._keys.add(key)
        if self._nodes_by_key is not None and self._key_length > 1:
            self._update_nodes_by_key(key, value, node_refs)

    def finish(self):
        """Serialise every node recorded so far.

        :return: A StringIO holding the signature, the three option lines,
            one line per node (absent placeholders included) sorted by key,
            and a terminating newline.
        :raises BzrError: if reference lists are in use and the output length
            differs from the length computed in the pre-pass.
        """
        lines = [_SIGNATURE]
        lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
        lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
        lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')
        prefix_length = sum(len(x) for x in lines)
        # references are byte offsets. To avoid having to do nasty
        # polynomial work to resolve offsets (references to later in the
        # file cannot be determined until all the inbetween references have
        # been calculated too) we pad the offsets with 0's to make them be
        # of consistent length. Using binary offsets would break the trivial
        # file parsing.
        # to calculate the width of zero's needed we do three passes:
        # one to gather all the non-reference data and the number of references.
        # one to pad all the data with reference-length and determine entry
        # addresses.
        # One to serialise.

        # forward sorted by key. In future we may consider topological sorting,
        # at the cost of table scans for direct lookup, or a second index for
        # direct lookup
        nodes = sorted(self._nodes.items())
        # if we do not prepass, we don't know how long it will be up front.
        expected_bytes = None
        # we only need to pre-pass if we have reference lists at all.
        if self.reference_lists:
            key_offset_info = []
            non_ref_bytes = prefix_length
            total_references = 0
            # TODO use simple multiplication for the constants in this loop.
            for key, (absent, references, value) in nodes:
                # record the offset known *so far* for this key:
                # the non reference bytes to date, and the total references to
                # date - saves reaccumulating on the second pass
                key_offset_info.append((key, non_ref_bytes, total_references))
                # key is literal, value is literal, there are 3 null's, 1 NL
                # key is variable length tuple, \x00 between elements
                non_ref_bytes += sum(len(element) for element in key)
                if self._key_length > 1:
                    non_ref_bytes += self._key_length - 1
                # value is literal bytes, there are 3 null's, 1 NL.
                non_ref_bytes += len(value) + 3 + 1
                # one byte for absent if set.
                if absent:
                    non_ref_bytes += 1
                else:
                    # (ref_lists -1) tabs
                    non_ref_bytes += self.reference_lists - 1
                    # (ref-1 cr's per ref_list)
                    for ref_list in references:
                        # how many references across the whole file?
                        total_references += len(ref_list)
                        # accrue reference separators
                        if ref_list:
                            non_ref_bytes += len(ref_list) - 1
            # how many digits are needed to represent the total byte count?
            digits = 1
            possible_total_bytes = non_ref_bytes + total_references*digits
            while 10 ** digits < possible_total_bytes:
                digits += 1
                possible_total_bytes = non_ref_bytes + total_references*digits
            expected_bytes = possible_total_bytes + 1 # terminating newline
            # resolve key addresses.
            key_addresses = {}
            for key, non_ref_bytes, total_references in key_offset_info:
                key_addresses[key] = non_ref_bytes + total_references*digits
            # serialise
            format_string = '%%0%sd' % digits
        for key, (absent, references, value) in nodes:
            flattened_references = []
            for ref_list in references:
                ref_addresses = []
                for reference in ref_list:
                    ref_addresses.append(format_string % key_addresses[reference])
                flattened_references.append('\r'.join(ref_addresses))
            string_key = '\x00'.join(key)
            lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,
                '\t'.join(flattened_references), value))
        lines.append('\n')
        result = StringIO(''.join(lines))
        if expected_bytes and len(result.getvalue()) != expected_bytes:
            raise errors.BzrError('Failed index creation. Internal error:'
                ' mismatched output length and expected length: %d %d' %
                (len(result.getvalue()), expected_bytes))
        return result

    def set_optimize(self, for_size=None, combine_backing_indices=None):
        """Change how the builder tries to optimize the result.

        :param for_size: Tell the builder to try and make the index as small as
            possible.
        :param combine_backing_indices: If the builder spills to disk to save
            memory, should the on-disk indices be combined. Set to True if you
            are going to be probing the index, but to False if you are not. (If
            you are not querying, then the time spent combining is wasted.)
        :return: None
        """
        # GraphIndexBuilder itself doesn't pay attention to the flag yet, but
        # other builders do.
        if for_size is not None:
            self._optimize_for_size = for_size
        if combine_backing_indices is not None:
            self._combine_backing_indices = combine_backing_indices

    def find_ancestry(self, keys, ref_list_num):
        """See CombinedGraphIndex.find_ancestry()

        Starting from keys, repeatedly follows reference list ref_list_num of
        every entry yielded by iter_entries().

        :return: (parent_map, missing_keys) where parent_map maps each key
            found to its references in that list, and missing_keys is the
            set of requested or referenced keys that were not found.
        """
        pending = set(keys)
        parent_map = {}
        missing_keys = set()
        while pending:
            next_pending = set()
            for _, key, value, ref_lists in self.iter_entries(pending):
                parent_keys = ref_lists[ref_list_num]
                parent_map[key] = parent_keys
                next_pending.update([p for p in parent_keys if p not in
                                     parent_map])
                missing_keys.update(pending.difference(parent_map))
            pending = next_pending
        return parent_map, missing_keys

351

352

353

class GraphIndex(object):

354

"""An index for data with embedded graphs.

355

356

The index maps keys to a list of key reference lists, and a value.

357

Each node has the same number of key reference lists. Each key reference

358

list can be empty or an arbitrary length. The value is an opaque NULL

359

terminated string without any newlines. The storage of the index is

360

hidden in the interface: keys and key references are always tuples of

361

bytestrings, never the internal representation (e.g. dictionary offsets).

362

363

It is presumed that the index will not be mutated - it is static data.

364

365

Successive iter_all_entries calls will read the entire index each time.

366

Additionally, iter_entries calls will read the index linearly until the

367

desired keys are found. XXX: This must be fixed before the index is

368

suitable for production use. :XXX

369

"""

370

371

def __init__(self, transport, name, size):

372

"""Open an index called name on transport.

373

374

:param transport: A bzrlib.transport.Transport.

375

:param name: A path to provide to transport API calls.

376

:param size: The size of the index in bytes. This is used for bisection

377

logic to perform partial index reads. While the size could be

378

obtained by statting the file this introduced an additional round

379

trip as well as requiring stat'able transports, both of which are

380

avoided by having it supplied. If size is None, then bisection

381

support will be disabled and accessing the index will just stream

382

all the data.

383

"""

384

self._transport = transport

385

self._name = name

386

# Becomes a dict of key:(value, reference-list-byte-locations) used by

387

# the bisection interface to store parsed but not resolved keys.

388

self._bisect_nodes = None

389

# Becomes a dict of key:(value, reference-list-keys) which are ready to

390

# be returned directly to callers.

391

self._nodes = None

392

# a sorted list of slice-addresses for the parsed bytes of the file.

393

# e.g. (0,1) would mean that byte 0 is parsed.

394

self._parsed_byte_map = []

395

# a sorted list of keys matching each slice address for parsed bytes

396

# e.g. (None, 'foo@bar') would mean that the first byte contained no

397

# key, and the end byte of the slice is the of the data for 'foo@bar'

398

self._parsed_key_map = []

399

self._key_count = None

400

self._keys_by_offset = None

401

self._nodes_by_key = None

402

self._size = size

403

# The number of bytes we've read so far in trying to process this file

404

self._bytes_read = 0

405

406

def __eq__(self, other):

407

"""Equal when self and other were created with the same parameters."""

408

return (

409

type(self) == type(other) and

410

self._transport == other._transport and

411

self._name == other._name and

412

self._size == other._size)

413

414

def __ne__(self, other):

415

return not self.__eq__(other)

416

417

def __repr__(self):

418

return "%s(%r)" % (self.__class__.__name__,

419

self._transport.abspath(self._name))

420

421

def _buffer_all(self, stream=None):

422

"""Buffer all the index data.

423

424

Mutates self._nodes and self.keys_by_offset.

425

"""

426

if self._nodes is not None:

427

# We already did this

428

return

429

if 'index' in debug.debug_flags:

430

mutter('Reading entire index %s', self._transport.abspath(self._name))

431

if stream is None:

432

stream = self._transport.get(self._name)

433

self._read_prefix(stream)

434

self._expected_elements = 3 + self._key_length

435

line_count = 0

436

# raw data keyed by offset

437

self._keys_by_offset = {}

438

# ready-to-return key:value or key:value, node_ref_lists

439

self._nodes = {}

440

self._nodes_by_key = None

441

trailers = 0

442

pos = stream.tell()

443

lines = stream.read().split('\n')

444

del lines[-1]

445

_, _, _, trailers = self._parse_lines(lines, pos)

446

for key, absent, references, value in self._keys_by_offset.itervalues():

447

if absent:

448

continue

449

# resolve references:

450

if self.node_ref_lists:

451

node_value = (value, self._resolve_references(references))

452

else:

453

node_value = value

454

self._nodes[key] = node_value

455

# cache the keys for quick set intersections

456

self._keys = set(self._nodes)

457

if trailers != 1:

458

# there must be one line - the empty trailer line.

459

raise errors.BadIndexData(self)

460

461

def external_references(self, ref_list_num):
    """Return references that are not present in this index.

    The whole index is buffered first.

    :param ref_list_num: Which reference list of every node to inspect.
    :return: The set of keys referenced in that list by some node but not
        themselves keys of this index.
    :raises ValueError: if the index has no reference list with that number.
    """
    self._buffer_all()
    if self.node_ref_lists < ref_list_num + 1:
        raise ValueError('No ref list %d, index has %d ref lists'
            % (ref_list_num, self.node_ref_lists))
    referenced = set()
    for _key, (_value, ref_lists) in self._nodes.iteritems():
        referenced.update(ref_lists[ref_list_num])
    return referenced - self._keys

473

474

def _get_nodes_by_key(self):

475

if self._nodes_by_key is None:

476

nodes_by_key = {}

477

if self.node_ref_lists:

478

for key, (value, references) in self._nodes.iteritems():

479

key_dict = nodes_by_key

480

for subkey in key[:-1]:

481

key_dict = key_dict.setdefault(subkey, {})

482

key_dict[key[-1]] = key, value, references

483

else:

484

for key, value in self._nodes.iteritems():

485

key_dict = nodes_by_key

486

for subkey in key[:-1]:

487

key_dict = key_dict.setdefault(subkey, {})

488

key_dict[key[-1]] = key, value

489

self._nodes_by_key = nodes_by_key

490

return self._nodes_by_key

491

492

def iter_all_entries(self):
    """Iterate over all keys within the index.

    The whole index is buffered first if that has not happened yet.

    :return: An iterable of (index, key, value) or
        (index, key, value, reference_lists). The former tuple is used when
        there are no reference lists in the index, making the API
        compatible with simple key:value index types. There is no defined
        order for the result iteration - it will be in the most efficient
        order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    with_refs = self.node_ref_lists
    for key, node in self._nodes.iteritems():
        if with_refs:
            value, node_ref_lists = node
            yield self, key, value, node_ref_lists
        else:
            yield self, key, node

512

513

def _read_prefix(self, stream):
    """Read and validate the signature and the three option lines.

    On success self.node_ref_lists, self._key_length and self._key_count
    hold the integers parsed from the node_ref_lists, key_elements and len
    option lines, which must appear in that order.

    :param stream: A file-like object positioned at the signature.
    :raises BadIndexFormatSignature: if the signature does not match.
    :raises BadIndexOptions: if an option line has the wrong prefix or a
        value that is not an integer.
    """
    expected_signature = self._signature()
    if stream.read(len(expected_signature)) != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)

    def read_int_option(prefix):
        # Consume one option line and return the integer after its prefix;
        # the final character (the newline) is not part of the number.
        option_line = stream.readline()
        if not option_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            return int(option_line[len(prefix):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = read_int_option(_OPTION_NODE_REFS)
    self._key_length = read_int_option(_OPTION_KEY_ELEMENTS)
    self._key_count = read_int_option(_OPTION_LEN)

538

539

def _resolve_references(self, references):

540

"""Return the resolved key references for references.

541

542

References are resolved by looking up the location of the key in the

543

_keys_by_offset map and substituting the key name, preserving ordering.

544

545

:param references: An iterable of iterables of key locations. e.g.

546

[[123, 456], [123]]

547

:return: A tuple of tuples of keys.

548

"""

549

node_refs = []

550

for ref_list in references:

551

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

552

return tuple(node_refs)

553

554

def _find_index(self, range_map, key):

555

"""Helper for the _parsed_*_index calls.

556

557

Given a range map - [(start, end), ...], finds the index of the range

558

in the map for key if it is in the map, and if it is not there, the

559

immediately preceeding range in the map.

560

"""

561

result = bisect_right(range_map, key) - 1

562

if result + 1 < len(range_map):

563

# check the border condition, it may be in result + 1

564

if range_map[result + 1][0] == key[0]:

565

return result + 1

566

return result

567

568

def _parsed_byte_index(self, offset):

569

"""Return the index of the entry immediately before offset.

570

571

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

572

there is one unparsed byte (the 11th, addressed as[10]). then:

573

asking for 0 will return 0

574

asking for 10 will return 0

575

asking for 11 will return 1

576

asking for 12 will return 1

577

"""

578

key = (offset, 0)

579

return self._find_index(self._parsed_byte_map, key)

580

581

def _parsed_key_index(self, key):

582

"""Return the index of the entry immediately before key.

583

584

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

585

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

586

have been parsed, then:

587

asking for '' will return 0

588

asking for 'a' will return 0

589

asking for 'b' will return 1

590

asking for 'e' will return 1

591

"""

592

search_key = (key, None)

593

return self._find_index(self._parsed_key_map, search_key)

594

595

def _is_parsed(self, offset):

596

"""Returns True if offset has been parsed."""

597

index = self._parsed_byte_index(offset)

598

if index == len(self._parsed_byte_map):

599

return offset < self._parsed_byte_map[index - 1][1]

600

start, end = self._parsed_byte_map[index]

601

return offset >= start and offset < end

602

603

def _iter_entries_from_total_buffer(self, keys):

604

"""Iterate over keys when the entire index is parsed."""

605

keys = keys.intersection(self._keys)

606

if self.node_ref_lists:

607

for key in keys:

608

value, node_refs = self._nodes[key]

609

yield self, key, value, node_refs

610

else:

611

for key in keys:

612

yield self, key, self._nodes[key]

613

614

def iter_entries(self, keys):
    """Iterate over keys within the index.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys supplied. No additional keys will be returned, and every
        key supplied that is in the index will be returned.
    """
    wanted = set(keys)
    if not wanted:
        return []
    # Without a known size bisection is impossible, so read everything.
    if self._size is None and self._nodes is None:
        self._buffer_all()

    # We fit about 20 keys per minimum-read (4K), so if we are looking for
    # more than 1/20th of the index its likely (assuming homogenous key
    # spread) that we'll read the entire index. If we're going to do that,
    # buffer the whole thing. A better analysis might take key spread into
    # account - but B+Tree indices are better anyway.
    # We could look at all data read, and use a threshold there, which will
    # trigger on ancestry walks, but that is not yet fully mapped out.
    if self._nodes is None and len(wanted) * 20 > self.key_count():
        self._buffer_all()
    if self._nodes is None:
        return (result[1] for result in bisect_multi_bytes(
            self._lookup_keys_via_location, self._size, wanted))
    return self._iter_entries_from_total_buffer(wanted)

642

643

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not within the
    bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    WARNING: Note that this method currently causes a full index parse
    unconditionally (which is reasonably appropriate as it is a means for
    thunking many small indices into one larger one and still supplies
    iter_all_entries at the thunk layer).

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned. Prefixes that match nothing yield nothing.
    :raises errors.BadIndexKey: If a prefix starts with None or does not
        have the same number of elements as the index's keys.
    """
    keys = set(keys)
    if not keys:
        return
    # load data - also finds key lengths
    if self._nodes is None:
        self._buffer_all()
    if self._key_length == 1:
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            try:
                node = self._nodes[key]
            except KeyError:
                # A key that is not in the index has no match; skip it,
                # just as the multi-element branch below does.
                continue
            if self.node_ref_lists:
                value, node_refs = node
                yield self, key, value, node_refs
            else:
                yield self, key, node
        return
    nodes_by_key = self._get_nodes_by_key()
    for key in keys:
        # sanity check
        if key[0] is None:
            raise errors.BadIndexKey(key)
        if len(key) != self._key_length:
            raise errors.BadIndexKey(key)
        # find what it refers to:
        key_dict = nodes_by_key
        elements = list(key)
        # find the subdict whose contents should be returned.
        try:
            while len(elements) and elements[0] is not None:
                key_dict = key_dict[elements[0]]
                elements.pop(0)
        except KeyError:
            # a non-existent lookup.
            continue
        if len(elements):
            # Trailing None elements remain: walk the whole subtree.
            dicts = [key_dict]
            while dicts:
                key_dict = dicts.pop(-1)
                # can't be empty or would not exist; peek at one value to
                # learn whether this level holds sub-dicts or leaf tuples.
                value = key_dict.itervalues().next()
                if type(value) == dict:
                    # push keys
                    dicts.extend(key_dict.itervalues())
                else:
                    # yield keys
                    for value in key_dict.itervalues():
                        # each value is the key:value:node refs tuple
                        # ready to yield.
                        yield (self, ) + value
        else:
            # the last thing looked up was a terminal element
            yield (self, ) + key_dict

720

721

def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):
    """See BTreeIndex._find_ancestors.

    Implemented as a thin layer over iter_entries; not efficient, but it
    does the job.

    :param keys: The keys to look up in this index.
    :param ref_list_num: Which reference list of each entry holds the
        parent keys.
    :param parent_map: Dict updated in place with key => parent keys for
        every key found.
    :param missing_keys: Set updated in place with the requested keys
        that were not found.
    :return: The set of parent keys seen that are not yet in parent_map.
    """
    located = set()
    parents_seen = set()
    for _index, key, _value, refs in self.iter_entries(keys):
        parent_keys = refs[ref_list_num]
        located.add(key)
        parent_map[key] = parent_keys
        parents_seen.update(parent_keys)
    # Anything requested but not located is missing from this index.
    missing_keys.update(set(keys) - located)
    parents_seen.difference_update(parent_map)
    return parents_seen

737

738

def key_count(self):
    """Return an estimate of the number of keys in this index.

    For GraphIndex the estimate is exact. If the count is not known yet,
    the header range is read and parsed first.
    """
    count = self._key_count
    if count is None:
        self._read_and_parse([_HEADER_READV])
        count = self._key_count
    return count

746

747

def _lookup_keys_via_location(self, location_keys):
    """Public interface for implementing bisection.

    If _buffer_all has been called, then all the data for the index is in
    memory, and this method should not be called, as it uses a separate
    cache because it cannot pre-resolve all indices, which buffer_all does
    for performance.

    :param location_keys: A list of location(byte offset), key tuples.
    :return: A list of (location_key, result) tuples as expected by
        bzrlib.bisect_multi.bisect_multi_bytes.
    """
    # Possible improvements:
    #  - only bisect lookup each key once
    #  - sort the keys first, and use that to reduce the bisection window
    # -----
    # Three phases: read data, parse it, then answer from what is now in
    # memory.

    def span_at(start):
        # Probe 800 bytes per location (much more than any row seen so
        # far), clamped so the read never runs past the end of the file.
        return min(800, self._size - start)

    to_read = []
    for location, key in location_keys:
        if self._bisect_nodes and key in self._bisect_nodes:
            # Already parsed this key.
            continue
        slot = self._parsed_key_index(key)
        if (len(self._parsed_key_map) and
            self._parsed_key_map[slot][0] <= key and
            (self._parsed_key_map[slot][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[slot][1] == self._size)):
            # The key's region is parsed, so no read is needed even if the
            # key turns out to be absent.
            continue
        slot = self._parsed_byte_index(location)
        if (len(self._parsed_byte_map) and
            self._parsed_byte_map[slot][0] <= location and
            self._parsed_byte_map[slot][1] > location):
            # This byte region was parsed already; nothing to read.
            continue
        span = span_at(location)
        # todo, trim out parsed locations.
        if span > 0:
            to_read.append((location, span))
    # read the header if needed
    if self._bisect_nodes is None:
        to_read.append(_HEADER_READV)
    self._read_and_parse(to_read)
    answers = []
    if self._nodes is not None:
        # _read_and_parse ended up buffering the whole index, so answer
        # everything straight from the full node table.
        for location, key in location_keys:
            probe = (location, key)
            if key not in self._nodes:
                answers.append((probe, False))
            elif self.node_ref_lists:
                value, refs = self._nodes[key]
                answers.append((probe, (self, key, value, refs)))
            else:
                answers.append((probe, (self, key, self._nodes[key])))
        return answers
    # Work out, per probe: present, absent, or which direction to bisect.
    # Present keys whose references are not all parsed yet are deferred.
    deferred = []
    ref_offsets = set()
    for location, key in location_keys:
        probe = (location, key)
        if key in self._bisect_nodes:
            if not self.node_ref_lists:
                answers.append(
                    (probe, (self, key, self._bisect_nodes[key])))
                continue
            value, refs = self._bisect_nodes[key]
            # References are byte offsets; some may not be parsed yet.
            unparsed = [ref for ref_list in refs for ref in ref_list
                        if ref not in self._keys_by_offset]
            if unparsed:
                ref_offsets.update(unparsed)
                deferred.append(probe)
            else:
                answers.append((probe, (self, key,
                    value, self._resolve_references(refs))))
            continue
        # Has the region the key should live in been parsed?
        slot = self._parsed_key_index(key)
        if (self._parsed_key_map[slot][0] <= key and
            (self._parsed_key_map[slot][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[slot][1] == self._size)):
            answers.append((probe, False))
            continue
        # Not parsed: tell the bisector whether the key sorts below or
        # above the region that was parsed around the probed location.
        slot = self._parsed_byte_index(location)
        if key < self._parsed_key_map[slot][0]:
            answers.append((probe, -1))
        else:
            answers.append((probe, +1))
    # Read the data needed to resolve the deferred references.
    to_read = []
    for location in ref_offsets:
        span = span_at(location)
        # TODO: trim out parsed locations (e.g. if the 800 is into the
        # parsed region trim it, and dont use the adjust_for_latency
        # facility)
        if span > 0:
            to_read.append((location, span))
    self._read_and_parse(to_read)
    if self._nodes is not None:
        # The second read buffered the whole index; use the full table.
        for location, key in deferred:
            value, refs = self._nodes[key]
            answers.append(((location, key), (self, key, value, refs)))
        return answers
    for location, key in deferred:
        # Answer the keys whose references had to be looked up late.
        value, refs = self._bisect_nodes[key]
        answers.append(((location, key), (self, key,
            value, self._resolve_references(refs))))
    return answers

888

889

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    Sets node_ref_lists, _key_length and _key_count from the three option
    lines, marks the header bytes as parsed and resets the bisection
    parsing state.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data (which may have length 0).
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if signature != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(expected_signature):].splitlines()
    # The option lines come in a fixed order; each is a prefix followed
    # by an integer.
    option_specs = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for line_number, (prefix, attribute) in enumerate(option_specs):
        options_line = lines[line_number]
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            parsed_value = int(options_line[len(prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed_value)
    # Bytes consumed: the signature, three option lines and the newline
    # that ends each of them.
    header_end = len(signature) + sum([len(line) for line in lines[:3]]) + 3
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

932

933

def _parse_region(self, offset, data):
    """Parse node data returned from a readv operation.

    The data is handed to _parse_segment one segment at a time until a
    segment reports that it was the last one, or until the remaining data
    ends inside an already parsed range.

    :param offset: The byte offset the data starts at.
    :param data: The data to parse.
    """
    stop = offset + len(data)
    cursor = offset
    finished = False
    while not finished:
        region = self._parsed_byte_index(cursor)
        if stop < self._parsed_byte_map[region][1]:
            # The data ends inside the parsed range at or below the
            # cursor, so there is nothing new to parse.
            break
        cursor, finished = self._parse_segment(offset, data, stop, region)

955

956

def _parse_segment(self, offset, data, end, index):
    """Parse one segment of data.

    :param offset: Where 'data' begins in the file.
    :param data: Some data to parse a segment of.
    :param end: Where data ends
    :param index: The current index into the parsed bytes map.
    :return: high_parsed_byte, last_segment.
        high_parsed_byte is the location of the highest parsed byte in this
        segment, last_segment is True if the parsed segment is the last
        possible one in the data block.
    :raises AssertionError: If a newline needed for trimming is not
        present, or if nothing is left to parse after trimming.
    """
    # default is to use all data
    trim_end = None
    # accommodate overlap with data before this.
    if offset < self._parsed_byte_map[index][1]:
        # overlaps the lower parsed region
        # skip the parsed data
        trim_start = self._parsed_byte_map[index][1] - offset
        # don't trim the start for \n
        start_adjacent = True
    elif offset == self._parsed_byte_map[index][1]:
        # abuts the lower parsed region
        # use all data
        trim_start = None
        # do not trim anything
        start_adjacent = True
    else:
        # does not overlap the lower parsed region
        # use all data
        trim_start = None
        # but trim the leading \n
        start_adjacent = False
    if end == self._size:
        # lines up to the end of all data:
        # use it all
        trim_end = None
        # do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif index + 1 == len(self._parsed_byte_map):
        # at the end of the parsed data
        # use it all
        trim_end = None
        # but strip to the last \n
        end_adjacent = False
        last_segment = True
    elif end == self._parsed_byte_map[index + 1][0]:
        # butts up against the next parsed region
        # use it all
        trim_end = None
        # do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif end > self._parsed_byte_map[index + 1][0]:
        # overlaps into the next parsed region
        # only consider the unparsed data
        trim_end = self._parsed_byte_map[index + 1][0] - offset
        # do not strip to the last \n as we know its an entire record
        end_adjacent = True
        last_segment = end < self._parsed_byte_map[index + 1][1]
    else:
        # does not overlap into the next region
        # use it all
        trim_end = None
        # but strip to the last \n
        end_adjacent = False
        last_segment = True
    # now find bytes to discard if needed
    if not start_adjacent:
        # work around python bug in rfind
        if trim_start is None:
            trim_start = data.find('\n') + 1
        else:
            trim_start = data.find('\n', trim_start) + 1
        if not (trim_start != 0):
            raise AssertionError('no \n was present')
    if not end_adjacent:
        # work around python bug in rfind
        if trim_end is None:
            trim_end = data.rfind('\n') + 1
        else:
            trim_end = data.rfind('\n', None, trim_end) + 1
        if not (trim_end != 0):
            raise AssertionError('no \n was present')
    # adjust offset and data to the parseable data.
    trimmed_data = data[trim_start:trim_end]
    if not (trimmed_data):
        # trim_start and trim_end are frequently None here, so they are
        # formatted with %s: %d would raise TypeError and hide this
        # assertion.
        raise AssertionError('read unneeded data [%s:%s] from [%d:%d]'
            % (trim_start, trim_end, offset, offset + len(data)))
    if trim_start:
        offset += trim_start
    # splitlines mangles the \r delimiters.. don't use it.
    lines = trimmed_data.split('\n')
    # The text after the final \n is not a complete line; drop it.
    del lines[-1]
    pos = offset
    first_key, last_key, nodes, _ = self._parse_lines(lines, pos)
    for key, value in nodes:
        self._bisect_nodes[key] = value
    self._parsed_bytes(offset, first_key,
        offset + len(trimmed_data), last_key)
    return offset + len(trimmed_data), last_segment

1063

1064

def _parse_lines(self, lines, pos):
    """Parse complete node lines, recording each one by byte offset.

    Every parsed line is stored in self._keys_by_offset under the offset
    it starts at. Lines flagged as absent are recorded there but left out
    of the returned nodes.

    :param lines: The lines to parse, without their trailing newline.
    :param pos: The byte offset of the first line.
    :return: A (first_key, last_key, nodes, trailers) tuple. nodes is a
        list of (key, value) pairs, or (key, (value, ref_lists)) pairs
        when the index stores reference lists; trailers counts the empty
        lines seen.
    """
    first_key = None
    last_key = None
    trailer_count = 0
    parsed = []
    for raw in lines:
        if raw == '':
            # An empty line can only be the one ending the file.
            if self._size and self._size != pos + 1:
                raise AssertionError("%s %s" % (self._size, pos))
            trailer_count += 1
            continue
        fields = raw.split('\0')
        if len(fields) != self._expected_elements:
            raise errors.BadIndexData(self)
        # Key elements repeat a lot across keys, so intern them to save
        # memory.
        last_key = tuple(
            [intern(part) for part in fields[:self._key_length]])
        if first_key is None:
            first_key = last_key
        absent, references, value = fields[-3:]
        # Reference lists are tab separated; the offsets inside each list
        # are separated by \r.
        ref_lists = tuple([
            tuple([int(ref) for ref in group.split('\r') if ref])
            for group in references.split('\t')])
        self._keys_by_offset[pos] = (last_key, absent, ref_lists, value)
        pos += len(raw) + 1 # +1 for the \n
        if absent:
            continue
        if self.node_ref_lists:
            parsed.append((last_key, (value, ref_lists)))
        else:
            parsed.append((last_key, value))
    return first_key, last_key, parsed, trailer_count

1103

1104

def _parsed_bytes(self, start, start_key, end, end_key):
    """Mark the bytes from start to end as parsed.

    The byte range and its key range are merged into the parsed byte and
    key maps: the new range may join two neighbouring ranges, extend the
    one below it, extend the one above it, or become a new entry.

    :param start: The start of the parsed region.
    :param start_key: The first key in the parsed region.
    :param end: The end of the parsed region (the byte at ``end`` itself
        is not included).
    :param end_key: The last key in the parsed region.
    """
    byte_map = self._parsed_byte_map
    key_map = self._parsed_key_map
    slot = self._parsed_byte_index(start)
    if slot == -1:
        # first range parsed is always the beginning.
        byte_map.insert(slot, (start, end))
        key_map.insert(slot, (start_key, end_key))
        return
    upper = slot + 1
    joins_lower = byte_map[slot][1] == start
    joins_upper = upper < len(byte_map) and byte_map[upper][0] == end
    if joins_lower and joins_upper:
        # The new range closes the gap: fold the upper entry into the
        # lower one.
        byte_map[slot] = (byte_map[slot][0], byte_map[upper][1])
        key_map[slot] = (key_map[slot][0], key_map[upper][1])
        del byte_map[upper]
        del key_map[upper]
    elif joins_lower:
        # extend the lower entry
        byte_map[slot] = (byte_map[slot][0], end)
        key_map[slot] = (key_map[slot][0], end_key)
    elif joins_upper:
        # extend the higher entry
        byte_map[upper] = (start, byte_map[upper][1])
        key_map[upper] = (start_key, key_map[upper][1])
    else:
        # new entry
        byte_map.insert(upper, (start, end))
        key_map.insert(upper, (start_key, end_key))

1153

1154

def _read_and_parse(self, readv_ranges):
    """Read the ranges and parse the resulting data.

    Falls back to buffering the whole index when at least half of the
    file has already been read, or when the transport hands back the
    entire file in one chunk.

    :param readv_ranges: A prepared readv range list.
    """
    if not readv_ranges:
        return
    if self._nodes is None and self._bytes_read * 2 >= self._size:
        # At least 50% of the file has been read already and more is
        # about to be requested: buffer everything and be done.
        self._buffer_all()
        return

    chunks = self._transport.readv(
        self._name, readv_ranges, True, self._size)
    for offset, data in chunks:
        chunk_size = len(data)
        self._bytes_read += chunk_size
        if offset == 0 and chunk_size == self._size:
            # The whole file came back, most likely because the
            # Transport upcast our ranges into one long request, so
            # treat it as a complete buffer.
            self._buffer_all(StringIO(data))
            return
        if self._bisect_nodes is None:
            # Nothing parsed yet, so this chunk has to be the start of
            # the file, which holds the header.
            if offset != 0:
                raise AssertionError()
            offset, data = self._parse_header_from_bytes(data)
        self._parse_region(offset, data)

1185

1186

def _signature(self):
    """Return the file signature that identifies this index type.

    This is the module-level ``_SIGNATURE`` value.
    """
    return _SIGNATURE

1189

1190

def validate(self):
    """Validate that everything in the index can be accessed.

    iter_all_entries currently validates everything it yields, so the
    entries are simply consumed and discarded.
    """
    entries = self.iter_all_entries()
    for _entry in entries:
        pass

1195

1196

1197

class CombinedGraphIndex(object):

1198

"""A GraphIndex made up from smaller GraphIndices.

1199

1200

The backing indices must implement GraphIndex, and are presumed to be

1201

static data.

1202

1203

Queries against the combined index will be made against the first index,

1204

and then the second and so on. The order of index's can thus influence

1205

performance significantly. For example, if one index is on local disk and a

1206

second on a remote server, the local disk index should be before the other

1207

in the index list.

1208

"""

1209

1210

def __init__(self, indices, reload_func=None):

1211

"""Create a CombinedGraphIndex backed by indices.

1212

1213

:param indices: An ordered list of indices to query for data.

1214

:param reload_func: A function to call if we find we are missing an

1215

index. Should have the form reload_func() => True/False to indicate

1216

if reloading actually changed anything.

1217

"""

1218

self._indices = indices

1219

self._reload_func = reload_func

1220

1221

def __repr__(self):

1222

return "%s(%s)" % (

1223

self.__class__.__name__,

1224

', '.join(map(repr, self._indices)))

1225

1226

def get_parent_map(self, keys):

1227

"""See graph.StackedParentsProvider.get_parent_map"""

1228

search_keys = set(keys)

1229

if NULL_REVISION in search_keys:

1230

search_keys.discard(NULL_REVISION)

1231

found_parents = {NULL_REVISION:[]}

1232

else:

1233

found_parents = {}

1234

for index, key, value, refs in self.iter_entries(search_keys):

1235

parents = refs[0]

1236

if not parents:

1237

parents = (NULL_REVISION,)

1238

found_parents[key] = parents

1239

return found_parents

1240

1241

has_key = _has_key_from_parent_map

1242

1243

def insert_index(self, pos, index):

1244

"""Insert a new index in the list of indices to query.

1245

1246

:param pos: The position to insert the index.

1247

:param index: The index to insert.

1248

"""

1249

self._indices.insert(pos, index)

1250

1251

def iter_all_entries(self):

1252

"""Iterate over all keys within the index

1253

1254

Duplicate keys across child indices are presumed to have the same

1255

value and are only reported once.

1256

1257

:return: An iterable of (index, key, reference_lists, value).

1258

There is no defined order for the result iteration - it will be in

1259

the most efficient order for the index.

1260

"""

1261

seen_keys = set()

1262

while True:

1263

try:

1264

for index in self._indices:

1265

for node in index.iter_all_entries():

1266

if node[1] not in seen_keys:

1267

yield node

1268

seen_keys.add(node[1])

1269

return

1270

except errors.NoSuchFile:

1271

self._reload_or_raise()

1272

1273

def iter_entries(self, keys):

1274

"""Iterate over keys within the index.

1275

1276

Duplicate keys across child indices are presumed to have the same

1277

value and are only reported once.

1278

1279

:param keys: An iterable providing the keys to be retrieved.

1280

:return: An iterable of (index, key, reference_lists, value). There is no

1281

defined order for the result iteration - it will be in the most

1282

efficient order for the index.

1283

"""

1284

keys = set(keys)

1285

while True:

1286

try:

1287

for index in self._indices:

1288

if not keys:

1289

return

1290

for node in index.iter_entries(keys):

1291

keys.remove(node[1])

1292

yield node

1293

return

1294

except errors.NoSuchFile:

1295

self._reload_or_raise()

1296

1297

def iter_entries_prefix(self, keys):

1298

"""Iterate over keys within the index using prefix matching.

1299

1300

Duplicate keys across child indices are presumed to have the same

1301

value and are only reported once.

1302

1303

Prefix matching is applied within the tuple of a key, not to within

1304

the bytestring of each key element. e.g. if you have the keys ('foo',

1305

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1306

only the former key is returned.

1307

1308

:param keys: An iterable providing the key prefixes to be retrieved.

1309

Each key prefix takes the form of a tuple the length of a key, but

1310

with the last N elements 'None' rather than a regular bytestring.

1311

The first element cannot be 'None'.

1312

:return: An iterable as per iter_all_entries, but restricted to the

1313

keys with a matching prefix to those supplied. No additional keys

1314

will be returned, and every match that is in the index will be

1315

returned.

1316

"""

1317

keys = set(keys)

1318

if not keys:

1319

return

1320

seen_keys = set()

1321

while True:

1322

try:

1323

for index in self._indices:

1324

for node in index.iter_entries_prefix(keys):

1325

if node[1] in seen_keys:

1326

continue

1327

seen_keys.add(node[1])

1328

yield node

1329

return

1330

except errors.NoSuchFile:

1331

self._reload_or_raise()

1332

1333

def find_ancestry(self, keys, ref_list_num):

1334

"""Find the complete ancestry for the given set of keys.

1335

1336

Note that this is a whole-ancestry request, so it should be used

1337

sparingly.

1338

1339

:param keys: An iterable of keys to look for

1340

:param ref_list_num: The reference list which references the parents

1341

we care about.

1342

:return: (parent_map, missing_keys)

1343

"""

1344

missing_keys = set()

1345

parent_map = {}

1346

keys_to_lookup = set(keys)

1347

generation = 0

1348

while keys_to_lookup:

1349

# keys that *all* indexes claim are missing, stop searching them

1350

generation += 1

1351

all_index_missing = None

1352

# print 'gen\tidx\tsub\tn_keys\tn_pmap\tn_miss'

1353

# print '%4d\t\t\t%4d\t%5d\t%5d' % (generation, len(keys_to_lookup),

1354

# len(parent_map),

1355

# len(missing_keys))

1356

for index_idx, index in enumerate(self._indices):

1357

# TODO: we should probably be doing something with

1358

# 'missing_keys' since we've already determined that

1359

# those revisions have not been found anywhere

1360

index_missing_keys = set()

1361

# Find all of the ancestry we can from this index

1362

# keep looking until the search_keys set is empty, which means

1363

# things we didn't find should be in index_missing_keys

1364

search_keys = keys_to_lookup

1365

sub_generation = 0

1366

# print ' \t%2d\t\t%4d\t%5d\t%5d' % (

1367

# index_idx, len(search_keys),

1368

# len(parent_map), len(index_missing_keys))

1369

while search_keys:

1370

sub_generation += 1

1371

# TODO: ref_list_num should really be a parameter, since

1372

# CombinedGraphIndex does not know what the ref lists

1373

# mean.

1374

search_keys = index._find_ancestors(search_keys,

1375

ref_list_num, parent_map, index_missing_keys)

1376

# print ' \t \t%2d\t%4d\t%5d\t%5d' % (

1377

# sub_generation, len(search_keys),

1378

# len(parent_map), len(index_missing_keys))

1379

# Now set whatever was missing to be searched in the next index

1380

keys_to_lookup = index_missing_keys

1381

if all_index_missing is None:

1382

all_index_missing = set(index_missing_keys)

1383

else:

1384

all_index_missing.intersection_update(index_missing_keys)

1385

if not keys_to_lookup:

1386

break

1387

if all_index_missing is None:

1388

# There were no indexes, so all search keys are 'missing'

1389

missing_keys.update(keys_to_lookup)

1390

keys_to_lookup = None

1391

else:

1392

missing_keys.update(all_index_missing)

1393

keys_to_lookup.difference_update(all_index_missing)

1394

return parent_map, missing_keys

1395

1396

def key_count(self):

1397

"""Return an estimate of the number of keys in this index.

1398

1399

For CombinedGraphIndex this is approximated by the sum of the keys of

1400

the child indices. As child indices may have duplicate keys this can

1401

have a maximum error of the number of child indices * largest number of

1402

keys in any index.

1403

"""

1404

while True:

1405

try:

1406

return sum((index.key_count() for index in self._indices), 0)

1407

except errors.NoSuchFile:

1408

self._reload_or_raise()

1409

1410

missing_keys = _missing_keys_from_parent_map

1411

1412

def _reload_or_raise(self):

1413

"""We just got a NoSuchFile exception.

1414

1415

Try to reload the indices, if it fails, just raise the current

1416

exception.

1417

"""

1418

if self._reload_func is None:

1419

raise

1420

exc_type, exc_value, exc_traceback = sys.exc_info()

1421

trace.mutter('Trying to reload after getting exception: %s',

1422

exc_value)

1423

if not self._reload_func():

1424

# We tried to reload, but nothing changed, so we fail anyway

1425

trace.mutter('_reload_func indicated nothing has changed.'

1426

' Raising original exception.')

1427

raise exc_type, exc_value, exc_traceback

1428

1429

def validate(self):

1430

"""Validate that everything in the index can be accessed."""

1431

while True:

1432

try:

1433

for index in self._indices:

1434

index.validate()

1435

return

1436

except errors.NoSuchFile:

1437

self._reload_or_raise()

1438

1439

1440

class InMemoryGraphIndex(GraphIndexBuilder):

1441

"""A GraphIndex which operates entirely out of memory and is mutable.

1442

1443

This is designed to allow the accumulation of GraphIndex entries during a

1444

single write operation, where the accumulated entries need to be immediately

1445

available - for example via a CombinedGraphIndex.

1446

"""

1447

1448

def add_nodes(self, nodes):
    """Add nodes to the index.

    :param nodes: An iterable of (key, value, node_refs) entries to add,
        or of (key, value) entries when the index has no reference lists.
    """
    if not self.reference_lists:
        for key, value in nodes:
            self.add_node(key, value)
        return
    for key, value, node_refs in nodes:
        self.add_node(key, value, node_refs)

1459

1460

def iter_all_entries(self):
    """Iterate over all keys within the index

    Nodes flagged as absent are skipped.

    :return: An iterable of (index, key, value, reference_lists), or of
        (index, key, value) when the index has no reference lists. There
        is no defined order for the result iteration - it will be in the
        most efficient order for the index (in this case dictionary hash
        order).
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    include_refs = self.reference_lists
    for key, (absent, references, value) in self._nodes.iteritems():
        if absent:
            continue
        if include_refs:
            yield self, key, value, references
        else:
            yield self, key, value

1478

1479

def iter_entries(self, keys):

1480

"""Iterate over keys within the index.

1481

1482

:param keys: An iterable providing the keys to be retrieved.

1483

:return: An iterable of (index, key, value, reference_lists). There is no

1484

defined order for the result iteration - it will be in the most

1485

efficient order for the index (keys iteration order in this case).

1486

"""

1487

keys = set(keys)

1488

if self.reference_lists:

1489

for key in keys.intersection(self._keys):

1490

node = self._nodes[key]

1491

if not node[0]:

1492

yield self, key, node[2], node[1]

1493

else:

1494

for key in keys.intersection(self._keys):

1495

node = self._nodes[key]

1496

if not node[0]:

1497

yield self, key, node[2]

1498

1499

def iter_entries_prefix(self, keys):

1500

"""Iterate over keys within the index using prefix matching.

1501

1502

Prefix matching is applied within the tuple of a key, not to within

1503

the bytestring of each key element. e.g. if you have the keys ('foo',

1504

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1505

only the former key is returned.

1506

1507

:param keys: An iterable providing the key prefixes to be retrieved.

1508

Each key prefix takes the form of a tuple the length of a key, but

1509

with the last N elements 'None' rather than a regular bytestring.

1510

The first element cannot be 'None'.

1511

:return: An iterable as per iter_all_entries, but restricted to the

1512

keys with a matching prefix to those supplied. No additional keys

1513

will be returned, and every match that is in the index will be

1514

returned.

1515

"""

1516

# XXX: To much duplication with the GraphIndex class; consider finding

1517

# a good place to pull out the actual common logic.

1518

keys = set(keys)

1519

if not keys:

1520

return

1521

if self._key_length == 1:

1522

for key in keys:

1523

# sanity check

1524

if key[0] is None:

1525

raise errors.BadIndexKey(key)

1526

if len(key) != self._key_length:

1527

raise errors.BadIndexKey(key)

1528

node = self._nodes[key]

1529

if node[0]:

1530

continue

1531

if self.reference_lists:

1532

yield self, key, node[2], node[1]

1533

else:

1534

yield self, key, node[2]

1535

return

1536

nodes_by_key = self._get_nodes_by_key()

1537

for key in keys:

1538

# sanity check

1539

if key[0] is None:

1540

raise errors.BadIndexKey(key)

1541

if len(key) != self._key_length:

1542

raise errors.BadIndexKey(key)

1543

# find what it refers to:

1544

key_dict = nodes_by_key

1545

elements = list(key)

1546

# find the subdict to return

1547

try:

1548

while len(elements) and elements[0] is not None:

1549

key_dict = key_dict[elements[0]]

1550

elements.pop(0)

1551

except KeyError:

1552

# a non-existant lookup.

1553

continue

1554

if len(elements):

1555

dicts = [key_dict]

1556

while dicts:

1557

key_dict = dicts.pop(-1)

1558

# can't be empty or would not exist

1559

item, value = key_dict.iteritems().next()

1560

if type(value) == dict:

1561

# push keys

1562

dicts.extend(key_dict.itervalues())

1563

else:

1564

# yield keys

1565

for value in key_dict.itervalues():

1566

yield (self, ) + value

1567

else:

1568

yield (self, ) + key_dict

1569

1570

def key_count(self):

1571

"""Return an estimate of the number of keys in this index.

1572

1573

For InMemoryGraphIndex the estimate is exact.

1574

"""

1575

return len(self._keys)

1576

1577

def validate(self):

1578

"""In memory index's have no known corruption at the moment."""

1579

1580

1581

class GraphIndexPrefixAdapter(object):

1582

"""An adapter between GraphIndex with different key lengths.

1583

1584

Queries against this will emit queries against the adapted Graph with the

1585

prefix added, queries for all items use iter_entries_prefix. The returned

1586

nodes will have their keys and node references adjusted to remove the

1587

prefix. Finally, an add_nodes_callback can be supplied - when called the

1588

nodes and references being added will have prefix prepended.

1589

"""

1590

1591

def __init__(self, adapted, prefix, missing_key_length,

1592

add_nodes_callback=None):

1593

"""Construct an adapter against adapted with prefix."""

1594

self.adapted = adapted

1595

self.prefix_key = prefix + (None,)*missing_key_length

1596

self.prefix = prefix

1597

self.prefix_len = len(prefix)

1598

self.add_nodes_callback = add_nodes_callback

1599

1600

def add_nodes(self, nodes):

1601

"""Add nodes to the index.

1602

1603

:param nodes: An iterable of (key, node_refs, value) entries to add.

1604

"""

1605

# save nodes in case its an iterator

1606

nodes = tuple(nodes)

1607

translated_nodes = []

1608

try:

1609

# Add prefix_key to each reference node_refs is a tuple of tuples,

1610

# so split it apart, and add prefix_key to the internal reference

1611

for (key, value, node_refs) in nodes:

1612

adjusted_references = (

1613

tuple(tuple(self.prefix + ref_node for ref_node in ref_list)

1614

for ref_list in node_refs))

1615

translated_nodes.append((self.prefix + key, value,

1616

adjusted_references))

1617

except ValueError:

1618

# XXX: TODO add an explicit interface for getting the reference list

1619

# status, to handle this bit of user-friendliness in the API more

1620

# explicitly.

1621

for (key, value) in nodes:

1622

translated_nodes.append((self.prefix + key, value))

1623

self.add_nodes_callback(translated_nodes)

1624

1625

def add_node(self, key, value, references=()):

1626

"""Add a node to the index.

1627

1628

:param key: The key. keys are non-empty tuples containing

1629

as many whitespace-free utf8 bytestrings as the key length

1630

defined for this index.

1631

:param references: An iterable of iterables of keys. Each is a

1632

reference to another key.

1633

:param value: The value to associate with the key. It may be any

1634

bytes as long as it does not contain \0 or \n.

1635

"""

1636

self.add_nodes(((key, value, references), ))

1637

1638

def _strip_prefix(self, an_iter):

1639

"""Strip prefix data from nodes and return it."""

1640

for node in an_iter:

1641

# cross checks

1642

if node[1][:self.prefix_len] != self.prefix:

1643

raise errors.BadIndexData(self)

1644

for ref_list in node[3]:

1645

for ref_node in ref_list:

1646

if ref_node[:self.prefix_len] != self.prefix:

1647

raise errors.BadIndexData(self)

1648

yield node[0], node[1][self.prefix_len:], node[2], (

1649

tuple(tuple(ref_node[self.prefix_len:] for ref_node in ref_list)

1650

for ref_list in node[3]))

1651

1652

def iter_all_entries(self):

1653

"""Iterate over all keys within the index

1654

1655

iter_all_entries is implemented against the adapted index using

1656

iter_entries_prefix.

1657

1658

:return: An iterable of (index, key, reference_lists, value). There is no

1659

defined order for the result iteration - it will be in the most

1660

efficient order for the index (in this case dictionary hash order).

1661

"""

1662

return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

1663

1664

def iter_entries(self, keys):

1665

"""Iterate over keys within the index.

1666

1667

:param keys: An iterable providing the keys to be retrieved.

1668

:return: An iterable of (index, key, value, reference_lists). There is no

1669

defined order for the result iteration - it will be in the most

1670

efficient order for the index (keys iteration order in this case).

1671

"""

1672

return self._strip_prefix(self.adapted.iter_entries(

1673

self.prefix + key for key in keys))

1674

1675

def iter_entries_prefix(self, keys):

1676

"""Iterate over keys within the index using prefix matching.

1677

1678

Prefix matching is applied within the tuple of a key, not to within

1679

the bytestring of each key element. e.g. if you have the keys ('foo',

1680

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1681

only the former key is returned.

1682

1683

:param keys: An iterable providing the key prefixes to be retrieved.

1684

Each key prefix takes the form of a tuple the length of a key, but

1685

with the last N elements 'None' rather than a regular bytestring.

1686

The first element cannot be 'None'.

1687

:return: An iterable as per iter_all_entries, but restricted to the

1688

keys with a matching prefix to those supplied. No additional keys

1689

will be returned, and every match that is in the index will be

1690

returned.

1691

"""

1692

return self._strip_prefix(self.adapted.iter_entries_prefix(

1693

self.prefix + key for key in keys))

1694

1695

def key_count(self):

1696

"""Return an estimate of the number of keys in this index.

1697

1698

For GraphIndexPrefixAdapter this is relatively expensive - key

1699

iteration with the prefix is done.

1700

"""

1701

return len(list(self.iter_all_entries()))

1702

1703

def validate(self):

1704

"""Call the adapted's validate."""

1705

self.adapted.validate()

Older »