~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Martin Pool
Date: 2005-07-21 21:32:13 UTC
Revision ID: mbp@sourcefrog.net-20050721213213-c6ac0e8b06eaad0f

- bzr update-hashes shows some stats on what it did

files added:
build-api

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/upgrade.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/new-inventory-sample.xml

notes/performance.txt

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

plugins/changeset

plugins/changeset/__init__.py

plugins/changeset/apply_changeset.py

plugins/changeset/common.py

plugins/changeset/gen_changeset.py

plugins/changeset/read_changeset.py

plugins/checkperms

testbzr

testsweet.py

urlgrabber

urlgrabber/__init__.py

urlgrabber/byterange.py

urlgrabber/grabber.py

urlgrabber/keepalive.py

urlgrabber/mirror.py

urlgrabber/progress.py

files removed:
BRANCH.TODO

COPYING.txt

INSTALL

Makefile

bzr.ico

bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/annotate.py

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/chunk_writer.py

bzrlib/cmd_version_info.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_iter_merge_sorted_revisions.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_dotted_revno.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave_commands.py

bzrlib/win32utils.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/emacs

contrib/emacs/bzr-mode.el

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/HACKING.txt

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

doc/news-template.txt

generate_docs.py

man1

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/build_release.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files renamed:
tools/doc_generate/autodoc_man.py => bzr-man.py

bzrlib/bundle/__init__.py => bzrlib/changeset.py

contrib/newinventory.py => bzrlib/newinventory.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/branch_implementations/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_revisionspec.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/blackbox/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/__init__.py => bzrlib/store.py

bzrlib/xml_serializer.py => bzrlib/xml.py

bzrlib/util/effbot/ => effbot/

bzrlib/util/elementtree/ => elementtree/

bzrlib/plugins/ => plugins/

bzrlib/tests/test_weave.py => tools/testweave.py

files modified:
.bzrignore

.rsyncexclude

NEWS

README

TODO

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/selftest/__init__.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib/bash/bzr.simple

contrib/pwk

contrib/zsh/_bzr

elementtree/ElementTree.py

setup.py *

tools/convertfile.py

tools/convertinv.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

symbol_versioning,

)

# readv request, as an (offset, length) pair, used to fetch the start of the
# index file where the signature and option lines are parsed from.
_HEADER_READV = (0, 200)

# Prefix of the option line recording the number of elements in each key.
_OPTION_KEY_ELEMENTS = "key_elements="

# Prefix of the option line recording the number of keys in the index.
_OPTION_LEN = "len="

# Prefix of the option line recording the number of reference lists per node.
_OPTION_NODE_REFS = "node_ref_lists="

# First line written to every serialised index.
_SIGNATURE = "Bazaar Graph Index 1\n"

# Matches any character that is not allowed inside a key element.
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

# Matches the characters that are not allowed inside a node value.
_newline_null_re = re.compile('[\n\0]')

def _has_key_from_parent_map(self, key):

"""Check if this index has one key.

If it's possible to check for multiple keys at once through

calling get_parent_map that should be faster.

"""

return (key in self.get_parent_map([key]))

def _missing_keys_from_parent_map(self, keys):

return set(keys) - set(self.get_parent_map(keys))

class GraphIndexBuilder(object):
    """A builder that can build a GraphIndex.

    The resulting graph has the structure:

    _SIGNATURE OPTIONS NODES NEWLINE
    _SIGNATURE     := 'Bazaar Graph Index 1' NEWLINE
    OPTIONS        := 'node_ref_lists=' DIGITS NEWLINE
                      'key_elements=' DIGITS NEWLINE
                      'len=' DIGITS NEWLINE
    NODES          := NODE*
    NODE           := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
    KEY            := KEY_ELEMENT (NULL KEY_ELEMENT){key_elements - 1}
    KEY_ELEMENT    := Not-whitespace-utf8
    ABSENT         := 'a'
    REFERENCES     := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
    REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?
    REFERENCE      := DIGITS  ; digits is the byte offset in the index of the
                              ; referenced key.
    VALUE          := no-newline-no-null-bytes
    """

    def __init__(self, reference_lists=0, key_elements=1):
        """Create a GraphIndex builder.

        :param reference_lists: The number of node references lists for each
            entry.
        :param key_elements: The number of bytestrings in each key.
        """
        self.reference_lists = reference_lists
        # Keys added through add_node (absent placeholders are not included).
        self._keys = set()
        # A dict of {key: (absent, ref_lists, value)}
        self._nodes = {}
        # Nested-dict view of the present nodes, built on demand by
        # _get_nodes_by_key.
        self._nodes_by_key = None
        self._key_length = key_elements
        self._optimize_for_size = False

    def _check_key(self, key):
        """Raise BadIndexKey if key is not a valid key for this index."""
        # This is an exact type test: tuple subclasses are rejected too.
        if type(key) != tuple:
            raise errors.BadIndexKey(key)
        if self._key_length != len(key):
            raise errors.BadIndexKey(key)
        for element in key:
            if not element or _whitespace_re.search(element) is not None:
                raise errors.BadIndexKey(element)

    def _external_references(self):
        """Return references that are not present in this index.

        :return: A set of keys that appear in the second reference list of
            some node but are not themselves keys yielded by
            iter_all_entries. Empty when there are fewer than two reference
            lists.
        """
        # NOTE(review): iter_all_entries is not defined on this class in the
        # code visible here -- presumably a subclass provides it; confirm.
        keys = set()
        refs = set()
        # TODO: JAM 2008-11-21 This makes an assumption about how the reference
        #       lists are used. It is currently correct for pack-0.92 through
        #       1.9, which use the node references (3rd column) second
        #       reference list as the compression parent. Perhaps this should
        #       be moved into something higher up the stack, since it
        #       makes assumptions about how the index is used.
        if self.reference_lists > 1:
            for node in self.iter_all_entries():
                keys.add(node[1])
                refs.update(node[3][1])
            return refs - keys
        else:
            # If reference_lists == 0 there can be no external references, and
            # if reference_lists == 1, then there isn't a place to store the
            # compression parent
            return set()

    def _store_node_by_key(self, nodes_by_key, key, value, node_refs):
        """Insert one present node into a nested nodes-by-key dict.

        For a key of (foo, bar, baz) this sets
        nodes_by_key[foo][bar][baz] to (key, value, node_refs) when the
        index has reference lists, and to (key, value) otherwise.
        """
        if self.reference_lists:
            key_value = key, value, node_refs
        else:
            key_value = key, value
        key_dict = nodes_by_key
        for subkey in key[:-1]:
            key_dict = key_dict.setdefault(subkey, {})
        key_dict[key[-1]] = key_value

    def _get_nodes_by_key(self):
        """Return the nested-dict view of the present nodes.

        The view is built from self._nodes on first use, skipping absent
        placeholders, and cached in self._nodes_by_key.
        """
        if self._nodes_by_key is None:
            nodes_by_key = {}
            for key, (absent, references, value) in self._nodes.iteritems():
                if absent:
                    continue
                self._store_node_by_key(nodes_by_key, key, value, references)
            self._nodes_by_key = nodes_by_key
        return self._nodes_by_key

    def _update_nodes_by_key(self, key, value, node_refs):
        """Update the _nodes_by_key dict with a new key.

        For a key of (foo, bar, baz) create
        _nodes_by_key[foo][bar][baz] = key_value

        Does nothing when the nested view has not been built yet.
        """
        if self._nodes_by_key is None:
            return
        self._store_node_by_key(self._nodes_by_key, key, value, node_refs)

    def _check_key_ref_value(self, key, references, value):
        """Check that 'key' and 'references' are all valid.

        :param key: A key tuple. Must conform to the key interface (be a tuple,
            be of the right length, not have any whitespace or nulls in any key
            element.)
        :param references: An iterable of reference lists. Something like
            [[(ref, key)], [(ref, key), (other, key)]]
        :param value: The value associate with this key. Must not contain
            newlines or null characters.
        :return: (node_refs, absent_references)
            node_refs   basically a packed form of 'references' where all
                        iterables are tuples
            absent_references   reference keys that are not in self._nodes.
                                This may contain duplicates if the same key is
                                referenced in multiple lists.
        :raises errors.BadIndexKey: If key, or a reference that is not
            already in self._nodes, is not a valid key.
        :raises errors.BadIndexValue: If value contains a newline or null,
            or the number of reference lists is not self.reference_lists.
        """
        self._check_key(key)
        if _newline_null_re.search(value) is not None:
            raise errors.BadIndexValue(value)
        if len(references) != self.reference_lists:
            raise errors.BadIndexValue(references)
        node_refs = []
        absent_references = []
        for reference_list in references:
            for reference in reference_list:
                # If reference *is* in self._nodes, then we know it has already
                # been checked.
                if reference not in self._nodes:
                    self._check_key(reference)
                    absent_references.append(reference)
            node_refs.append(tuple(reference_list))
        return tuple(node_refs), absent_references

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :raises errors.BadIndexDuplicateKey: If key has already been added
            as a present (non-absent) node.
        """
        (node_refs,
         absent_references) = self._check_key_ref_value(key, references, value)
        if key in self._nodes and self._nodes[key][0] != 'a':
            raise errors.BadIndexDuplicateKey(key, self)
        for reference in absent_references:
            # There may be duplicates, but I don't think it is worth worrying
            # about
            self._nodes[reference] = ('a', (), '')
        self._nodes[key] = ('', node_refs, value)
        self._keys.add(key)
        if self._nodes_by_key is not None and self._key_length > 1:
            self._update_nodes_by_key(key, value, node_refs)

    def finish(self):
        """Serialise the accumulated nodes.

        :return: A StringIO holding the complete serialised index.
        :raises errors.BzrError: If reference lists are in use and the
            number of bytes produced differs from the size predicted while
            computing the reference offsets.
        """
        lines = [_SIGNATURE]
        lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
        lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
        lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')
        prefix_length = sum(len(x) for x in lines)
        # references are byte offsets. To avoid having to do nasty
        # polynomial work to resolve offsets (references to later in the
        # file cannot be determined until all the inbetween references have
        # been calculated too) we pad the offsets with 0's to make them be
        # of consistent length. Using binary offsets would break the trivial
        # file parsing.
        # to calculate the width of zero's needed we do three passes:
        # one to gather all the non-reference data and the number of references.
        # one to pad all the data with reference-length and determine entry
        # addresses.
        # One to serialise.

        # forward sorted by key. In future we may consider topological sorting,
        # at the cost of table scans for direct lookup, or a second index for
        # direct lookup
        nodes = sorted(self._nodes.items())
        # if we do not prepass, we don't know how long it will be up front.
        expected_bytes = None
        # we only need to pre-pass if we have reference lists at all.
        if self.reference_lists:
            key_offset_info = []
            non_ref_bytes = prefix_length
            total_references = 0
            # TODO use simple multiplication for the constants in this loop.
            for key, (absent, references, value) in nodes:
                # record the offset known *so far* for this key:
                # the non reference bytes to date, and the total references to
                # date - saves reaccumulating on the second pass
                key_offset_info.append((key, non_ref_bytes, total_references))
                # key is literal, value is literal, there are 3 null's, 1 NL
                # key is variable length tuple, \x00 between elements
                non_ref_bytes += sum(len(element) for element in key)
                if self._key_length > 1:
                    non_ref_bytes += self._key_length - 1
                # value is literal bytes, there are 3 null's, 1 NL.
                non_ref_bytes += len(value) + 3 + 1
                # one byte for absent if set.
                if absent:
                    non_ref_bytes += 1
                else:
                    # reference_lists is known to be non-zero in this branch.
                    # (ref_lists -1) tabs
                    non_ref_bytes += self.reference_lists - 1
                    # (ref-1 cr's per ref_list)
                    for ref_list in references:
                        # how many references across the whole file?
                        total_references += len(ref_list)
                        # accrue reference separators
                        if ref_list:
                            non_ref_bytes += len(ref_list) - 1
            # how many digits are needed to represent the total byte count?
            digits = 1
            possible_total_bytes = non_ref_bytes + total_references*digits
            while 10 ** digits < possible_total_bytes:
                digits += 1
                possible_total_bytes = non_ref_bytes + total_references*digits
            expected_bytes = possible_total_bytes + 1 # terminating newline
            # resolve key addresses.
            key_addresses = {}
            for key, non_ref_bytes, total_references in key_offset_info:
                key_addresses[key] = non_ref_bytes + total_references*digits
            # serialise
            format_string = '%%0%sd' % digits
        for key, (absent, references, value) in nodes:
            flattened_references = []
            for ref_list in references:
                ref_addresses = []
                for reference in ref_list:
                    ref_addresses.append(format_string % key_addresses[reference])
                flattened_references.append('\r'.join(ref_addresses))
            string_key = '\x00'.join(key)
            lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,
                '\t'.join(flattened_references), value))
        lines.append('\n')
        data = ''.join(lines)
        result = StringIO(data)
        if expected_bytes and len(data) != expected_bytes:
            raise errors.BzrError('Failed index creation. Internal error:'
                ' mismatched output length and expected length: %d %d' %
                (len(data), expected_bytes))
        return result

    def set_optimize(self, for_size=True):
        """Change how the builder tries to optimize the result.

        :param for_size: Tell the builder to try and make the index as small as
            possible.
        :return: None
        """
        # GraphIndexBuilder itself doesn't pay attention to the flag yet, but
        # other builders do.
        self._optimize_for_size = for_size

328

329

330

class GraphIndex(object):

331

"""An index for data with embedded graphs.

332

333

The index maps keys to a list of key reference lists, and a value.

334

Each node has the same number of key reference lists. Each key reference

335

list can be empty or an arbitrary length. The value is an opaque NULL

336

terminated string without any newlines. The storage of the index is

337

hidden in the interface: keys and key references are always tuples of

338

bytestrings, never the internal representation (e.g. dictionary offsets).

339

340

It is presumed that the index will not be mutated - it is static data.

341

342

Successive iter_all_entries calls will read the entire index each time.

343

Additionally, iter_entries calls will read the index linearly until the

344

desired keys are found. XXX: This must be fixed before the index is

345

suitable for production use. :XXX

346

"""

347

348

def __init__(self, transport, name, size):

349

"""Open an index called name on transport.

350

351

:param transport: A bzrlib.transport.Transport.

352

:param name: A path to provide to transport API calls.

353

:param size: The size of the index in bytes. This is used for bisection

354

logic to perform partial index reads. While the size could be

355

obtained by statting the file this introduced an additional round

356

trip as well as requiring stat'able transports, both of which are

357

avoided by having it supplied. If size is None, then bisection

358

support will be disabled and accessing the index will just stream

359

all the data.

360

"""

361

self._transport = transport

362

self._name = name

363

# Becomes a dict of key:(value, reference-list-byte-locations) used by

364

# the bisection interface to store parsed but not resolved keys.

365

self._bisect_nodes = None

366

# Becomes a dict of key:(value, reference-list-keys) which are ready to

367

# be returned directly to callers.

368

self._nodes = None

369

# a sorted list of slice-addresses for the parsed bytes of the file.

370

# e.g. (0,1) would mean that byte 0 is parsed.

371

self._parsed_byte_map = []

372

# a sorted list of keys matching each slice address for parsed bytes

373

# e.g. (None, 'foo@bar') would mean that the first byte contained no

374

# key, and the end byte of the slice is the of the data for 'foo@bar'

375

self._parsed_key_map = []

376

self._key_count = None

377

self._keys_by_offset = None

378

self._nodes_by_key = None

379

self._size = size

380

# The number of bytes we've read so far in trying to process this file

381

self._bytes_read = 0

382

383

def __eq__(self, other):

384

"""Equal when self and other were created with the same parameters."""

385

return (

386

type(self) == type(other) and

387

self._transport == other._transport and

388

self._name == other._name and

389

self._size == other._size)

390

391

def __ne__(self, other):

392

return not self.__eq__(other)

393

394

def __repr__(self):

395

return "%s(%r)" % (self.__class__.__name__,

396

self._transport.abspath(self._name))

397

398

def _buffer_all(self, stream=None):
    """Buffer all the index data.

    Mutates self._nodes, self._keys and self._keys_by_offset (and resets
    self._nodes_by_key). Does nothing if self._nodes is already populated.

    :param stream: Optional file-like object to read the index from. When
        None, the index is fetched with self._transport.get(self._name).
    :raises errors.BadIndexData: If the parsed data does not end with
        exactly one trailer line.
    """
    if self._nodes is not None:
        # We already did this
        return
    if 'index' in debug.debug_flags:
        mutter('Reading entire index %s', self._transport.abspath(self._name))
    if stream is None:
        stream = self._transport.get(self._name)
    self._read_prefix(stream)
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # ready-to-return key:value or key:value, node_ref_lists
    self._nodes = {}
    self._nodes_by_key = None
    # Remember where the node data starts so _parse_lines is given the
    # stream position of the first line.
    pos = stream.tell()
    lines = stream.read().split('\n')
    # split() leaves one element after the final newline; drop it.
    del lines[-1]
    _, _, _, trailers = self._parse_lines(lines, pos)
    for key, absent, references, value in self._keys_by_offset.itervalues():
        if absent:
            continue
        # resolve references:
        if self.node_ref_lists:
            node_value = (value, self._resolve_references(references))
        else:
            node_value = value
        self._nodes[key] = node_value
    # cache the keys for quick set intersections
    self._keys = set(self._nodes)
    if trailers != 1:
        # there must be one line - the empty trailer line.
        raise errors.BadIndexData(self)

437

438

def _get_nodes_by_key(self):

439

if self._nodes_by_key is None:

440

nodes_by_key = {}

441

if self.node_ref_lists:

442

for key, (value, references) in self._nodes.iteritems():

443

key_dict = nodes_by_key

444

for subkey in key[:-1]:

445

key_dict = key_dict.setdefault(subkey, {})

446

key_dict[key[-1]] = key, value, references

447

else:

448

for key, value in self._nodes.iteritems():

449

key_dict = nodes_by_key

450

for subkey in key[:-1]:

451

key_dict = key_dict.setdefault(subkey, {})

452

key_dict[key[-1]] = key, value

453

self._nodes_by_key = nodes_by_key

454

return self._nodes_by_key

455

456

def iter_all_entries(self):
    """Iterate over all keys within the index.

    The whole index is buffered first if that has not happened yet.

    :return: An iterable of (index, key, value) or (index, key, value,
        reference_lists). The former tuple is used when there are no
        reference lists in the index, making the API compatible with simple
        key:value index types. There is no defined order for the result
        iteration - it will be in the most efficient order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    if not self.node_ref_lists:
        # Plain key:value index.
        for key, value in self._nodes.iteritems():
            yield self, key, value
        return
    for key, (value, node_ref_lists) in self._nodes.iteritems():
        yield self, key, value, node_ref_lists

476

477

def _read_prefix(self, stream):
    """Read and validate the signature and option lines from stream.

    On success sets self.node_ref_lists, self._key_length and
    self._key_count from the three option lines, in that order.

    :param stream: A file-like object positioned at the start of the index.
    :raises errors.BadIndexFormatSignature: If the signature does not match.
    :raises errors.BadIndexOptions: If an option line has the wrong prefix
        or a non-integer value.
    """
    signature = stream.read(len(self._signature()))
    if signature != self._signature():
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    # (line prefix, attribute that receives the parsed integer), in the
    # order the lines appear in the file.
    option_fields = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for prefix, attribute in option_fields:
        options_line = stream.readline()
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            # [:-1] drops the trailing newline kept by readline().
            parsed = int(options_line[len(prefix):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed)

502

503

def _resolve_references(self, references):

504

"""Return the resolved key references for references.

505

506

References are resolved by looking up the location of the key in the

507

_keys_by_offset map and substituting the key name, preserving ordering.

508

509

:param references: An iterable of iterables of key locations. e.g.

510

[[123, 456], [123]]

511

:return: A tuple of tuples of keys.

512

"""

513

node_refs = []

514

for ref_list in references:

515

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

516

return tuple(node_refs)

517

518

def _find_index(self, range_map, key):

519

"""Helper for the _parsed_*_index calls.

520

521

Given a range map - [(start, end), ...], finds the index of the range

522

in the map for key if it is in the map, and if it is not there, the

523

immediately preceeding range in the map.

524

"""

525

result = bisect_right(range_map, key) - 1

526

if result + 1 < len(range_map):

527

# check the border condition, it may be in result + 1

528

if range_map[result + 1][0] == key[0]:

529

return result + 1

530

return result

531

532

def _parsed_byte_index(self, offset):

533

"""Return the index of the entry immediately before offset.

534

535

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

536

there is one unparsed byte (the 11th, addressed as[10]). then:

537

asking for 0 will return 0

538

asking for 10 will return 0

539

asking for 11 will return 1

540

asking for 12 will return 1

541

"""

542

key = (offset, 0)

543

return self._find_index(self._parsed_byte_map, key)

544

545

def _parsed_key_index(self, key):

546

"""Return the index of the entry immediately before key.

547

548

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

549

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

550

have been parsed, then:

551

asking for '' will return 0

552

asking for 'a' will return 0

553

asking for 'b' will return 1

554

asking for 'e' will return 1

555

"""

556

search_key = (key, None)

557

return self._find_index(self._parsed_key_map, search_key)

558

559

def _is_parsed(self, offset):

560

"""Returns True if offset has been parsed."""

561

index = self._parsed_byte_index(offset)

562

if index == len(self._parsed_byte_map):

563

return offset < self._parsed_byte_map[index - 1][1]

564

start, end = self._parsed_byte_map[index]

565

return offset >= start and offset < end

566

567

def _iter_entries_from_total_buffer(self, keys):

568

"""Iterate over keys when the entire index is parsed."""

569

keys = keys.intersection(self._keys)

570

if self.node_ref_lists:

571

for key in keys:

572

value, node_refs = self._nodes[key]

573

yield self, key, value, node_refs

574

else:

575

for key in keys:

576

yield self, key, self._nodes[key]

577

578

def iter_entries(self, keys):
    """Iterate over keys within the index.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys supplied. No additional keys will be returned, and every
        key supplied that is in the index will be returned.
    """
    wanted = set(keys)
    if not wanted:
        return []
    # Without a known size bisection is impossible, so read everything.
    if self._size is None and self._nodes is None:
        self._buffer_all()

    # We fit about 20 keys per minimum-read (4K), so if we are looking for
    # more than 1/20th of the index its likely (assuming homogenous key
    # spread) that we'll read the entire index. If we're going to do that,
    # buffer the whole thing. A better analysis might take key spread into
    # account - but B+Tree indices are better anyway.
    # We could look at all data read, and use a threshold there, which will
    # trigger on ancestry walks, but that is not yet fully mapped out.
    if self._nodes is None and len(wanted) * 20 > self.key_count():
        self._buffer_all()
    if self._nodes is not None:
        return self._iter_entries_from_total_buffer(wanted)
    # Still not fully buffered: answer by bisecting the file.
    return (result[1] for result in bisect_multi_bytes(
        self._lookup_keys_via_location, self._size, wanted))

606

607

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    WARNING: Note that this method currently causes a full index parse
    unconditionally (which is reasonably appropriate as it is a means for
    thunking many small indices into one larger one and still supplies
    iter_all_entries at the thunk layer).

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned.
    :raises errors.BadIndexKey: If a prefix starts with None or has the
        wrong number of elements.
    """
    keys = set(keys)
    if not keys:
        return
    # load data - also finds key lengths
    if self._nodes is None:
        self._buffer_all()
    if self._key_length == 1:
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            try:
                node = self._nodes[key]
            except KeyError:
                # a non-existent lookup: skip it, as the multi-element
                # path below does, rather than leaking a KeyError.
                continue
            if self.node_ref_lists:
                value, node_refs = node
                yield self, key, value, node_refs
            else:
                yield self, key, node
        return
    nodes_by_key = self._get_nodes_by_key()
    for key in keys:
        # sanity check
        if key[0] is None:
            raise errors.BadIndexKey(key)
        if len(key) != self._key_length:
            raise errors.BadIndexKey(key)
        # find what it refers to:
        key_dict = nodes_by_key
        elements = list(key)
        # find the subdict whose contents should be returned.
        try:
            while len(elements) and elements[0] is not None:
                key_dict = key_dict[elements[0]]
                elements.pop(0)
        except KeyError:
            # a non-existent lookup.
            continue
        if len(elements):
            # Trailing None elements remain: walk every subtree below the
            # matched prefix.
            dicts = [key_dict]
            while dicts:
                key_dict = dicts.pop(-1)
                # can't be empty or would not exist
                item, value = key_dict.iteritems().next()
                if type(value) == dict:
                    # push keys
                    dicts.extend(key_dict.itervalues())
                else:
                    # yield keys
                    for value in key_dict.itervalues():
                        # each value is the key:value:node refs tuple
                        # ready to yield.
                        yield (self, ) + value
        else:
            # the last thing looked up was a terminal element
            yield (self, ) + key_dict

684

685

def key_count(self):
    """Return an estimate of the number of keys in this index.

    For GraphIndex the estimate is exact. If the count is not known yet,
    the header is read first.
    """
    if self._key_count is not None:
        return self._key_count
    self._read_and_parse([_HEADER_READV])
    return self._key_count

693

694

def _lookup_keys_via_location(self, location_keys):

695

"""Public interface for implementing bisection.

696

697

If _buffer_all has been called, then all the data for the index is in

698

memory, and this method should not be called, as it uses a separate

699

cache because it cannot pre-resolve all indices, which buffer_all does

700

for performance.

701

702

:param location_keys: A list of location(byte offset), key tuples.

703

:return: A list of (location_key, result) tuples as expected by

704

bzrlib.bisect_multi.bisect_multi_bytes.

705

"""

706

# Possible improvements:

707

# - only bisect lookup each key once

708

# - sort the keys first, and use that to reduce the bisection window

709

# -----

710

# this progresses in three parts:

711

# read data

712

# parse it

713

# attempt to answer the question from the now in memory data.

714

# build the readv request

715

# for each location, ask for 800 bytes - much more than rows we've seen

716

# anywhere.

717

readv_ranges = []

718

for location, key in location_keys:

719

# can we answer from cache?

720

if self._bisect_nodes and key in self._bisect_nodes:

721

# We have the key parsed.

722

continue

723

index = self._parsed_key_index(key)

724

if (len(self._parsed_key_map) and

725

self._parsed_key_map[index][0] <= key and

726

(self._parsed_key_map[index][1] >= key or

727

# end of the file has been parsed

728

self._parsed_byte_map[index][1] == self._size)):

729

# the key has been parsed, so no lookup is needed even if its

730

# not present.

731

continue

732

# - if we have examined this part of the file already - yes

733

index = self._parsed_byte_index(location)

734

if (len(self._parsed_byte_map) and

735

self._parsed_byte_map[index][0] <= location and

736

self._parsed_byte_map[index][1] > location):

737

# the byte region has been parsed, so no read is needed.

738

continue

739

length = 800

740

if location + length > self._size:

741

length = self._size - location

742

# todo, trim out parsed locations.

743

if length > 0:

744

readv_ranges.append((location, length))

745

# read the header if needed

746

if self._bisect_nodes is None:

747

readv_ranges.append(_HEADER_READV)

748

self._read_and_parse(readv_ranges)

749

result = []

750

if self._nodes is not None:

751

# _read_and_parse triggered a _buffer_all because we requested the

752

# whole data range

753

for location, key in location_keys:

754

if key not in self._nodes: # not present

755

result.append(((location, key), False))

756

elif self.node_ref_lists:

757

value, refs = self._nodes[key]

758

result.append(((location, key),

759

(self, key, value, refs)))

760

else:

761

result.append(((location, key),

762

(self, key, self._nodes[key])))

763

return result

764

# generate results:

765

# - figure out <, >, missing, present

766

# - result present references so we can return them.

767

# keys that we cannot answer until we resolve references

768

pending_references = []

769

pending_locations = set()

770

for location, key in location_keys:

771

# can we answer from cache?

772

if key in self._bisect_nodes:

773

# the key has been parsed, so no lookup is needed

774

if self.node_ref_lists:

775

# the references may not have been all parsed.

776

value, refs = self._bisect_nodes[key]

777

wanted_locations = []

778

for ref_list in refs:

779

for ref in ref_list:

780

if ref not in self._keys_by_offset:

781

wanted_locations.append(ref)

782

if wanted_locations:

783

pending_locations.update(wanted_locations)

784

pending_references.append((location, key))

785

continue

786

result.append(((location, key), (self, key,

787

value, self._resolve_references(refs))))

788

else:

789

result.append(((location, key),

790

(self, key, self._bisect_nodes[key])))

791

continue

792

else:

793

# has the region the key should be in, been parsed?

794

index = self._parsed_key_index(key)

795

if (self._parsed_key_map[index][0] <= key and

796

(self._parsed_key_map[index][1] >= key or

797

# end of the file has been parsed

798

self._parsed_byte_map[index][1] == self._size)):

799

result.append(((location, key), False))

800

continue

801

# no, is the key above or below the probed location:

802

# get the range of the probed & parsed location

803

index = self._parsed_byte_index(location)

804

# if the key is below the start of the range, its below

805

if key < self._parsed_key_map[index][0]:

806

direction = -1

807

else:

808

direction = +1

809

result.append(((location, key), direction))

810

readv_ranges = []

811

# lookup data to resolve references

812

for location in pending_locations:

813

length = 800

814

if location + length > self._size:

815

length = self._size - location

816

# TODO: trim out parsed locations (e.g. if the 800 is into the

817

# parsed region trim it, and dont use the adjust_for_latency

818

# facility)

819

if length > 0:

820

readv_ranges.append((location, length))

821

self._read_and_parse(readv_ranges)

822

if self._nodes is not None:

823

# The _read_and_parse triggered a _buffer_all, grab the data and

824

# return it

825

for location, key in pending_references:

826

value, refs = self._nodes[key]

827

result.append(((location, key), (self, key, value, refs)))

828

return result

829

for location, key in pending_references:

830

# answer key references we had to look-up-late.

831

value, refs = self._bisect_nodes[key]

832

result.append(((location, key), (self, key,

833

value, self._resolve_references(refs))))

834

return result

835

836

def _parse_header_from_bytes(self, bytes):
    """Parse the index header from the leading bytes of the file.

    The header is the signature followed by three option lines, in this
    order: the node reference list count, the number of key elements and
    the key count.  On success the option values are stored on self, the
    header bytes are recorded as parsed and the bisection parsing state is
    reset to empty.

    :param bytes: The data to parse. It is treated as starting at offset
        0 of the index.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data (which may have length 0).
    :raises BadIndexFormatSignature: If the data does not start with the
        signature of this index type.
    :raises BadIndexOptions: If one of the three option lines is missing,
        carries the wrong prefix or does not hold an integer.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if not signature == expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(expected_signature):].splitlines()
    if len(lines) < 3:
        # A truncated header would otherwise escape as a bare IndexError;
        # report it like any other malformed option block.
        raise errors.BadIndexOptions(self)
    option_prefixes = (_OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS, _OPTION_LEN)
    option_values = []
    for options_line, prefix in zip(lines, option_prefixes):
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            option_values.append(int(options_line[len(prefix):]))
        except ValueError:
            raise errors.BadIndexOptions(self)
    self.node_ref_lists, self._key_length, self._key_count = option_values
    # calculate the bytes we have processed: the signature, the three
    # option lines, and one line terminator byte per option line.
    header_end = (len(signature) + len(lines[0]) + len(lines[1]) +
                  len(lines[2]) + 3)
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

879

880

def _parse_region(self, offset, data):
    """Parse a block of node data as returned by a readv operation.

    The block is handed to _parse_segment one segment at a time, until
    either the end of the block lies inside an already parsed range or
    _parse_segment reports that it handled the last possible segment.

    :param offset: The byte offset the data starts at.
    :param data: The data to parse.
    """
    data_end = offset + len(data)
    resume_from = offset
    finished = False
    while not finished:
        map_pos = self._parsed_byte_index(resume_from)
        # Trivial test - if the end of the data is within the
        # low-matching parsed range, there is nothing left to do.
        if data_end < self._parsed_byte_map[map_pos][1]:
            break
        resume_from, finished = self._parse_segment(
            offset, data, data_end, map_pos)

902

903

def _parse_segment(self, offset, data, end, index):
    """Parse one segment of data.

    The data is first trimmed so that it neither repeats bytes that the
    neighbouring parsed ranges already cover nor includes partial records
    at an edge that does not touch a parsed range (or the end of the
    file).  The remaining lines are parsed, their nodes are stored in
    self._bisect_nodes and the covered byte range is recorded as parsed.

    :param offset: Where 'data' begins in the file.
    :param data: Some data to parse a segment of.
    :param end: Where data ends
    :param index: The current index into the parsed bytes map.
    :return: high_parsed_byte, last_segment.
        high_parsed_byte is the location of the highest parsed byte in this
        segment, last_segment is True if the parsed segment is the last
        possible one in the data block.
    :raises AssertionError: If a newline needed for trimming is missing,
        or if nothing is left to parse after trimming.
    """
    parsed_map = self._parsed_byte_map
    lower_end = parsed_map[index][1]
    # accommodate overlap with data before this.
    if offset < lower_end:
        # overlaps the lower parsed region: skip the parsed data, and
        # don't trim the start to a \n
        trim_start = lower_end - offset
        start_adjacent = True
    elif offset == lower_end:
        # abuts the lower parsed region: use all data, trim nothing
        trim_start = None
        start_adjacent = True
    else:
        # does not overlap the lower parsed region: use all data but
        # trim up to and including the leading \n
        trim_start = None
        start_adjacent = False
    # default is to use all data up to the end, and to be the last segment
    trim_end = None
    last_segment = True
    if end == self._size:
        # lines up to the end of all data: do not strip to the last \n
        end_adjacent = True
    elif index + 1 == len(parsed_map):
        # at the end of the parsed data: strip to the last \n
        end_adjacent = False
    elif end == parsed_map[index + 1][0]:
        # butts up against the next parsed region: do not strip
        end_adjacent = True
    elif end > parsed_map[index + 1][0]:
        # overlaps into the next parsed region: only consider the
        # unparsed data; do not strip to the last \n as we know it is an
        # entire record
        trim_end = parsed_map[index + 1][0] - offset
        end_adjacent = True
        last_segment = end < parsed_map[index + 1][1]
    else:
        # does not overlap into the next region: strip to the last \n
        end_adjacent = False
    # now find bytes to discard if needed
    if not start_adjacent:
        # trim_start is always None on this path, so search from the
        # beginning of the data.
        trim_start = data.find('\n') + 1
        if not (trim_start != 0):
            raise AssertionError('no \n was present')
    if not end_adjacent:
        # trim_end is always None on this path, so search the whole data.
        trim_end = data.rfind('\n') + 1
        if not (trim_end != 0):
            raise AssertionError('no \n was present')
    # adjust offset and data to the parseable data.
    trimmed_data = data[trim_start:trim_end]
    if not (trimmed_data):
        # trim_start and trim_end may legitimately be None here, so they
        # are formatted with %s; %d would raise TypeError and hide the
        # real problem.
        raise AssertionError('read unneeded data [%s:%s] from [%d:%d]'
            % (trim_start, trim_end, offset, offset + len(data)))
    if trim_start:
        offset += trim_start
    # splitlines mangles the \r delimiters.. don't use it.
    lines = trimmed_data.split('\n')
    # the element after the final \n is not a complete line
    del lines[-1]
    first_key, last_key, nodes, _ = self._parse_lines(lines, offset)
    self._bisect_nodes.update(nodes)
    segment_end = offset + len(trimmed_data)
    self._parsed_bytes(offset, first_key, segment_end, last_key)
    return segment_end, last_segment

1010

1011

def _parse_lines(self, lines, pos):
    """Parse complete record lines into keys and nodes.

    Each non-empty line is split on NUL; the leading self._key_length
    elements form the key and the final three elements are the absent
    flag, the references and the value.  References are split on tab into
    lists and on carriage return into integers.  Every record is stored
    in self._keys_by_offset under the position its line starts at; only
    records whose absent flag is empty are returned as nodes.

    :param lines: The lines to parse, without their trailing newlines.
    :param pos: The byte position of the first line.
    :return: first_key, last_key, nodes, trailers. The keys are None if
        no record line was seen; nodes is a list of (key, node_value)
        where node_value is (value, ref_lists) if self.node_ref_lists is
        set and just value otherwise; trailers counts the empty lines.
    :raises BadIndexData: If a line has the wrong number of elements.
    :raises AssertionError: If an empty line is seen anywhere but at the
        final byte of the file.
    """
    first_key = None
    last_key = None
    trailer_count = 0
    parsed_nodes = []
    key_length = self._key_length
    for line in lines:
        if not line:
            # must be at the end
            if self._size and self._size != pos + 1:
                raise AssertionError("%s %s" % (self._size, pos))
            trailer_count += 1
            continue
        fields = line.split('\0')
        if len(fields) != self._expected_elements:
            raise errors.BadIndexData(self)
        # keys are tuples. Each element is a string that may occur many
        # times, so they are interned to save space.
        last_key = tuple([intern(part) for part in fields[:key_length]])
        if first_key is None:
            first_key = last_key
        absent, references, value = fields[-3:]
        ref_lists = tuple([
            tuple([int(ref) for ref in ref_string.split('\r') if ref])
            for ref_string in references.split('\t')])
        self._keys_by_offset[pos] = (last_key, absent, ref_lists, value)
        pos += len(line) + 1 # +1 for the \n
        if absent:
            continue
        if self.node_ref_lists:
            parsed_nodes.append((last_key, (value, ref_lists)))
        else:
            parsed_nodes.append((last_key, value))
    return first_key, last_key, parsed_nodes, trailer_count

1050

1051

def _parsed_bytes(self, start, start_key, end, end_key):
    """Record the bytes from start to end as parsed.

    Calling self._parsed_bytes(1,2) will mark one byte (the one at offset
    1) as parsed.  The byte map and the key map are updated in step: the
    new range is merged with a neighbouring range it touches (on either
    side, or both) and inserted as a separate entry otherwise.

    :param start: The start of the parsed region.
    :param start_key: The first key in the parsed region.
    :param end: The end of the parsed region.
    :param end_key: The last key in the parsed region.
    """
    index = self._parsed_byte_index(start)
    byte_map = self._parsed_byte_map
    key_map = self._parsed_key_map
    if index == -1:
        # first range parsed is always the beginning.
        byte_map.insert(index, (start, end))
        key_map.insert(index, (start_key, end_key))
        return
    following = index + 1
    joins_lower = byte_map[index][1] == start
    joins_upper = (following < len(byte_map) and
                   byte_map[following][0] == end)
    if joins_lower and joins_upper:
        # the new range fills the gap: combine the two regions
        byte_map[index] = (byte_map[index][0], byte_map[following][1])
        key_map[index] = (key_map[index][0], key_map[following][1])
        del byte_map[following]
        del key_map[following]
    elif joins_lower:
        # extend the lower entry upwards
        byte_map[index] = (byte_map[index][0], end)
        key_map[index] = (key_map[index][0], end_key)
    elif joins_upper:
        # extend the higher entry downwards
        byte_map[following] = (start, byte_map[following][1])
        key_map[following] = (start_key, key_map[following][1])
    else:
        # touches nothing: new entry
        byte_map.insert(following, (start, end))
        key_map.insert(following, (start_key, end_key))

1100

1101

def _read_and_parse(self, readv_ranges):
    """Read the given ranges and parse the data that comes back.

    Nothing happens for an empty range list.  If the index is not yet
    fully buffered (self._nodes is None) and at least half of the file
    has already been read, the whole index is buffered with
    _buffer_all() instead of issuing another partial read.

    :param readv_ranges: A prepared readv range list.
    """
    if not readv_ranges:
        return
    if self._nodes is None and self._bytes_read * 2 >= self._size:
        # We've already read more than 50% of the file and we are about to
        # request more data, just _buffer_all() and be done
        self._buffer_all()
        return

    # NOTE(review): the positional True / self._size arguments are
    # presumably readv's latency-adjustment flag and upper limit -
    # confirm against the transport API.
    for start, chunk in self._transport.readv(self._name, readv_ranges,
                                              True, self._size):
        chunk_length = len(chunk)
        self._bytes_read += chunk_length
        if start == 0 and chunk_length == self._size:
            # We read the whole range, most likely because the
            # Transport upcast our readv ranges into one long request
            # for enough total data to grab the whole index.
            self._buffer_all(StringIO(chunk))
            return
        if self._bisect_nodes is None:
            # nothing parsed yet, so this must be the start of the file
            if start != 0:
                raise AssertionError()
            start, chunk = self._parse_header_from_bytes(chunk)
        self._parse_region(start, chunk)

1132

1133

def _signature(self):
    """Return the file signature for this index type.

    :return: The module level _SIGNATURE value.
    """
    return _SIGNATURE

1136

1137

def validate(self):
    """Validate that everything in the index can be accessed.

    Every entry is iterated and discarded; the iteration itself is the
    validation.
    """
    # iter_all validates completely at the moment, so just do that.
    for _entry in self.iter_all_entries():
        pass

1142

1143

1144

class CombinedGraphIndex(object):

1145

"""A GraphIndex made up from smaller GraphIndices.

1146

1147

The backing indices must implement GraphIndex, and are presumed to be

1148

static data.

1149

1150

Queries against the combined index will be made against the first index,

1151

and then the second and so on. The order of index's can thus influence

1152

performance significantly. For example, if one index is on local disk and a

1153

second on a remote server, the local disk index should be before the other

1154

in the index list.

1155

"""

1156

1157

def __init__(self, indices, reload_func=None):

1158

"""Create a CombinedGraphIndex backed by indices.

1159

1160

:param indices: An ordered list of indices to query for data.

1161

:param reload_func: A function to call if we find we are missing an

1162

index. Should have the form reload_func() => True/False to indicate

1163

if reloading actually changed anything.

1164

"""

1165

self._indices = indices

1166

self._reload_func = reload_func

1167

1168

def __repr__(self):

1169

return "%s(%s)" % (

1170

self.__class__.__name__,

1171

', '.join(map(repr, self._indices)))

1172

1173

@symbol_versioning.deprecated_method(symbol_versioning.one_one)

1174

def get_parents(self, revision_ids):

1175

"""See graph._StackedParentsProvider.get_parents.

1176

1177

This implementation thunks the graph.Graph.get_parents api across to

1178

GraphIndex.

1179

1180

:param revision_ids: An iterable of graph keys for this graph.

1181

:return: A list of parent details for each key in revision_ids.

1182

Each parent details will be one of:

1183

* None when the key was missing

1184

* (NULL_REVISION,) when the key has no parents.

1185

* (parent_key, parent_key...) otherwise.

1186

"""

1187

parent_map = self.get_parent_map(revision_ids)

1188

return [parent_map.get(r, None) for r in revision_ids]

1189

1190

def get_parent_map(self, keys):

1191

"""See graph._StackedParentsProvider.get_parent_map"""

1192

search_keys = set(keys)

1193

if NULL_REVISION in search_keys:

1194

search_keys.discard(NULL_REVISION)

1195

found_parents = {NULL_REVISION:[]}

1196

else:

1197

found_parents = {}

1198

for index, key, value, refs in self.iter_entries(search_keys):

1199

parents = refs[0]

1200

if not parents:

1201

parents = (NULL_REVISION,)

1202

found_parents[key] = parents

1203

return found_parents

1204

1205

has_key = _has_key_from_parent_map

1206

1207

def insert_index(self, pos, index):

1208

"""Insert a new index in the list of indices to query.

1209

1210

:param pos: The position to insert the index.

1211

:param index: The index to insert.

1212

"""

1213

self._indices.insert(pos, index)

1214

1215

def iter_all_entries(self):

1216

"""Iterate over all keys within the index

1217

1218

Duplicate keys across child indices are presumed to have the same

1219

value and are only reported once.

1220

1221

:return: An iterable of (index, key, reference_lists, value).

1222

There is no defined order for the result iteration - it will be in

1223

the most efficient order for the index.

1224

"""

1225

seen_keys = set()

1226

while True:

1227

try:

1228

for index in self._indices:

1229

for node in index.iter_all_entries():

1230

if node[1] not in seen_keys:

1231

yield node

1232

seen_keys.add(node[1])

1233

return

1234

except errors.NoSuchFile:

1235

self._reload_or_raise()

1236

1237

def iter_entries(self, keys):

1238

"""Iterate over keys within the index.

1239

1240

Duplicate keys across child indices are presumed to have the same

1241

value and are only reported once.

1242

1243

:param keys: An iterable providing the keys to be retrieved.

1244

:return: An iterable of (index, key, reference_lists, value). There is no

1245

defined order for the result iteration - it will be in the most

1246

efficient order for the index.

1247

"""

1248

keys = set(keys)

1249

while True:

1250

try:

1251

for index in self._indices:

1252

if not keys:

1253

return

1254

for node in index.iter_entries(keys):

1255

keys.remove(node[1])

1256

yield node

1257

return

1258

except errors.NoSuchFile:

1259

self._reload_or_raise()

1260

1261

def iter_entries_prefix(self, keys):

1262

"""Iterate over keys within the index using prefix matching.

1263

1264

Duplicate keys across child indices are presumed to have the same

1265

value and are only reported once.

1266

1267

Prefix matching is applied within the tuple of a key, not to within

1268

the bytestring of each key element. e.g. if you have the keys ('foo',

1269

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1270

only the former key is returned.

1271

1272

:param keys: An iterable providing the key prefixes to be retrieved.

1273

Each key prefix takes the form of a tuple the length of a key, but

1274

with the last N elements 'None' rather than a regular bytestring.

1275

The first element cannot be 'None'.

1276

:return: An iterable as per iter_all_entries, but restricted to the

1277

keys with a matching prefix to those supplied. No additional keys

1278

will be returned, and every match that is in the index will be

1279

returned.

1280

"""

1281

keys = set(keys)

1282

if not keys:

1283

return

1284

seen_keys = set()

1285

while True:

1286

try:

1287

for index in self._indices:

1288

for node in index.iter_entries_prefix(keys):

1289

if node[1] in seen_keys:

1290

continue

1291

seen_keys.add(node[1])

1292

yield node

1293

return

1294

except errors.NoSuchFile:

1295

self._reload_or_raise()

1296

1297

def key_count(self):

1298

"""Return an estimate of the number of keys in this index.

1299

1300

For CombinedGraphIndex this is approximated by the sum of the keys of

1301

the child indices. As child indices may have duplicate keys this can

1302

have a maximum error of the number of child indices * largest number of

1303

keys in any index.

1304

"""

1305

while True:

1306

try:

1307

return sum((index.key_count() for index in self._indices), 0)

1308

except errors.NoSuchFile:

1309

self._reload_or_raise()

1310

1311

missing_keys = _missing_keys_from_parent_map

1312

1313

def _reload_or_raise(self):

1314

"""We just got a NoSuchFile exception.

1315

1316

Try to reload the indices, if it fails, just raise the current

1317

exception.

1318

"""

1319

if self._reload_func is None:

1320

raise

1321

exc_type, exc_value, exc_traceback = sys.exc_info()

1322

trace.mutter('Trying to reload after getting exception: %s',

1323

exc_value)

1324

if not self._reload_func():

1325

# We tried to reload, but nothing changed, so we fail anyway

1326

trace.mutter('_reload_func indicated nothing has changed.'

1327

' Raising original exception.')

1328

raise exc_type, exc_value, exc_traceback

1329

1330

def validate(self):

1331

"""Validate that everything in the index can be accessed."""

1332

while True:

1333

try:

1334

for index in self._indices:

1335

index.validate()

1336

return

1337

except errors.NoSuchFile:

1338

self._reload_or_raise()

1339

1340

1341

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during a
    single write operation, where the accumulated entries need to be immediately
    available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add
            when the index has reference lists, and of (key, value) entries
            otherwise.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Nodes flagged as absent are not reported.

        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when the index has no reference lists.
            There is no defined order for the result iteration - it will
            be in the most efficient order for the index (in this case
            dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        with_refs = self.reference_lists
        for key, (absent, references, value) in self._nodes.iteritems():
            if absent:
                continue
            if with_refs:
                yield self, key, value, references
            else:
                yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Keys that are not in the index, or whose node is flagged as absent,
        are silently skipped.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when the index has no reference lists.
            There is no defined order for the result iteration - it will
            be in the most efficient order for the index (keys iteration
            order in this case).
        """
        keys = set(keys)
        with_refs = self.reference_lists
        for key in keys.intersection(self._keys):
            # each stored node is (absent, references, value)
            node = self._nodes[key]
            if node[0]:
                continue
            if with_refs:
                yield self, key, node[2], node[1]
            else:
                yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        :raises BadIndexKey: If a prefix starts with None or does not have
            the key length of this index.
        """
        # XXX: Too much duplication with the GraphIndex class; consider
        # finding a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        if self._key_length == 1:
            # With single element keys a prefix is a complete key, so this
            # is a plain lookup.
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                node = self._nodes.get(key)
                if node is None:
                    # a non-existent lookup: no match, exactly as in the
                    # multi-element path below (a KeyError here would
                    # break queries fanned out to several indices).
                    continue
                if node[0]:
                    # flagged absent
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
            return
        nodes_by_key = self._get_nodes_by_key()
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to: walk down one nested dict per leading
            # non-None key element.
            subtree = nodes_by_key
            depth = 0
            try:
                for element in key:
                    if element is None:
                        break
                    subtree = subtree[element]
                    depth += 1
            except KeyError:
                # a non-existent lookup.
                continue
            if depth == len(key):
                # every element was given: subtree is the node itself
                yield (self, ) + subtree
                continue
            # a real prefix: report every node underneath the subtree
            pending = [subtree]
            while pending:
                current = pending.pop()
                # can't be empty or would not exist
                sample = current.itervalues().next()
                if isinstance(sample, dict):
                    # still nested: push the child dicts
                    pending.extend(current.itervalues())
                else:
                    # leaf level: yield the nodes
                    for leaf in current.itervalues():
                        yield (self, ) + leaf

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory indexes have no known corruption at the moment."""

1480

1481

1482

class GraphIndexPrefixAdapter(object):
    """An adapter between GraphIndex with different key lengths.

    Queries against this will emit queries against the adapted Graph with the
    prefix added, queries for all items use iter_entries_prefix. The returned
    nodes will have their keys and node references adjusted to remove the
    prefix. Finally, an add_nodes_callback can be supplied - when called the
    nodes and references being added will have prefix prepended.
    """

    def __init__(self, adapted, prefix, missing_key_length,
        add_nodes_callback=None):
        """Construct an adapter against adapted with prefix.

        :param adapted: The index that queries are forwarded to.
        :param prefix: The tuple of key elements to prepend to every key.
        :param missing_key_length: How many None elements to append to
            prefix to form the prefix key used to query for all entries.
        :param add_nodes_callback: Optional callable which receives the
            list of prefixed nodes built by add_nodes.
        """
        self.adapted = adapted
        self.prefix_key = prefix + (None,)*missing_key_length
        self.prefix = prefix
        self.prefix_len = len(prefix)
        self.add_nodes_callback = add_nodes_callback

    def add_nodes(self, nodes):
        """Add nodes to the index.

        The prefix is prepended to each key and to every referenced key,
        and the resulting list is passed to add_nodes_callback.

        :param nodes: An iterable of (key, value, node_refs) entries to
            add, or of (key, value) entries when there are no reference
            lists.
        """
        # save nodes in case its an iterator
        nodes = tuple(nodes)
        translated_nodes = []
        try:
            # Add prefix_key to each reference node_refs is a tuple of tuples,
            # so split it apart, and add prefix_key to the internal reference
            for (key, value, node_refs) in nodes:
                adjusted_references = (
                    tuple(tuple(self.prefix + ref_node for ref_node in ref_list)
                        for ref_list in node_refs))
                translated_nodes.append((self.prefix + key, value,
                    adjusted_references))
        except ValueError:
            # The nodes did not unpack into three elements.
            # XXX: TODO add an explicit interface for getting the reference list
            # status, to handle this bit of user-friendliness in the API more
            # explicitly.
            for (key, value) in nodes:
                translated_nodes.append((self.prefix + key, value))
        self.add_nodes_callback(translated_nodes)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        """
        self.add_nodes(((key, value, references), ))

    def _strip_prefix(self, an_iter):
        """Strip prefix data from nodes and return it.

        :param an_iter: An iterable of nodes from the adapted index, either
            (index, key, value, reference_lists) or, for an index without
            reference lists, (index, key, value).
        :return: An iterable of the same nodes with the prefix removed
            from the key and from every referenced key.
        :raises BadIndexData: If a key or a referenced key does not start
            with the prefix.
        """
        prefix = self.prefix
        prefix_len = self.prefix_len
        for node in an_iter:
            # cross checks
            if node[1][:prefix_len] != prefix:
                raise errors.BadIndexData(self)
            stripped_key = node[1][prefix_len:]
            if len(node) < 4:
                # The adapted index has no reference lists (add_nodes
                # supports such nodes too), so only the key is adjusted.
                yield node[0], stripped_key, node[2]
                continue
            for ref_list in node[3]:
                for ref_node in ref_list:
                    if ref_node[:prefix_len] != prefix:
                        raise errors.BadIndexData(self)
            yield node[0], stripped_key, node[2], (
                tuple(tuple(ref_node[prefix_len:] for ref_node in ref_list)
                for ref_list in node[3]))

    def iter_all_entries(self):
        """Iterate over all keys within the index

        iter_all_entries is implemented against the adapted index using
        iter_entries_prefix.

        :return: An iterable of (index, key, value, reference_lists). There
            is no defined order for the result iteration - it will be in
            the most efficient order for the adapted index.
        """
        return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There is no
            defined order for the result iteration - it will be in the most
            efficient order for the adapted index.
        """
        return self._strip_prefix(self.adapted.iter_entries(
            self.prefix + key for key in keys))

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        return self._strip_prefix(self.adapted.iter_entries_prefix(
            self.prefix + key for key in keys))

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndexPrefixAdapter this is relatively expensive - key
        iteration with the prefix is done.
        """
        # Count while iterating rather than building a throwaway list.
        return sum(1 for _node in self.iter_all_entries())

    def validate(self):
        """Call the adapted's validate."""
        self.adapted.validate()

Older »