~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Martin Pool
Date: 2007-04-04 06:17:31 UTC
mto: This revision was merged to the branch mainline in revision 2397.
Revision ID: mbp@sourcefrog.net-20070404061731-tt2xrzllqhbodn83

Contents of TODO file moved into bug tracker

files added:
build-api

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_escaped_store.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/xml6.py

doc/README.1st

files removed:
bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/api.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_pack.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/bundle/serializer/v4.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/counted_lock.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/email_message.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/inventory_delta.py

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/multiparent.py

bzrlib/pack.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconfigure.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/pack_repo.py

bzrlib/rules.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/switch.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_create_clone.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_iter_merge_sorted_revisions.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_id_to_dotted_revno.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/bzrdir_implementations/test_push.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/https_server.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_export.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/workingtree_implementations/test_content_filters.py

bzrlib/tests/workingtree_implementations/test_eol_conversion.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_views.py

bzrlib/transport/brokenrename.py

bzrlib/transport/ftp

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/log.py

bzrlib/transport/nosmart.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version_info_formats/format_custom.py

bzrlib/views.py

bzrlib/xml5.py

bzrlib/xml6.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

doc/news-template.txt

man1

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/check-newsbugs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/rst2pdf.py

tools/win32/build_release.py

tools/win32/run_script.py

files renamed:
doc/developers/HACKING.txt => HACKING

bzrlib/deprecated_graph.py => bzrlib/graph.py

bzrlib/help_topics/__init__.py => bzrlib/help_topics.py

bzrlib/_patiencediff_py.py => bzrlib/patiencediff.py

bzrlib/plugins/launchpad/lp_directory.py => bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/test_lp_directory.py => bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/tests/http_utils.py => bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/http_server.py => bzrlib/tests/HttpServer.py

bzrlib/tests/blackbox/test_send.py => bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/per_repository/ => bzrlib/tests/repository_implementations/

bzrlib/tests/test_deprecated_graph.py => bzrlib/tests/test_graph.py

bzrlib/tests/test_revisionspec.py => bzrlib/tests/test_revisionnamespaces.py

bzrlib/transport/ftp/__init__.py => bzrlib/transport/ftp.py

bzrlib/transport/remote.py => bzrlib/transport/smart.py

bzrlib/xml8.py => bzrlib/xml5.py

doc/en/tutorials/centralized_workflow.txt => doc/centralized_workflow.txt

bzrlib/help_topics/en/configuration.txt => doc/configuration.txt

doc/en/user-guide/http_smart_server.txt => doc/http_smart_server.txt

doc/en/user-guide/index.txt => doc/index.txt

doc/en/user-guide/plugins.txt => doc/plugins.txt

doc/en/user-guide/server.txt => doc/server.txt

doc/en/user-guide/setting_up_email.txt => doc/setting_up_email.txt

doc/en/user-guide/specifying_revisions.txt => doc/specifying_revisions.txt

doc/en/tutorials/tutorial.txt => doc/tutorial.txt

doc/en/user-guide/using_aliases.txt => doc/using_aliases.txt

doc/en/user-guide/version_info.txt => doc/version_info.txt

files modified:
.bzrignore

INSTALL

Makefile

NEWS

README

bzr.ico

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/bencode.py

bzrlib/util/configobj/configobj.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml7.py

bzrlib/xml_serializer.py

contrib/bash/bzr.simple

contrib/newinventory.py

contrib/pwclient.full

doc/bazaar-vcs.org.kid

doc/default.css

generate_docs.py

profile_imports.py

setup.py *

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/ostools.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

symbol_versioning,

)

_HEADER_READV = (0, 200)

_OPTION_KEY_ELEMENTS = "key_elements="

_OPTION_LEN = "len="

_OPTION_NODE_REFS = "node_ref_lists="

_SIGNATURE = "Bazaar Graph Index 1\n"

_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

_newline_null_re = re.compile('[\n\0]')

def _has_key_from_parent_map(self, key):

"""Check if this index has one key.

If it's possible to check for multiple keys at once through

calling get_parent_map that should be faster.

"""

return (key in self.get_parent_map([key]))

def _missing_keys_from_parent_map(self, keys):

return set(keys) - set(self.get_parent_map(keys))

class GraphIndexBuilder(object):

"""A builder that can build a GraphIndex.

The resulting graph has the structure:

_SIGNATURE OPTIONS NODES NEWLINE

_SIGNATURE := 'Bazaar Graph Index 1' NEWLINE

OPTIONS := 'node_ref_lists=' DIGITS NEWLINE

NODES := NODE*

NODE := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

KEY := Not-whitespace-utf8

ABSENT := 'a'

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

REFERENCE := DIGITS ; digits is the byte offset in the index of the

; referenced key.

VALUE := no-newline-no-null-bytes

"""

def __init__(self, reference_lists=0, key_elements=1):

"""Create a GraphIndex builder.

:param reference_lists: The number of node references lists for each

entry.

:param key_elements: The number of bytestrings in each key.

"""

self.reference_lists = reference_lists

self._keys = set()

# A dict of {key: (absent, ref_lists, value)}

self._nodes = {}

self._nodes_by_key = None

100

self._key_length = key_elements

101

self._optimize_for_size = False

102

self._combine_backing_indices = True

103

104

def _check_key(self, key):

105

"""Raise BadIndexKey if key is not a valid key for this index."""

106

if type(key) != tuple:

107

raise errors.BadIndexKey(key)

108

if self._key_length != len(key):

109

raise errors.BadIndexKey(key)

110

for element in key:

111

if not element or _whitespace_re.search(element) is not None:

112

raise errors.BadIndexKey(element)

113

114

def _external_references(self):

115

"""Return references that are not present in this index.

116

"""

117

keys = set()

118

refs = set()

119

# TODO: JAM 2008-11-21 This makes an assumption about how the reference

120

# lists are used. It is currently correct for pack-0.92 through

121

# 1.9, which use the node references (3rd column) second

122

# reference list as the compression parent. Perhaps this should

123

# be moved into something higher up the stack, since it

124

# makes assumptions about how the index is used.

125

if self.reference_lists > 1:

126

for node in self.iter_all_entries():

127

keys.add(node[1])

128

refs.update(node[3][1])

129

return refs - keys

130

else:

131

# If reference_lists == 0 there can be no external references, and

132

# if reference_lists == 1, then there isn't a place to store the

133

# compression parent

134

return set()

135

136

def _get_nodes_by_key(self):

137

if self._nodes_by_key is None:

138

nodes_by_key = {}

139

if self.reference_lists:

140

for key, (absent, references, value) in self._nodes.iteritems():

141

if absent:

142

continue

143

key_dict = nodes_by_key

144

for subkey in key[:-1]:

145

key_dict = key_dict.setdefault(subkey, {})

146

key_dict[key[-1]] = key, value, references

147

else:

148

for key, (absent, references, value) in self._nodes.iteritems():

149

if absent:

150

continue

151

key_dict = nodes_by_key

152

for subkey in key[:-1]:

153

key_dict = key_dict.setdefault(subkey, {})

154

key_dict[key[-1]] = key, value

155

self._nodes_by_key = nodes_by_key

156

return self._nodes_by_key

157

158

def _update_nodes_by_key(self, key, value, node_refs):

159

"""Update the _nodes_by_key dict with a new key.

160

161

For a key of (foo, bar, baz) create

162

_nodes_by_key[foo][bar][baz] = key_value

163

"""

164

if self._nodes_by_key is None:

165

return

166

key_dict = self._nodes_by_key

167

if self.reference_lists:

168

key_value = key, value, node_refs

169

else:

170

key_value = key, value

171

for subkey in key[:-1]:

172

key_dict = key_dict.setdefault(subkey, {})

173

key_dict[key[-1]] = key_value

174

175

def _check_key_ref_value(self, key, references, value):

176

"""Check that 'key' and 'references' are all valid.

177

178

:param key: A key tuple. Must conform to the key interface (be a tuple,

179

be of the right length, not have any whitespace or nulls in any key

180

element.)

181

:param references: An iterable of reference lists. Something like

182

[[(ref, key)], [(ref, key), (other, key)]]

183

:param value: The value associate with this key. Must not contain

184

newlines or null characters.

185

:return: (node_refs, absent_references)

186

node_refs basically a packed form of 'references' where all

187

iterables are tuples

188

absent_references reference keys that are not in self._nodes.

189

This may contain duplicates if the same key is

190

referenced in multiple lists.

191

"""

192

self._check_key(key)

193

if _newline_null_re.search(value) is not None:

194

raise errors.BadIndexValue(value)

195

if len(references) != self.reference_lists:

196

raise errors.BadIndexValue(references)

197

node_refs = []

198

absent_references = []

199

for reference_list in references:

200

for reference in reference_list:

201

# If reference *is* in self._nodes, then we know it has already

202

# been checked.

203

if reference not in self._nodes:

204

self._check_key(reference)

205

absent_references.append(reference)

206

node_refs.append(tuple(reference_list))

207

return tuple(node_refs), absent_references

208

209

def add_node(self, key, value, references=()):

210

"""Add a node to the index.

211

212

:param key: The key. keys are non-empty tuples containing

213

as many whitespace-free utf8 bytestrings as the key length

214

defined for this index.

215

:param references: An iterable of iterables of keys. Each is a

216

reference to another key.

217

:param value: The value to associate with the key. It may be any

218

bytes as long as it does not contain \0 or \n.

219

"""

220

(node_refs,

221

absent_references) = self._check_key_ref_value(key, references, value)

222

if key in self._nodes and self._nodes[key][0] != 'a':

223

raise errors.BadIndexDuplicateKey(key, self)

224

for reference in absent_references:

225

# There may be duplicates, but I don't think it is worth worrying

226

# about

227

self._nodes[reference] = ('a', (), '')

228

self._nodes[key] = ('', node_refs, value)

229

self._keys.add(key)

230

if self._nodes_by_key is not None and self._key_length > 1:

231

self._update_nodes_by_key(key, value, node_refs)

232

233

def finish(self):

234

lines = [_SIGNATURE]

235

lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')

236

lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')

237

lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')

238

prefix_length = sum(len(x) for x in lines)

239

# references are byte offsets. To avoid having to do nasty

240

# polynomial work to resolve offsets (references to later in the

241

# file cannot be determined until all the inbetween references have

242

# been calculated too) we pad the offsets with 0's to make them be

243

# of consistent length. Using binary offsets would break the trivial

244

# file parsing.

245

# to calculate the width of zero's needed we do three passes:

246

# one to gather all the non-reference data and the number of references.

247

# one to pad all the data with reference-length and determine entry

248

# addresses.

249

# One to serialise.

250

251

# forward sorted by key. In future we may consider topological sorting,

252

# at the cost of table scans for direct lookup, or a second index for

253

# direct lookup

254

nodes = sorted(self._nodes.items())

255

# if we do not prepass, we don't know how long it will be up front.

256

expected_bytes = None

257

# we only need to pre-pass if we have reference lists at all.

258

if self.reference_lists:

259

key_offset_info = []

260

non_ref_bytes = prefix_length

261

total_references = 0

262

# TODO use simple multiplication for the constants in this loop.

263

for key, (absent, references, value) in nodes:

264

# record the offset known *so far* for this key:

265

# the non reference bytes to date, and the total references to

266

# date - saves reaccumulating on the second pass

267

key_offset_info.append((key, non_ref_bytes, total_references))

268

# key is literal, value is literal, there are 3 null's, 1 NL

269

# key is variable length tuple, \x00 between elements

270

non_ref_bytes += sum(len(element) for element in key)

271

if self._key_length > 1:

272

non_ref_bytes += self._key_length - 1

273

# value is literal bytes, there are 3 null's, 1 NL.

274

non_ref_bytes += len(value) + 3 + 1

275

# one byte for absent if set.

276

if absent:

277

non_ref_bytes += 1

278

elif self.reference_lists:

279

# (ref_lists -1) tabs

280

non_ref_bytes += self.reference_lists - 1

281

# (ref-1 cr's per ref_list)

282

for ref_list in references:

283

# how many references across the whole file?

284

total_references += len(ref_list)

285

# accrue reference separators

286

if ref_list:

287

non_ref_bytes += len(ref_list) - 1

288

# how many digits are needed to represent the total byte count?

289

digits = 1

290

possible_total_bytes = non_ref_bytes + total_references*digits

291

while 10 ** digits < possible_total_bytes:

292

digits += 1

293

possible_total_bytes = non_ref_bytes + total_references*digits

294

expected_bytes = possible_total_bytes + 1 # terminating newline

295

# resolve key addresses.

296

key_addresses = {}

297

for key, non_ref_bytes, total_references in key_offset_info:

298

key_addresses[key] = non_ref_bytes + total_references*digits

299

# serialise

300

format_string = '%%0%sd' % digits

301

for key, (absent, references, value) in nodes:

302

flattened_references = []

303

for ref_list in references:

304

ref_addresses = []

305

for reference in ref_list:

306

ref_addresses.append(format_string % key_addresses[reference])

307

flattened_references.append('\r'.join(ref_addresses))

308

string_key = '\x00'.join(key)

309

lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,

310

'\t'.join(flattened_references), value))

311

lines.append('\n')

312

result = StringIO(''.join(lines))

313

if expected_bytes and len(result.getvalue()) != expected_bytes:

314

raise errors.BzrError('Failed index creation. Internal error:'

315

' mismatched output length and expected length: %d %d' %

316

(len(result.getvalue()), expected_bytes))

317

return result

318

319

def set_optimize(self, for_size=None, combine_backing_indices=None):

320

"""Change how the builder tries to optimize the result.

321

322

:param for_size: Tell the builder to try and make the index as small as

323

possible.

324

:param combine_backing_indices: If the builder spills to disk to save

325

memory, should the on-disk indices be combined. Set to True if you

326

are going to be probing the index, but to False if you are not. (If

327

you are not querying, then the time spent combining is wasted.)

328

:return: None

329

"""

330

# GraphIndexBuilder itself doesn't pay attention to the flag yet, but

331

# other builders do.

332

if for_size is not None:

333

self._optimize_for_size = for_size

334

if combine_backing_indices is not None:

335

self._combine_backing_indices = combine_backing_indices

336

337

338

class GraphIndex(object):

339

"""An index for data with embedded graphs.

340

341

The index maps keys to a list of key reference lists, and a value.

342

Each node has the same number of key reference lists. Each key reference

343

list can be empty or an arbitrary length. The value is an opaque NULL

344

terminated string without any newlines. The storage of the index is

345

hidden in the interface: keys and key references are always tuples of

346

bytestrings, never the internal representation (e.g. dictionary offsets).

347

348

It is presumed that the index will not be mutated - it is static data.

349

350

Successive iter_all_entries calls will read the entire index each time.

351

Additionally, iter_entries calls will read the index linearly until the

352

desired keys are found. XXX: This must be fixed before the index is

353

suitable for production use. :XXX

354

"""

355

356

def __init__(self, transport, name, size):

357

"""Open an index called name on transport.

358

359

:param transport: A bzrlib.transport.Transport.

360

:param name: A path to provide to transport API calls.

361

:param size: The size of the index in bytes. This is used for bisection

362

logic to perform partial index reads. While the size could be

363

obtained by statting the file this introduced an additional round

364

trip as well as requiring stat'able transports, both of which are

365

avoided by having it supplied. If size is None, then bisection

366

support will be disabled and accessing the index will just stream

367

all the data.

368

"""

369

self._transport = transport

370

self._name = name

371

# Becomes a dict of key:(value, reference-list-byte-locations) used by

372

# the bisection interface to store parsed but not resolved keys.

373

self._bisect_nodes = None

374

# Becomes a dict of key:(value, reference-list-keys) which are ready to

375

# be returned directly to callers.

376

self._nodes = None

377

# a sorted list of slice-addresses for the parsed bytes of the file.

378

# e.g. (0,1) would mean that byte 0 is parsed.

379

self._parsed_byte_map = []

380

# a sorted list of keys matching each slice address for parsed bytes

381

# e.g. (None, 'foo@bar') would mean that the first byte contained no

382

# key, and the end byte of the slice is the of the data for 'foo@bar'

383

self._parsed_key_map = []

384

self._key_count = None

385

self._keys_by_offset = None

386

self._nodes_by_key = None

387

self._size = size

388

# The number of bytes we've read so far in trying to process this file

389

self._bytes_read = 0

390

391

def __eq__(self, other):

392

"""Equal when self and other were created with the same parameters."""

393

return (

394

type(self) == type(other) and

395

self._transport == other._transport and

396

self._name == other._name and

397

self._size == other._size)

398

399

def __ne__(self, other):

400

return not self.__eq__(other)

401

402

def __repr__(self):

403

return "%s(%r)" % (self.__class__.__name__,

404

self._transport.abspath(self._name))

405

406

def _buffer_all(self, stream=None):

407

"""Buffer all the index data.

408

409

Mutates self._nodes and self.keys_by_offset.

410

"""

411

if self._nodes is not None:

412

# We already did this

413

return

414

if 'index' in debug.debug_flags:

415

mutter('Reading entire index %s', self._transport.abspath(self._name))

416

if stream is None:

417

stream = self._transport.get(self._name)

418

self._read_prefix(stream)

419

self._expected_elements = 3 + self._key_length

420

line_count = 0

421

# raw data keyed by offset

422

self._keys_by_offset = {}

423

# ready-to-return key:value or key:value, node_ref_lists

424

self._nodes = {}

425

self._nodes_by_key = None

426

trailers = 0

427

pos = stream.tell()

428

lines = stream.read().split('\n')

429

del lines[-1]

430

_, _, _, trailers = self._parse_lines(lines, pos)

431

for key, absent, references, value in self._keys_by_offset.itervalues():

432

if absent:

433

continue

434

# resolve references:

435

if self.node_ref_lists:

436

node_value = (value, self._resolve_references(references))

437

else:

438

node_value = value

439

self._nodes[key] = node_value

440

# cache the keys for quick set intersections

441

self._keys = set(self._nodes)

442

if trailers != 1:

443

# there must be one line - the empty trailer line.

444

raise errors.BadIndexData(self)

445

446

def external_references(self, ref_list_num):

447

"""Return references that are not present in this index.

448

"""

449

self._buffer_all()

450

if ref_list_num + 1 > self.node_ref_lists:

451

raise ValueError('No ref list %d, index has %d ref lists'

452

% (ref_list_num, self.node_ref_lists))

453

refs = set()

454

for key, (value, ref_lists) in self._nodes.iteritems():

455

ref_list = ref_lists[ref_list_num]

456

refs.update(ref_list)

457

return refs - self._keys

458

459

def _get_nodes_by_key(self):

460

if self._nodes_by_key is None:

461

nodes_by_key = {}

462

if self.node_ref_lists:

463

for key, (value, references) in self._nodes.iteritems():

464

key_dict = nodes_by_key

465

for subkey in key[:-1]:

466

key_dict = key_dict.setdefault(subkey, {})

467

key_dict[key[-1]] = key, value, references

468

else:

469

for key, value in self._nodes.iteritems():

470

key_dict = nodes_by_key

471

for subkey in key[:-1]:

472

key_dict = key_dict.setdefault(subkey, {})

473

key_dict[key[-1]] = key, value

474

self._nodes_by_key = nodes_by_key

475

return self._nodes_by_key

476

477

def iter_all_entries(self):

478

"""Iterate over all keys within the index.

479

480

:return: An iterable of (index, key, value) or (index, key, value, reference_lists).

481

The former tuple is used when there are no reference lists in the

482

index, making the API compatible with simple key:value index types.

483

There is no defined order for the result iteration - it will be in

484

the most efficient order for the index.

485

"""

486

if 'evil' in debug.debug_flags:

487

trace.mutter_callsite(3,

488

"iter_all_entries scales with size of history.")

489

if self._nodes is None:

490

self._buffer_all()

491

if self.node_ref_lists:

492

for key, (value, node_ref_lists) in self._nodes.iteritems():

493

yield self, key, value, node_ref_lists

494

else:

495

for key, value in self._nodes.iteritems():

496

yield self, key, value

497

498

def _read_prefix(self, stream):

499

signature = stream.read(len(self._signature()))

500

if not signature == self._signature():

501

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

502

options_line = stream.readline()

503

if not options_line.startswith(_OPTION_NODE_REFS):

504

raise errors.BadIndexOptions(self)

505

try:

506

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):-1])

507

except ValueError:

508

raise errors.BadIndexOptions(self)

509

options_line = stream.readline()

510

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

511

raise errors.BadIndexOptions(self)

512

try:

513

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):-1])

514

except ValueError:

515

raise errors.BadIndexOptions(self)

516

options_line = stream.readline()

517

if not options_line.startswith(_OPTION_LEN):

518

raise errors.BadIndexOptions(self)

519

try:

520

self._key_count = int(options_line[len(_OPTION_LEN):-1])

521

except ValueError:

522

raise errors.BadIndexOptions(self)

523

524

def _resolve_references(self, references):

525

"""Return the resolved key references for references.

526

527

References are resolved by looking up the location of the key in the

528

_keys_by_offset map and substituting the key name, preserving ordering.

529

530

:param references: An iterable of iterables of key locations. e.g.

531

[[123, 456], [123]]

532

:return: A tuple of tuples of keys.

533

"""

534

node_refs = []

535

for ref_list in references:

536

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

537

return tuple(node_refs)

538

539

def _find_index(self, range_map, key):

540

"""Helper for the _parsed_*_index calls.

541

542

Given a range map - [(start, end), ...], finds the index of the range

543

in the map for key if it is in the map, and if it is not there, the

544

immediately preceeding range in the map.

545

"""

546

result = bisect_right(range_map, key) - 1

547

if result + 1 < len(range_map):

548

# check the border condition, it may be in result + 1

549

if range_map[result + 1][0] == key[0]:

550

return result + 1

551

return result

552

553

def _parsed_byte_index(self, offset):

554

"""Return the index of the entry immediately before offset.

555

556

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

557

there is one unparsed byte (the 11th, addressed as[10]). then:

558

asking for 0 will return 0

559

asking for 10 will return 0

560

asking for 11 will return 1

561

asking for 12 will return 1

562

"""

563

key = (offset, 0)

564

return self._find_index(self._parsed_byte_map, key)

565

566

def _parsed_key_index(self, key):

567

"""Return the index of the entry immediately before key.

568

569

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

570

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

571

have been parsed, then:

572

asking for '' will return 0

573

asking for 'a' will return 0

574

asking for 'b' will return 1

575

asking for 'e' will return 1

576

"""

577

search_key = (key, None)

578

return self._find_index(self._parsed_key_map, search_key)

579

580

def _is_parsed(self, offset):

581

"""Returns True if offset has been parsed."""

582

index = self._parsed_byte_index(offset)

583

if index == len(self._parsed_byte_map):

584

return offset < self._parsed_byte_map[index - 1][1]

585

start, end = self._parsed_byte_map[index]

586

return offset >= start and offset < end

587

588

def _iter_entries_from_total_buffer(self, keys):

589

"""Iterate over keys when the entire index is parsed."""

590

keys = keys.intersection(self._keys)

591

if self.node_ref_lists:

592

for key in keys:

593

value, node_refs = self._nodes[key]

594

yield self, key, value, node_refs

595

else:

596

for key in keys:

597

yield self, key, self._nodes[key]

598

599

def iter_entries(self, keys):

600

"""Iterate over keys within the index.

601

602

:param keys: An iterable providing the keys to be retrieved.

603

:return: An iterable as per iter_all_entries, but restricted to the

604

keys supplied. No additional keys will be returned, and every

605

key supplied that is in the index will be returned.

606

"""

607

keys = set(keys)

608

if not keys:

609

return []

610

if self._size is None and self._nodes is None:

611

self._buffer_all()

612

613

# We fit about 20 keys per minimum-read (4K), so if we are looking for

614

# more than 1/20th of the index its likely (assuming homogenous key

615

# spread) that we'll read the entire index. If we're going to do that,

616

# buffer the whole thing. A better analysis might take key spread into

617

# account - but B+Tree indices are better anyway.

618

# We could look at all data read, and use a threshold there, which will

619

# trigger on ancestry walks, but that is not yet fully mapped out.

620

if self._nodes is None and len(keys) * 20 > self.key_count():

621

self._buffer_all()

622

if self._nodes is not None:

623

return self._iter_entries_from_total_buffer(keys)

624

else:

625

return (result[1] for result in bisect_multi_bytes(

626

self._lookup_keys_via_location, self._size, keys))

627

628

def iter_entries_prefix(self, keys):

629

"""Iterate over keys within the index using prefix matching.

630

631

Prefix matching is applied within the tuple of a key, not to within

632

the bytestring of each key element. e.g. if you have the keys ('foo',

633

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

634

only the former key is returned.

635

636

WARNING: Note that this method currently causes a full index parse

637

unconditionally (which is reasonably appropriate as it is a means for

638

thunking many small indices into one larger one and still supplies

639

iter_all_entries at the thunk layer).

640

641

:param keys: An iterable providing the key prefixes to be retrieved.

642

Each key prefix takes the form of a tuple the length of a key, but

643

with the last N elements 'None' rather than a regular bytestring.

644

The first element cannot be 'None'.

645

:return: An iterable as per iter_all_entries, but restricted to the

646

keys with a matching prefix to those supplied. No additional keys

647

will be returned, and every match that is in the index will be

648

returned.

649

"""

650

keys = set(keys)

651

if not keys:

652

return

653

# load data - also finds key lengths

654

if self._nodes is None:

655

self._buffer_all()

656

if self._key_length == 1:

657

for key in keys:

658

# sanity check

659

if key[0] is None:

660

raise errors.BadIndexKey(key)

661

if len(key) != self._key_length:

662

raise errors.BadIndexKey(key)

663

if self.node_ref_lists:

664

value, node_refs = self._nodes[key]

665

yield self, key, value, node_refs

666

else:

667

yield self, key, self._nodes[key]

668

return

669

nodes_by_key = self._get_nodes_by_key()

670

for key in keys:

671

# sanity check

672

if key[0] is None:

673

raise errors.BadIndexKey(key)

674

if len(key) != self._key_length:

675

raise errors.BadIndexKey(key)

676

# find what it refers to:

677

key_dict = nodes_by_key

678

elements = list(key)

679

# find the subdict whose contents should be returned.

680

try:

681

while len(elements) and elements[0] is not None:

682

key_dict = key_dict[elements[0]]

683

elements.pop(0)

684

except KeyError:

685

# a non-existant lookup.

686

continue

687

if len(elements):

688

dicts = [key_dict]

689

while dicts:

690

key_dict = dicts.pop(-1)

691

# can't be empty or would not exist

692

item, value = key_dict.iteritems().next()

693

if type(value) == dict:

694

# push keys

695

dicts.extend(key_dict.itervalues())

696

else:

697

# yield keys

698

for value in key_dict.itervalues():

699

# each value is the key:value:node refs tuple

700

# ready to yield.

701

yield (self, ) + value

702

else:

703

# the last thing looked up was a terminal element

704

yield (self, ) + key_dict

705

706

def key_count(self):

707

"""Return an estimate of the number of keys in this index.

708

709

For GraphIndex the estimate is exact.

710

"""

711

if self._key_count is None:

712

self._read_and_parse([_HEADER_READV])

713

return self._key_count

714

715

def _lookup_keys_via_location(self, location_keys):

716

"""Public interface for implementing bisection.

717

718

If _buffer_all has been called, then all the data for the index is in

719

memory, and this method should not be called, as it uses a separate

720

cache because it cannot pre-resolve all indices, which buffer_all does

721

for performance.

722

723

:param location_keys: A list of location(byte offset), key tuples.

724

:return: A list of (location_key, result) tuples as expected by

725

bzrlib.bisect_multi.bisect_multi_bytes.

726

"""

727

# Possible improvements:

728

# - only bisect lookup each key once

729

# - sort the keys first, and use that to reduce the bisection window

730

# -----

731

# this progresses in three parts:

732

# read data

733

# parse it

734

# attempt to answer the question from the now in memory data.

735

# build the readv request

736

# for each location, ask for 800 bytes - much more than rows we've seen

737

# anywhere.

738

readv_ranges = []

739

for location, key in location_keys:

740

# can we answer from cache?

741

if self._bisect_nodes and key in self._bisect_nodes:

742

# We have the key parsed.

743

continue

744

index = self._parsed_key_index(key)

745

if (len(self._parsed_key_map) and

746

self._parsed_key_map[index][0] <= key and

747

(self._parsed_key_map[index][1] >= key or

748

# end of the file has been parsed

749

self._parsed_byte_map[index][1] == self._size)):

750

# the key has been parsed, so no lookup is needed even if its

751

# not present.

752

continue

753

# - if we have examined this part of the file already - yes

754

index = self._parsed_byte_index(location)

755

if (len(self._parsed_byte_map) and

756

self._parsed_byte_map[index][0] <= location and

757

self._parsed_byte_map[index][1] > location):

758

# the byte region has been parsed, so no read is needed.

759

continue

760

length = 800

761

if location + length > self._size:

762

length = self._size - location

763

# todo, trim out parsed locations.

764

if length > 0:

765

readv_ranges.append((location, length))

766

# read the header if needed

767

if self._bisect_nodes is None:

768

readv_ranges.append(_HEADER_READV)

769

self._read_and_parse(readv_ranges)

770

result = []

771

if self._nodes is not None:

772

# _read_and_parse triggered a _buffer_all because we requested the

773

# whole data range

774

for location, key in location_keys:

775

if key not in self._nodes: # not present

776

result.append(((location, key), False))

777

elif self.node_ref_lists:

778

value, refs = self._nodes[key]

779

result.append(((location, key),

780

(self, key, value, refs)))

781

else:

782

result.append(((location, key),

783

(self, key, self._nodes[key])))

784

return result

785

# generate results:

786

# - figure out <, >, missing, present

787

# - result present references so we can return them.

788

# keys that we cannot answer until we resolve references

789

pending_references = []

790

pending_locations = set()

791

for location, key in location_keys:

792

# can we answer from cache?

793

if key in self._bisect_nodes:

794

# the key has been parsed, so no lookup is needed

795

if self.node_ref_lists:

796

# the references may not have been all parsed.

797

value, refs = self._bisect_nodes[key]

798

wanted_locations = []

799

for ref_list in refs:

800

for ref in ref_list:

801

if ref not in self._keys_by_offset:

802

wanted_locations.append(ref)

803

if wanted_locations:

804

pending_locations.update(wanted_locations)

805

pending_references.append((location, key))

806

continue

807

result.append(((location, key), (self, key,

808

value, self._resolve_references(refs))))

809

else:

810

result.append(((location, key),

811

(self, key, self._bisect_nodes[key])))

812

continue

813

else:

814

# has the region the key should be in, been parsed?

815

index = self._parsed_key_index(key)

816

if (self._parsed_key_map[index][0] <= key and

817

(self._parsed_key_map[index][1] >= key or

818

# end of the file has been parsed

819

self._parsed_byte_map[index][1] == self._size)):

820

result.append(((location, key), False))

821

continue

822

# no, is the key above or below the probed location:

823

# get the range of the probed & parsed location

824

index = self._parsed_byte_index(location)

825

# if the key is below the start of the range, its below

826

if key < self._parsed_key_map[index][0]:

827

direction = -1

828

else:

829

direction = +1

830

result.append(((location, key), direction))

831

readv_ranges = []

832

# lookup data to resolve references

833

for location in pending_locations:

834

length = 800

835

if location + length > self._size:

836

length = self._size - location

837

# TODO: trim out parsed locations (e.g. if the 800 is into the

838

# parsed region trim it, and dont use the adjust_for_latency

839

# facility)

840

if length > 0:

841

readv_ranges.append((location, length))

842

self._read_and_parse(readv_ranges)

843

if self._nodes is not None:

844

# The _read_and_parse triggered a _buffer_all, grab the data and

845

# return it

846

for location, key in pending_references:

847

value, refs = self._nodes[key]

848

result.append(((location, key), (self, key, value, refs)))

849

return result

850

for location, key in pending_references:

851

# answer key references we had to look-up-late.

852

value, refs = self._bisect_nodes[key]

853

result.append(((location, key), (self, key,

854

value, self._resolve_references(refs))))

855

return result

856

857

def _parse_header_from_bytes(self, bytes):

858

"""Parse the header from a region of bytes.

859

860

:param bytes: The data to parse.

861

:return: An offset, data tuple such as readv yields, for the unparsed

862

data. (which may length 0).

863

"""

864

signature = bytes[0:len(self._signature())]

865

if not signature == self._signature():

866

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

867

lines = bytes[len(self._signature()):].splitlines()

868

options_line = lines[0]

869

if not options_line.startswith(_OPTION_NODE_REFS):

870

raise errors.BadIndexOptions(self)

871

try:

872

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):])

873

except ValueError:

874

raise errors.BadIndexOptions(self)

875

options_line = lines[1]

876

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

877

raise errors.BadIndexOptions(self)

878

try:

879

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):])

880

except ValueError:

881

raise errors.BadIndexOptions(self)

882

options_line = lines[2]

883

if not options_line.startswith(_OPTION_LEN):

884

raise errors.BadIndexOptions(self)

885

try:

886

self._key_count = int(options_line[len(_OPTION_LEN):])

887

except ValueError:

888

raise errors.BadIndexOptions(self)

889

# calculate the bytes we have processed

890

header_end = (len(signature) + len(lines[0]) + len(lines[1]) +

891

len(lines[2]) + 3)

892

self._parsed_bytes(0, None, header_end, None)

893

# setup parsing state

894

self._expected_elements = 3 + self._key_length

895

# raw data keyed by offset

896

self._keys_by_offset = {}

897

# keys with the value and node references

898

self._bisect_nodes = {}

899

return header_end, bytes[header_end:]

900

901

def _parse_region(self, offset, data):

902

"""Parse node data returned from a readv operation.

903

904

:param offset: The byte offset the data starts at.

905

:param data: The data to parse.

906

"""

907

# trim the data.

908

# end first:

909

end = offset + len(data)

910

high_parsed = offset

911

while True:

912

# Trivial test - if the current index's end is within the

913

# low-matching parsed range, we're done.

914

index = self._parsed_byte_index(high_parsed)

915

if end < self._parsed_byte_map[index][1]:

916

return

917

# print "[%d:%d]" % (offset, end), \

918

# self._parsed_byte_map[index:index + 2]

919

high_parsed, last_segment = self._parse_segment(

920

offset, data, end, index)

921

if last_segment:

922

return

923

924

def _parse_segment(self, offset, data, end, index):

925

"""Parse one segment of data.

926

927

:param offset: Where 'data' begins in the file.

928

:param data: Some data to parse a segment of.

929

:param end: Where data ends

930

:param index: The current index into the parsed bytes map.

931

:return: True if the parsed segment is the last possible one in the

932

range of data.

933

:return: high_parsed_byte, last_segment.

934

high_parsed_byte is the location of the highest parsed byte in this

935

segment, last_segment is True if the parsed segment is the last

936

possible one in the data block.

937

"""

938

# default is to use all data

939

trim_end = None

940

# accomodate overlap with data before this.

941

if offset < self._parsed_byte_map[index][1]:

942

# overlaps the lower parsed region

943

# skip the parsed data

944

trim_start = self._parsed_byte_map[index][1] - offset

945

# don't trim the start for \n

946

start_adjacent = True

947

elif offset == self._parsed_byte_map[index][1]:

948

# abuts the lower parsed region

949

# use all data

950

trim_start = None

951

# do not trim anything

952

start_adjacent = True

953

else:

954

# does not overlap the lower parsed region

955

# use all data

956

trim_start = None

957

# but trim the leading \n

958

start_adjacent = False

959

if end == self._size:

960

# lines up to the end of all data:

961

# use it all

962

trim_end = None

963

# do not strip to the last \n

964

end_adjacent = True

965

last_segment = True

966

elif index + 1 == len(self._parsed_byte_map):

967

# at the end of the parsed data

968

# use it all

969

trim_end = None

970

# but strip to the last \n

971

end_adjacent = False

972

last_segment = True

973

elif end == self._parsed_byte_map[index + 1][0]:

974

# buts up against the next parsed region

975

# use it all

976

trim_end = None

977

# do not strip to the last \n

978

end_adjacent = True

979

last_segment = True

980

elif end > self._parsed_byte_map[index + 1][0]:

981

# overlaps into the next parsed region

982

# only consider the unparsed data

983

trim_end = self._parsed_byte_map[index + 1][0] - offset

984

# do not strip to the last \n as we know its an entire record

985

end_adjacent = True

986

last_segment = end < self._parsed_byte_map[index + 1][1]

987

else:

988

# does not overlap into the next region

989

# use it all

990

trim_end = None

991

# but strip to the last \n

992

end_adjacent = False

993

last_segment = True

994

# now find bytes to discard if needed

995

if not start_adjacent:

996

# work around python bug in rfind

997

if trim_start is None:

998

trim_start = data.find('\n') + 1

999

else:

1000

trim_start = data.find('\n', trim_start) + 1

1001

if not (trim_start != 0):

1002

raise AssertionError('no \n was present')

1003

# print 'removing start', offset, trim_start, repr(data[:trim_start])

1004

if not end_adjacent:

1005

# work around python bug in rfind

1006

if trim_end is None:

1007

trim_end = data.rfind('\n') + 1

1008

else:

1009

trim_end = data.rfind('\n', None, trim_end) + 1

1010

if not (trim_end != 0):

1011

raise AssertionError('no \n was present')

1012

# print 'removing end', offset, trim_end, repr(data[trim_end:])

1013

# adjust offset and data to the parseable data.

1014

trimmed_data = data[trim_start:trim_end]

1015

if not (trimmed_data):

1016

raise AssertionError('read unneeded data [%d:%d] from [%d:%d]'

1017

% (trim_start, trim_end, offset, offset + len(data)))

1018

if trim_start:

1019

offset += trim_start

1020

# print "parsing", repr(trimmed_data)

1021

# splitlines mangles the \r delimiters.. don't use it.

1022

lines = trimmed_data.split('\n')

1023

del lines[-1]

1024

pos = offset

1025

first_key, last_key, nodes, _ = self._parse_lines(lines, pos)

1026

for key, value in nodes:

1027

self._bisect_nodes[key] = value

1028

self._parsed_bytes(offset, first_key,

1029

offset + len(trimmed_data), last_key)

1030

return offset + len(trimmed_data), last_segment

1031

1032

def _parse_lines(self, lines, pos):

1033

key = None

1034

first_key = None

1035

trailers = 0

1036

nodes = []

1037

for line in lines:

1038

if line == '':

1039

# must be at the end

1040

if self._size:

1041

if not (self._size == pos + 1):

1042

raise AssertionError("%s %s" % (self._size, pos))

1043

trailers += 1

1044

continue

1045

elements = line.split('\0')

1046

if len(elements) != self._expected_elements:

1047

raise errors.BadIndexData(self)

1048

# keys are tuples. Each element is a string that may occur many

1049

# times, so we intern them to save space. AB, RC, 200807

1050

key = tuple([intern(element) for element in elements[:self._key_length]])

1051

if first_key is None:

1052

first_key = key

1053

absent, references, value = elements[-3:]

1054

ref_lists = []

1055

for ref_string in references.split('\t'):

1056

ref_lists.append(tuple([

1057

int(ref) for ref in ref_string.split('\r') if ref

1058

]))

1059

ref_lists = tuple(ref_lists)

1060

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

1061

pos += len(line) + 1 # +1 for the \n

1062

if absent:

1063

continue

1064

if self.node_ref_lists:

1065

node_value = (value, ref_lists)

1066

else:

1067

node_value = value

1068

nodes.append((key, node_value))

1069

# print "parsed ", key

1070

return first_key, key, nodes, trailers

1071

1072

def _parsed_bytes(self, start, start_key, end, end_key):

1073

"""Mark the bytes from start to end as parsed.

1074

1075

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

1076

1) as parsed.

1077

1078

:param start: The start of the parsed region.

1079

:param end: The end of the parsed region.

1080

"""

1081

index = self._parsed_byte_index(start)

1082

new_value = (start, end)

1083

new_key = (start_key, end_key)

1084

if index == -1:

1085

# first range parsed is always the beginning.

1086

self._parsed_byte_map.insert(index, new_value)

1087

self._parsed_key_map.insert(index, new_key)

1088

return

1089

# four cases:

1090

# new region

1091

# extend lower region

1092

# extend higher region

1093

# combine two regions

1094

if (index + 1 < len(self._parsed_byte_map) and

1095

self._parsed_byte_map[index][1] == start and

1096

self._parsed_byte_map[index + 1][0] == end):

1097

# combine two regions

1098

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

1099

self._parsed_byte_map[index + 1][1])

1100

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

1101

self._parsed_key_map[index + 1][1])

1102

del self._parsed_byte_map[index + 1]

1103

del self._parsed_key_map[index + 1]

1104

elif self._parsed_byte_map[index][1] == start:

1105

# extend the lower entry

1106

self._parsed_byte_map[index] = (

1107

self._parsed_byte_map[index][0], end)

1108

self._parsed_key_map[index] = (

1109

self._parsed_key_map[index][0], end_key)

1110

elif (index + 1 < len(self._parsed_byte_map) and

1111

self._parsed_byte_map[index + 1][0] == end):

1112

# extend the higher entry

1113

self._parsed_byte_map[index + 1] = (

1114

start, self._parsed_byte_map[index + 1][1])

1115

self._parsed_key_map[index + 1] = (

1116

start_key, self._parsed_key_map[index + 1][1])

1117

else:

1118

# new entry

1119

self._parsed_byte_map.insert(index + 1, new_value)

1120

self._parsed_key_map.insert(index + 1, new_key)

1121

1122

def _read_and_parse(self, readv_ranges):

1123

"""Read the the ranges and parse the resulting data.

1124

1125

:param readv_ranges: A prepared readv range list.

1126

"""

1127

if not readv_ranges:

1128

return

1129

if self._nodes is None and self._bytes_read * 2 >= self._size:

1130

# We've already read more than 50% of the file and we are about to

1131

# request more data, just _buffer_all() and be done

1132

self._buffer_all()

1133

return

1134

1135

readv_data = self._transport.readv(self._name, readv_ranges, True,

1136

self._size)

1137

# parse

1138

for offset, data in readv_data:

1139

self._bytes_read += len(data)

1140

if offset == 0 and len(data) == self._size:

1141

# We read the whole range, most likely because the

1142

# Transport upcast our readv ranges into one long request

1143

# for enough total data to grab the whole index.

1144

self._buffer_all(StringIO(data))

1145

return

1146

if self._bisect_nodes is None:

1147

# this must be the start

1148

if not (offset == 0):

1149

raise AssertionError()

1150

offset, data = self._parse_header_from_bytes(data)

1151

# print readv_ranges, "[%d:%d]" % (offset, offset + len(data))

1152

self._parse_region(offset, data)

1153

1154

def _signature(self):

1155

"""The file signature for this index type."""

1156

return _SIGNATURE

1157

1158

def validate(self):

1159

"""Validate that everything in the index can be accessed."""

1160

# iter_all validates completely at the moment, so just do that.

1161

for node in self.iter_all_entries():

1162

pass

1163

1164

1165

class CombinedGraphIndex(object):

1166

"""A GraphIndex made up from smaller GraphIndices.

1167

1168

The backing indices must implement GraphIndex, and are presumed to be

1169

static data.

1170

1171

Queries against the combined index will be made against the first index,

1172

and then the second and so on. The order of index's can thus influence

1173

performance significantly. For example, if one index is on local disk and a

1174

second on a remote server, the local disk index should be before the other

1175

in the index list.

1176

"""

1177

1178

def __init__(self, indices, reload_func=None):

1179

"""Create a CombinedGraphIndex backed by indices.

1180

1181

:param indices: An ordered list of indices to query for data.

1182

:param reload_func: A function to call if we find we are missing an

1183

index. Should have the form reload_func() => True/False to indicate

1184

if reloading actually changed anything.

1185

"""

1186

self._indices = indices

1187

self._reload_func = reload_func

1188

1189

def __repr__(self):

1190

return "%s(%s)" % (

1191

self.__class__.__name__,

1192

', '.join(map(repr, self._indices)))

1193

1194

def get_parent_map(self, keys):

1195

"""See graph._StackedParentsProvider.get_parent_map"""

1196

search_keys = set(keys)

1197

if NULL_REVISION in search_keys:

1198

search_keys.discard(NULL_REVISION)

1199

found_parents = {NULL_REVISION:[]}

1200

else:

1201

found_parents = {}

1202

for index, key, value, refs in self.iter_entries(search_keys):

1203

parents = refs[0]

1204

if not parents:

1205

parents = (NULL_REVISION,)

1206

found_parents[key] = parents

1207

return found_parents

1208

1209

has_key = _has_key_from_parent_map

1210

1211

def insert_index(self, pos, index):

1212

"""Insert a new index in the list of indices to query.

1213

1214

:param pos: The position to insert the index.

1215

:param index: The index to insert.

1216

"""

1217

self._indices.insert(pos, index)

1218

1219

def iter_all_entries(self):

1220

"""Iterate over all keys within the index

1221

1222

Duplicate keys across child indices are presumed to have the same

1223

value and are only reported once.

1224

1225

:return: An iterable of (index, key, reference_lists, value).

1226

There is no defined order for the result iteration - it will be in

1227

the most efficient order for the index.

1228

"""

1229

seen_keys = set()

1230

while True:

1231

try:

1232

for index in self._indices:

1233

for node in index.iter_all_entries():

1234

if node[1] not in seen_keys:

1235

yield node

1236

seen_keys.add(node[1])

1237

return

1238

except errors.NoSuchFile:

1239

self._reload_or_raise()

1240

1241

def iter_entries(self, keys):

1242

"""Iterate over keys within the index.

1243

1244

Duplicate keys across child indices are presumed to have the same

1245

value and are only reported once.

1246

1247

:param keys: An iterable providing the keys to be retrieved.

1248

:return: An iterable of (index, key, reference_lists, value). There is no

1249

defined order for the result iteration - it will be in the most

1250

efficient order for the index.

1251

"""

1252

keys = set(keys)

1253

while True:

1254

try:

1255

for index in self._indices:

1256

if not keys:

1257

return

1258

for node in index.iter_entries(keys):

1259

keys.remove(node[1])

1260

yield node

1261

return

1262

except errors.NoSuchFile:

1263

self._reload_or_raise()

1264

1265

def iter_entries_prefix(self, keys):

1266

"""Iterate over keys within the index using prefix matching.

1267

1268

Duplicate keys across child indices are presumed to have the same

1269

value and are only reported once.

1270

1271

Prefix matching is applied within the tuple of a key, not to within

1272

the bytestring of each key element. e.g. if you have the keys ('foo',

1273

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1274

only the former key is returned.

1275

1276

:param keys: An iterable providing the key prefixes to be retrieved.

1277

Each key prefix takes the form of a tuple the length of a key, but

1278

with the last N elements 'None' rather than a regular bytestring.

1279

The first element cannot be 'None'.

1280

:return: An iterable as per iter_all_entries, but restricted to the

1281

keys with a matching prefix to those supplied. No additional keys

1282

will be returned, and every match that is in the index will be

1283

returned.

1284

"""

1285

keys = set(keys)

1286

if not keys:

1287

return

1288

seen_keys = set()

1289

while True:

1290

try:

1291

for index in self._indices:

1292

for node in index.iter_entries_prefix(keys):

1293

if node[1] in seen_keys:

1294

continue

1295

seen_keys.add(node[1])

1296

yield node

1297

return

1298

except errors.NoSuchFile:

1299

self._reload_or_raise()

1300

1301

def key_count(self):

1302

"""Return an estimate of the number of keys in this index.

1303

1304

For CombinedGraphIndex this is approximated by the sum of the keys of

1305

the child indices. As child indices may have duplicate keys this can

1306

have a maximum error of the number of child indices * largest number of

1307

keys in any index.

1308

"""

1309

while True:

1310

try:

1311

return sum((index.key_count() for index in self._indices), 0)

1312

except errors.NoSuchFile:

1313

self._reload_or_raise()

1314

1315

missing_keys = _missing_keys_from_parent_map

1316

1317

def _reload_or_raise(self):

1318

"""We just got a NoSuchFile exception.

1319

1320

Try to reload the indices, if it fails, just raise the current

1321

exception.

1322

"""

1323

if self._reload_func is None:

1324

raise

1325

exc_type, exc_value, exc_traceback = sys.exc_info()

1326

trace.mutter('Trying to reload after getting exception: %s',

1327

exc_value)

1328

if not self._reload_func():

1329

# We tried to reload, but nothing changed, so we fail anyway

1330

trace.mutter('_reload_func indicated nothing has changed.'

1331

' Raising original exception.')

1332

raise exc_type, exc_value, exc_traceback

1333

1334

def validate(self):

1335

"""Validate that everything in the index can be accessed."""

1336

while True:

1337

try:

1338

for index in self._indices:

1339

index.validate()

1340

return

1341

except errors.NoSuchFile:

1342

self._reload_or_raise()

1343

1344

1345

class InMemoryGraphIndex(GraphIndexBuilder):

1346

"""A GraphIndex which operates entirely out of memory and is mutable.

1347

1348

This is designed to allow the accumulation of GraphIndex entries during a

1349

single write operation, where the accumulated entries need to be immediately

1350

available - for example via a CombinedGraphIndex.

1351

"""

1352

1353

def add_nodes(self, nodes):

1354

"""Add nodes to the index.

1355

1356

:param nodes: An iterable of (key, node_refs, value) entries to add.

1357

"""

1358

if self.reference_lists:

1359

for (key, value, node_refs) in nodes:

1360

self.add_node(key, value, node_refs)

1361

else:

1362

for (key, value) in nodes:

1363

self.add_node(key, value)

1364

1365

def iter_all_entries(self):

1366

"""Iterate over all keys within the index

1367

1368

:return: An iterable of (index, key, reference_lists, value). There is no

1369

defined order for the result iteration - it will be in the most

1370

efficient order for the index (in this case dictionary hash order).

1371

"""

1372

if 'evil' in debug.debug_flags:

1373

trace.mutter_callsite(3,

1374

"iter_all_entries scales with size of history.")

1375

if self.reference_lists:

1376

for key, (absent, references, value) in self._nodes.iteritems():

1377

if not absent:

1378

yield self, key, value, references

1379

else:

1380

for key, (absent, references, value) in self._nodes.iteritems():

1381

if not absent:

1382

yield self, key, value

1383

1384

def iter_entries(self, keys):

1385

"""Iterate over keys within the index.

1386

1387

:param keys: An iterable providing the keys to be retrieved.

1388

:return: An iterable of (index, key, value, reference_lists). There is no

1389

defined order for the result iteration - it will be in the most

1390

efficient order for the index (keys iteration order in this case).

1391

"""

1392

keys = set(keys)

1393

if self.reference_lists:

1394

for key in keys.intersection(self._keys):

1395

node = self._nodes[key]

1396

if not node[0]:

1397

yield self, key, node[2], node[1]

1398

else:

1399

for key in keys.intersection(self._keys):

1400

node = self._nodes[key]

1401

if not node[0]:

1402

yield self, key, node[2]

1403

1404

def iter_entries_prefix(self, keys):

1405

"""Iterate over keys within the index using prefix matching.

1406

1407

Prefix matching is applied within the tuple of a key, not to within

1408

the bytestring of each key element. e.g. if you have the keys ('foo',

1409

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1410

only the former key is returned.

1411

1412

:param keys: An iterable providing the key prefixes to be retrieved.

1413

Each key prefix takes the form of a tuple the length of a key, but

1414

with the last N elements 'None' rather than a regular bytestring.

1415

The first element cannot be 'None'.

1416

:return: An iterable as per iter_all_entries, but restricted to the

1417

keys with a matching prefix to those supplied. No additional keys

1418

will be returned, and every match that is in the index will be

1419

returned.

1420

"""

1421

# XXX: To much duplication with the GraphIndex class; consider finding

1422

# a good place to pull out the actual common logic.

1423

keys = set(keys)

1424

if not keys:

1425

return

1426

if self._key_length == 1:

1427

for key in keys:

1428

# sanity check

1429

if key[0] is None:

1430

raise errors.BadIndexKey(key)

1431

if len(key) != self._key_length:

1432

raise errors.BadIndexKey(key)

1433

node = self._nodes[key]

1434

if node[0]:

1435

continue

1436

if self.reference_lists:

1437

yield self, key, node[2], node[1]

1438

else:

1439

yield self, key, node[2]

1440

return

1441

nodes_by_key = self._get_nodes_by_key()

1442

for key in keys:

1443

# sanity check

1444

if key[0] is None:

1445

raise errors.BadIndexKey(key)

1446

if len(key) != self._key_length:

1447

raise errors.BadIndexKey(key)

1448

# find what it refers to:

1449

key_dict = nodes_by_key

1450

elements = list(key)

1451

# find the subdict to return

1452

try:

1453

while len(elements) and elements[0] is not None:

1454

key_dict = key_dict[elements[0]]

1455

elements.pop(0)

1456

except KeyError:

1457

# a non-existant lookup.

1458

continue

1459

if len(elements):

1460

dicts = [key_dict]

1461

while dicts:

1462

key_dict = dicts.pop(-1)

1463

# can't be empty or would not exist

1464

item, value = key_dict.iteritems().next()

1465

if type(value) == dict:

1466

# push keys

1467

dicts.extend(key_dict.itervalues())

1468

else:

1469

# yield keys

1470

for value in key_dict.itervalues():

1471

yield (self, ) + value

1472

else:

1473

yield (self, ) + key_dict

1474

1475

def key_count(self):

1476

"""Return an estimate of the number of keys in this index.

1477

1478

For InMemoryGraphIndex the estimate is exact.

1479

"""

1480

return len(self._keys)

1481

1482

def validate(self):

1483

"""In memory index's have no known corruption at the moment."""

1484

1485

1486

class GraphIndexPrefixAdapter(object):

1487

"""An adapter between GraphIndex with different key lengths.

1488

1489

Queries against this will emit queries against the adapted Graph with the

1490

prefix added, queries for all items use iter_entries_prefix. The returned

1491

nodes will have their keys and node references adjusted to remove the

1492

prefix. Finally, an add_nodes_callback can be supplied - when called the

1493

nodes and references being added will have prefix prepended.

1494

"""

1495

1496

def __init__(self, adapted, prefix, missing_key_length,

1497

add_nodes_callback=None):

1498

"""Construct an adapter against adapted with prefix."""

1499

self.adapted = adapted

1500

self.prefix_key = prefix + (None,)*missing_key_length

1501

self.prefix = prefix

1502

self.prefix_len = len(prefix)

1503

self.add_nodes_callback = add_nodes_callback

1504

1505

def add_nodes(self, nodes):

1506

"""Add nodes to the index.

1507

1508

:param nodes: An iterable of (key, node_refs, value) entries to add.

1509

"""

1510

# save nodes in case its an iterator

1511

nodes = tuple(nodes)

1512

translated_nodes = []

1513

try:

1514

# Add prefix_key to each reference node_refs is a tuple of tuples,

1515

# so split it apart, and add prefix_key to the internal reference

1516

for (key, value, node_refs) in nodes:

1517

adjusted_references = (

1518

tuple(tuple(self.prefix + ref_node for ref_node in ref_list)

1519

for ref_list in node_refs))

1520

translated_nodes.append((self.prefix + key, value,

1521

adjusted_references))

1522

except ValueError:

1523

# XXX: TODO add an explicit interface for getting the reference list

1524

# status, to handle this bit of user-friendliness in the API more

1525

# explicitly.

1526

for (key, value) in nodes:

1527

translated_nodes.append((self.prefix + key, value))

1528

self.add_nodes_callback(translated_nodes)

1529

1530

def add_node(self, key, value, references=()):

1531

"""Add a node to the index.

1532

1533

:param key: The key. keys are non-empty tuples containing

1534

as many whitespace-free utf8 bytestrings as the key length

1535

defined for this index.

1536

:param references: An iterable of iterables of keys. Each is a

1537

reference to another key.

1538

:param value: The value to associate with the key. It may be any

1539

bytes as long as it does not contain \0 or \n.

1540

"""

1541

self.add_nodes(((key, value, references), ))

1542

1543

def _strip_prefix(self, an_iter):

1544

"""Strip prefix data from nodes and return it."""

1545

for node in an_iter:

1546

# cross checks

1547

if node[1][:self.prefix_len] != self.prefix:

1548

raise errors.BadIndexData(self)

1549

for ref_list in node[3]:

1550

for ref_node in ref_list:

1551

if ref_node[:self.prefix_len] != self.prefix:

1552

raise errors.BadIndexData(self)

1553

yield node[0], node[1][self.prefix_len:], node[2], (

1554

tuple(tuple(ref_node[self.prefix_len:] for ref_node in ref_list)

1555

for ref_list in node[3]))

1556

1557

def iter_all_entries(self):

1558

"""Iterate over all keys within the index

1559

1560

iter_all_entries is implemented against the adapted index using

1561

iter_entries_prefix.

1562

1563

:return: An iterable of (index, key, reference_lists, value). There is no

1564

defined order for the result iteration - it will be in the most

1565

efficient order for the index (in this case dictionary hash order).

1566

"""

1567

return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

1568

1569

def iter_entries(self, keys):

1570

"""Iterate over keys within the index.

1571

1572

:param keys: An iterable providing the keys to be retrieved.

1573

:return: An iterable of (index, key, value, reference_lists). There is no

1574

defined order for the result iteration - it will be in the most

1575

efficient order for the index (keys iteration order in this case).

1576

"""

1577

return self._strip_prefix(self.adapted.iter_entries(

1578

self.prefix + key for key in keys))

1579

1580

def iter_entries_prefix(self, keys):

1581

"""Iterate over keys within the index using prefix matching.

1582

1583

Prefix matching is applied within the tuple of a key, not to within

1584

the bytestring of each key element. e.g. if you have the keys ('foo',

1585

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1586

only the former key is returned.

1587

1588

:param keys: An iterable providing the key prefixes to be retrieved.

1589

Each key prefix takes the form of a tuple the length of a key, but

1590

with the last N elements 'None' rather than a regular bytestring.

1591

The first element cannot be 'None'.

1592

:return: An iterable as per iter_all_entries, but restricted to the

1593

keys with a matching prefix to those supplied. No additional keys

1594

will be returned, and every match that is in the index will be

1595

returned.

1596

"""

1597

return self._strip_prefix(self.adapted.iter_entries_prefix(

1598

self.prefix + key for key in keys))

1599

1600

def key_count(self):

1601

"""Return an estimate of the number of keys in this index.

1602

1603

For GraphIndexPrefixAdapter this is relatively expensive - key

1604

iteration with the prefix is done.

1605

"""

1606

return len(list(self.iter_all_entries()))

1607

1608

def validate(self):

1609

"""Call the adapted's validate."""

1610

self.adapted.validate()

Older »