~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Martin Pool
Date: 2009-06-10 02:22:58 UTC
mto: This revision was merged to the branch mainline in revision 4464.
Revision ID: mbp@sourcefrog.net-20090610022258-czra1150uv22976i

textwrap break_on_hyphens option is not available in python2.5

files added:
BRANCH.TODO

COPYING.txt

INSTALL

Makefile

bzr.ico

bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/annotate.py

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/deprecated_graph.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_create_clone.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_iter_merge_sorted_revisions.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_dotted_revno.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_views.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave_commands.py

bzrlib/win32utils.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2-windows.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

doc/news-template.txt

man1

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/generate_docs.py

tools/history2revfiles.py

tools/http_client.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/build_release.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
build-api

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/upgrade.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

plugins/changeset

plugins/changeset/__init__.py

plugins/changeset/apply_changeset.py

plugins/changeset/common.py

plugins/changeset/gen_changeset.py

plugins/changeset/read_changeset.py

plugins/checkperms

testbzr

testsweet.py

urlgrabber

urlgrabber/__init__.py

urlgrabber/byterange.py

urlgrabber/grabber.py

urlgrabber/keepalive.py

urlgrabber/mirror.py

urlgrabber/progress.py

files renamed:
bzrlib/changeset.py => bzrlib/bundle/__init__.py

plugins/ => bzrlib/plugins/

bzrlib/store.py => bzrlib/store/__init__.py

bzrlib/selftest/ => bzrlib/tests/

bzrlib/selftest/teststatus.py => bzrlib/tests/blackbox/test_status.py

bzrlib/selftest/blackbox.py => bzrlib/tests/blackbox/test_too_much.py

bzrlib/selftest/versioning.py => bzrlib/tests/blackbox/test_versioning.py

bzrlib/selftest/testbranch.py => bzrlib/tests/branch_implementations/test_branch.py

bzrlib/selftest/testdiff.py => bzrlib/tests/test_diff.py

bzrlib/selftest/testhashcache.py => bzrlib/tests/test_hashcache.py

bzrlib/selftest/testinv.py => bzrlib/tests/test_inv.py

bzrlib/selftest/testlog.py => bzrlib/tests/test_log.py

bzrlib/selftest/testmerge3.py => bzrlib/tests/test_merge3.py

bzrlib/selftest/plugins.py => bzrlib/tests/test_plugins.py

bzrlib/selftest/testrevision.py => bzrlib/tests/test_revision.py

bzrlib/selftest/testrevisionnamespaces.py => bzrlib/tests/test_revisionspec.py

tools/testweave.py => bzrlib/tests/test_weave.py

bzrlib/selftest/whitebox.py => bzrlib/tests/test_whitebox.py

effbot/ => bzrlib/util/effbot/

elementtree/ => bzrlib/util/elementtree/

bzrlib/xml.py => bzrlib/xml_serializer.py

bzrlib/newinventory.py => contrib/newinventory.py

HACKING => doc/developers/HACKING.txt

tutorial.txt => doc/en/tutorials/tutorial.txt

bzr-man.py => tools/doc_generate/autodoc_man.py

files modified:
.bzrignore

.rsyncexclude

NEWS

README

TODO

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/status.py

bzrlib/tests/__init__.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib/bash/bzr.simple

contrib/pwk

contrib/zsh/_bzr

setup.py *

tools/convertfile.py

tools/convertinv.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

symbol_versioning,

)

# Range handed to _read_and_parse when only the index header is needed
# (see GraphIndex.key_count); presumably an (offset, length) pair - TODO confirm.
_HEADER_READV = (0, 200)

# Prefix of the header option line giving the number of elements per key.
_OPTION_KEY_ELEMENTS = "key_elements="

# Prefix of the header option line giving the number of keys in the index.
_OPTION_LEN = "len="

# Prefix of the header option line giving the number of reference lists.
_OPTION_NODE_REFS = "node_ref_lists="

# First line written by GraphIndexBuilder.finish.
_SIGNATURE = "Bazaar Graph Index 1\n"

# Characters that GraphIndexBuilder._check_key rejects inside a key element.
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

# Characters that GraphIndexBuilder._check_key_ref_value rejects in a value.
_newline_null_re = re.compile('[\n\0]')

def _has_key_from_parent_map(self, key):

"""Check if this index has one key.

If it's possible to check for multiple keys at once through

calling get_parent_map that should be faster.

"""

return (key in self.get_parent_map([key]))

def _missing_keys_from_parent_map(self, keys):

return set(keys) - set(self.get_parent_map(keys))

class GraphIndexBuilder(object):
    """Collect nodes in memory and serialise them as a GraphIndex.

    The serialised graph has the structure:

    _SIGNATURE OPTIONS NODES NEWLINE
    _SIGNATURE     := 'Bazaar Graph Index 1' NEWLINE
    OPTIONS        := 'node_ref_lists=' DIGITS NEWLINE
    NODES          := NODE*
    NODE           := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
    KEY            := Not-whitespace-utf8
    ABSENT         := 'a'
    REFERENCES     := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
    REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?
    REFERENCE      := DIGITS  ; digits is the byte offset in the index of the
                              ; referenced key.
    VALUE          := no-newline-no-null-bytes
    """

    def __init__(self, reference_lists=0, key_elements=1):
        """Create a GraphIndex builder.

        :param reference_lists: The number of node references lists for each
            entry.
        :param key_elements: The number of bytestrings in each key.
        """
        self.reference_lists = reference_lists
        self._key_length = key_elements
        self._optimize_for_size = False
        self._keys = set()
        # Maps key -> (absent, ref_lists, value).
        self._nodes = {}
        # Nested-dict view of the nodes; built on demand.
        self._nodes_by_key = None

    def _check_key(self, key):
        """Raise BadIndexKey if key is not a valid key for this index."""
        if type(key) != tuple or len(key) != self._key_length:
            raise errors.BadIndexKey(key)
        for part in key:
            if part and _whitespace_re.search(part) is None:
                continue
            # Empty elements and elements containing whitespace are invalid.
            raise errors.BadIndexKey(part)

    def _external_references(self):
        """Return references that are not present in this index."""
        # TODO: JAM 2008-11-21 This makes an assumption about how the
        #       reference lists are used. It is currently correct for
        #       pack-0.92 through 1.9, which use the node references (3rd
        #       column) second reference list as the compression parent.
        #       Perhaps this should be moved into something higher up the
        #       stack, since it makes assumptions about how the index is
        #       used.
        if self.reference_lists <= 1:
            # With no reference lists there can be no external references,
            # and with only one there is no place to store the compression
            # parent.
            return set()
        present = set()
        referenced = set()
        for node in self.iter_all_entries():
            present.add(node[1])
            referenced.update(node[3][1])
        return referenced - present

    def _get_nodes_by_key(self):
        """Return the nested-dict view of the nodes, building it if needed.

        Absent nodes are left out. Leaves are (key, value, references) when
        the index has reference lists and (key, value) otherwise.
        """
        if self._nodes_by_key is not None:
            return self._nodes_by_key
        with_refs = bool(self.reference_lists)
        tree = {}
        for key, (absent, references, value) in self._nodes.iteritems():
            if absent:
                continue
            branch = tree
            for subkey in key[:-1]:
                branch = branch.setdefault(subkey, {})
            if with_refs:
                branch[key[-1]] = key, value, references
            else:
                branch[key[-1]] = key, value
        self._nodes_by_key = tree
        return tree

    def _update_nodes_by_key(self, key, value, node_refs):
        """Update the _nodes_by_key dict with a new key.

        For a key of (foo, bar, baz) create
        _nodes_by_key[foo][bar][baz] = key_value

        Nothing happens when the nested view has not been built yet.
        """
        branch = self._nodes_by_key
        if branch is None:
            return
        if self.reference_lists:
            entry = (key, value, node_refs)
        else:
            entry = (key, value)
        for subkey in key[:-1]:
            branch = branch.setdefault(subkey, {})
        branch[key[-1]] = entry

    def _check_key_ref_value(self, key, references, value):
        """Check that 'key' and 'references' are all valid.

        :param key: A key tuple. Must conform to the key interface (be a
            tuple, be of the right length, not have any whitespace or nulls
            in any key element.)
        :param references: An iterable of reference lists. Something like
            [[(ref, key)], [(ref, key), (other, key)]]
        :param value: The value associate with this key. Must not contain
            newlines or null characters.
        :return: (node_refs, absent_references)
            node_refs   basically a packed form of 'references' where all
                        iterables are tuples
            absent_references   reference keys that are not in self._nodes.
                                This may contain duplicates if the same key
                                is referenced in multiple lists.
        """
        self._check_key(key)
        if _newline_null_re.search(value) is not None:
            raise errors.BadIndexValue(value)
        if len(references) != self.reference_lists:
            raise errors.BadIndexValue(references)
        packed = []
        missing = []
        known_nodes = self._nodes
        for reference_list in references:
            for reference in reference_list:
                # Anything already in self._nodes was validated when it was
                # added, so only unknown references need checking.
                if reference in known_nodes:
                    continue
                self._check_key(reference)
                missing.append(reference)
            packed.append(tuple(reference_list))
        return tuple(packed), missing

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        """
        node_refs, absent_references = self._check_key_ref_value(
            key, references, value)
        if key in self._nodes and self._nodes[key][0] != 'a':
            raise errors.BadIndexDuplicateKey(key, self)
        # Record a placeholder for each referenced key we have not seen.
        # Duplicates may occur but are not worth worrying about.
        for reference in absent_references:
            self._nodes[reference] = ('a', (), '')
        self._nodes[key] = ('', node_refs, value)
        self._keys.add(key)
        if self._nodes_by_key is not None and self._key_length > 1:
            self._update_nodes_by_key(key, value, node_refs)

    def finish(self):
        """Serialise the index.

        :return: A StringIO holding the complete serialised index.
        :raises BzrError: if the serialised length does not match the length
            predicted while computing reference offsets.
        """
        lines = [
            _SIGNATURE,
            _OPTION_NODE_REFS + str(self.reference_lists) + '\n',
            _OPTION_KEY_ELEMENTS + str(self._key_length) + '\n',
            _OPTION_LEN + str(len(self._keys)) + '\n',
            ]
        prefix_length = sum(len(line) for line in lines)
        # References are byte offsets. Resolving them directly would need
        # polynomial work (an offset later in the file depends on the width
        # of every reference before it), so all offsets are zero-padded to
        # one common width. Binary offsets would break the trivial file
        # parsing. Three passes are used:
        #  1. gather the non-reference byte counts and the reference counts;
        #  2. pick the offset width and work out each entry's address;
        #  3. serialise.
        #
        # Nodes are written forward sorted by key. In future we may consider
        # topological sorting, at the cost of table scans for direct lookup,
        # or a second index for direct lookup.
        nodes = sorted(self._nodes.items())
        # Without the pre-pass the final length is not known up front.
        expected_bytes = None
        # The pre-pass is only needed when there are reference lists at all.
        if self.reference_lists:
            key_offset_info = []
            fixed_bytes = prefix_length
            ref_count = 0
            # TODO use simple multiplication for the constants in this loop.
            for key, (absent, references, value) in nodes:
                # Remember what is known *so far* for this key: the non
                # reference bytes and the number of references preceding it.
                key_offset_info.append((key, fixed_bytes, ref_count))
                # The key elements, with a \x00 between each pair.
                fixed_bytes += sum(len(element) for element in key)
                if self._key_length > 1:
                    fixed_bytes += self._key_length - 1
                # The literal value, 3 nulls and 1 newline.
                fixed_bytes += len(value) + 3 + 1
                if absent:
                    # One byte for the absent marker.
                    fixed_bytes += 1
                    continue
                # (ref_lists - 1) tabs between the reference lists.
                fixed_bytes += self.reference_lists - 1
                for ref_list in references:
                    ref_count += len(ref_list)
                    # (refs - 1) carriage returns inside each list.
                    if ref_list:
                        fixed_bytes += len(ref_list) - 1
            # How many digits are needed to represent the total byte count?
            digits = 1
            while True:
                possible_total_bytes = fixed_bytes + ref_count * digits
                if 10 ** digits >= possible_total_bytes:
                    break
                digits += 1
            expected_bytes = possible_total_bytes + 1 # terminating newline
            # Resolve key addresses.
            key_addresses = dict(
                (key, base + refs_before * digits)
                for key, base, refs_before in key_offset_info)
            format_string = '%%0%sd' % digits
        # Serialise.
        for key, (absent, references, value) in nodes:
            flattened_references = [
                '\r'.join([format_string % key_addresses[reference]
                           for reference in ref_list])
                for ref_list in references]
            lines.append("%s\x00%s\x00%s\x00%s\n" % (
                '\x00'.join(key), absent,
                '\t'.join(flattened_references), value))
        lines.append('\n')
        serialised = ''.join(lines)
        if expected_bytes and len(serialised) != expected_bytes:
            raise errors.BzrError('Failed index creation. Internal error:'
                ' mismatched output length and expected length: %d %d' %
                (len(serialised), expected_bytes))
        return StringIO(serialised)

    def set_optimize(self, for_size=True):
        """Change how the builder tries to optimize the result.

        :param for_size: Tell the builder to try and make the index as small
            as possible.
        :return: None
        """
        # GraphIndexBuilder itself does not act on this flag yet, but other
        # builders do.
        self._optimize_for_size = for_size

328

329

330

class GraphIndex(object):

331

"""An index for data with embedded graphs.

332

333

The index maps keys to a list of key reference lists, and a value.

334

Each node has the same number of key reference lists. Each key reference

335

list can be empty or an arbitrary length. The value is an opaque NULL

336

terminated string without any newlines. The storage of the index is

337

hidden in the interface: keys and key references are always tuples of

338

bytestrings, never the internal representation (e.g. dictionary offsets).

339

340

It is presumed that the index will not be mutated - it is static data.

341

342

Successive iter_all_entries calls will read the entire index each time.

343

Additionally, iter_entries calls will read the index linearly until the

344

desired keys are found. XXX: This must be fixed before the index is

345

suitable for production use. :XXX

346

"""

347

348

def __init__(self, transport, name, size):

349

"""Open an index called name on transport.

350

351

:param transport: A bzrlib.transport.Transport.

352

:param name: A path to provide to transport API calls.

353

:param size: The size of the index in bytes. This is used for bisection

354

logic to perform partial index reads. While the size could be

355

obtained by statting the file this introduced an additional round

356

trip as well as requiring stat'able transports, both of which are

357

avoided by having it supplied. If size is None, then bisection

358

support will be disabled and accessing the index will just stream

359

all the data.

360

"""

361

self._transport = transport

362

self._name = name

363

# Becomes a dict of key:(value, reference-list-byte-locations) used by

364

# the bisection interface to store parsed but not resolved keys.

365

self._bisect_nodes = None

366

# Becomes a dict of key:(value, reference-list-keys) which are ready to

367

# be returned directly to callers.

368

self._nodes = None

369

# a sorted list of slice-addresses for the parsed bytes of the file.

370

# e.g. (0,1) would mean that byte 0 is parsed.

371

self._parsed_byte_map = []

372

# a sorted list of keys matching each slice address for parsed bytes

373

# e.g. (None, 'foo@bar') would mean that the first byte contained no

374

# key, and the end byte of the slice is the of the data for 'foo@bar'

375

self._parsed_key_map = []

376

self._key_count = None

377

self._keys_by_offset = None

378

self._nodes_by_key = None

379

self._size = size

380

# The number of bytes we've read so far in trying to process this file

381

self._bytes_read = 0

382

383

def __eq__(self, other):

384

"""Equal when self and other were created with the same parameters."""

385

return (

386

type(self) == type(other) and

387

self._transport == other._transport and

388

self._name == other._name and

389

self._size == other._size)

390

391

def __ne__(self, other):

392

return not self.__eq__(other)

393

394

def __repr__(self):

395

return "%s(%r)" % (self.__class__.__name__,

396

self._transport.abspath(self._name))

397

398

def _buffer_all(self, stream=None):

399

"""Buffer all the index data.

400

401

Mutates self._nodes and self.keys_by_offset.

402

"""

403

if self._nodes is not None:

404

# We already did this

405

return

406

if 'index' in debug.debug_flags:

407

mutter('Reading entire index %s', self._transport.abspath(self._name))

408

if stream is None:

409

stream = self._transport.get(self._name)

410

self._read_prefix(stream)

411

self._expected_elements = 3 + self._key_length

412

line_count = 0

413

# raw data keyed by offset

414

self._keys_by_offset = {}

415

# ready-to-return key:value or key:value, node_ref_lists

416

self._nodes = {}

417

self._nodes_by_key = None

418

trailers = 0

419

pos = stream.tell()

420

lines = stream.read().split('\n')

421

del lines[-1]

422

_, _, _, trailers = self._parse_lines(lines, pos)

423

for key, absent, references, value in self._keys_by_offset.itervalues():

424

if absent:

425

continue

426

# resolve references:

427

if self.node_ref_lists:

428

node_value = (value, self._resolve_references(references))

429

else:

430

node_value = value

431

self._nodes[key] = node_value

432

# cache the keys for quick set intersections

433

self._keys = set(self._nodes)

434

if trailers != 1:

435

# there must be one line - the empty trailer line.

436

raise errors.BadIndexData(self)

437

438

def external_references(self, ref_list_num):

439

"""Return references that are not present in this index.

440

"""

441

self._buffer_all()

442

if ref_list_num + 1 > self.node_ref_lists:

443

raise ValueError('No ref list %d, index has %d ref lists'

444

% (ref_list_num, self.node_ref_lists))

445

refs = set()

446

for key, (value, ref_lists) in self._nodes.iteritems():

447

ref_list = ref_lists[ref_list_num]

448

refs.update(ref_list)

449

return refs - self._keys

450

451

def _get_nodes_by_key(self):

452

if self._nodes_by_key is None:

453

nodes_by_key = {}

454

if self.node_ref_lists:

455

for key, (value, references) in self._nodes.iteritems():

456

key_dict = nodes_by_key

457

for subkey in key[:-1]:

458

key_dict = key_dict.setdefault(subkey, {})

459

key_dict[key[-1]] = key, value, references

460

else:

461

for key, value in self._nodes.iteritems():

462

key_dict = nodes_by_key

463

for subkey in key[:-1]:

464

key_dict = key_dict.setdefault(subkey, {})

465

key_dict[key[-1]] = key, value

466

self._nodes_by_key = nodes_by_key

467

return self._nodes_by_key

468

469

def iter_all_entries(self):
    """Iterate over all keys within the index.

    :return: An iterable of (index, key, value) or (index, key, value,
        reference_lists). The former tuple is used when there are no
        reference lists in the index, making the API compatible with simple
        key:value index types. There is no defined order for the result
        iteration - it will be in the most efficient order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    if not self.node_ref_lists:
        for key, value in self._nodes.iteritems():
            yield self, key, value
        return
    for key, (value, node_ref_lists) in self._nodes.iteritems():
        yield self, key, value, node_ref_lists

489

490

def _read_prefix(self, stream):
    """Read and validate the index header from stream.

    Sets self.node_ref_lists, self._key_length and self._key_count from the
    three option lines that follow the signature.

    :param stream: A file-like object positioned at the start of the index.
    :raises BadIndexFormatSignature: if the signature does not match.
    :raises BadIndexOptions: if an option line has the wrong prefix or a
        value that is not an integer.
    """
    expected_signature = self._signature()
    if stream.read(len(expected_signature)) != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)

    def read_int_option(prefix):
        # Each option occupies one line: the prefix, digits, then a newline.
        options_line = stream.readline()
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            return int(options_line[len(prefix):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = read_int_option(_OPTION_NODE_REFS)
    self._key_length = read_int_option(_OPTION_KEY_ELEMENTS)
    self._key_count = read_int_option(_OPTION_LEN)

515

516

def _resolve_references(self, references):

517

"""Return the resolved key references for references.

518

519

References are resolved by looking up the location of the key in the

520

_keys_by_offset map and substituting the key name, preserving ordering.

521

522

:param references: An iterable of iterables of key locations. e.g.

523

[[123, 456], [123]]

524

:return: A tuple of tuples of keys.

525

"""

526

node_refs = []

527

for ref_list in references:

528

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

529

return tuple(node_refs)

530

531

def _find_index(self, range_map, key):

532

"""Helper for the _parsed_*_index calls.

533

534

Given a range map - [(start, end), ...], finds the index of the range

535

in the map for key if it is in the map, and if it is not there, the

536

immediately preceeding range in the map.

537

"""

538

result = bisect_right(range_map, key) - 1

539

if result + 1 < len(range_map):

540

# check the border condition, it may be in result + 1

541

if range_map[result + 1][0] == key[0]:

542

return result + 1

543

return result

544

545

def _parsed_byte_index(self, offset):

546

"""Return the index of the entry immediately before offset.

547

548

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

549

there is one unparsed byte (the 11th, addressed as[10]). then:

550

asking for 0 will return 0

551

asking for 10 will return 0

552

asking for 11 will return 1

553

asking for 12 will return 1

554

"""

555

key = (offset, 0)

556

return self._find_index(self._parsed_byte_map, key)

557

558

def _parsed_key_index(self, key):

559

"""Return the index of the entry immediately before key.

560

561

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

562

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

563

have been parsed, then:

564

asking for '' will return 0

565

asking for 'a' will return 0

566

asking for 'b' will return 1

567

asking for 'e' will return 1

568

"""

569

search_key = (key, None)

570

return self._find_index(self._parsed_key_map, search_key)

571

572

def _is_parsed(self, offset):

573

"""Returns True if offset has been parsed."""

574

index = self._parsed_byte_index(offset)

575

if index == len(self._parsed_byte_map):

576

return offset < self._parsed_byte_map[index - 1][1]

577

start, end = self._parsed_byte_map[index]

578

return offset >= start and offset < end

579

580

def _iter_entries_from_total_buffer(self, keys):

581

"""Iterate over keys when the entire index is parsed."""

582

keys = keys.intersection(self._keys)

583

if self.node_ref_lists:

584

for key in keys:

585

value, node_refs = self._nodes[key]

586

yield self, key, value, node_refs

587

else:

588

for key in keys:

589

yield self, key, self._nodes[key]

590

591

def iter_entries(self, keys):

592

"""Iterate over keys within the index.

593

594

:param keys: An iterable providing the keys to be retrieved.

595

:return: An iterable as per iter_all_entries, but restricted to the

596

keys supplied. No additional keys will be returned, and every

597

key supplied that is in the index will be returned.

598

"""

599

keys = set(keys)

600

if not keys:

601

return []

602

if self._size is None and self._nodes is None:

603

self._buffer_all()

604

605

# We fit about 20 keys per minimum-read (4K), so if we are looking for

606

# more than 1/20th of the index its likely (assuming homogenous key

607

# spread) that we'll read the entire index. If we're going to do that,

608

# buffer the whole thing. A better analysis might take key spread into

609

# account - but B+Tree indices are better anyway.

610

# We could look at all data read, and use a threshold there, which will

611

# trigger on ancestry walks, but that is not yet fully mapped out.

612

if self._nodes is None and len(keys) * 20 > self.key_count():

613

self._buffer_all()

614

if self._nodes is not None:

615

return self._iter_entries_from_total_buffer(keys)

616

else:

617

return (result[1] for result in bisect_multi_bytes(

618

self._lookup_keys_via_location, self._size, keys))

619

620

def iter_entries_prefix(self, keys):

621

"""Iterate over keys within the index using prefix matching.

622

623

Prefix matching is applied within the tuple of a key, not to within

624

the bytestring of each key element. e.g. if you have the keys ('foo',

625

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

626

only the former key is returned.

627

628

WARNING: Note that this method currently causes a full index parse

629

unconditionally (which is reasonably appropriate as it is a means for

630

thunking many small indices into one larger one and still supplies

631

iter_all_entries at the thunk layer).

632

633

:param keys: An iterable providing the key prefixes to be retrieved.

634

Each key prefix takes the form of a tuple the length of a key, but

635

with the last N elements 'None' rather than a regular bytestring.

636

The first element cannot be 'None'.

637

:return: An iterable as per iter_all_entries, but restricted to the

638

keys with a matching prefix to those supplied. No additional keys

639

will be returned, and every match that is in the index will be

640

returned.

641

"""

642

keys = set(keys)

643

if not keys:

644

return

645

# load data - also finds key lengths

646

if self._nodes is None:

647

self._buffer_all()

648

if self._key_length == 1:

649

for key in keys:

650

# sanity check

651

if key[0] is None:

652

raise errors.BadIndexKey(key)

653

if len(key) != self._key_length:

654

raise errors.BadIndexKey(key)

655

if self.node_ref_lists:

656

value, node_refs = self._nodes[key]

657

yield self, key, value, node_refs

658

else:

659

yield self, key, self._nodes[key]

660

return

661

nodes_by_key = self._get_nodes_by_key()

662

for key in keys:

663

# sanity check

664

if key[0] is None:

665

raise errors.BadIndexKey(key)

666

if len(key) != self._key_length:

667

raise errors.BadIndexKey(key)

668

# find what it refers to:

669

key_dict = nodes_by_key

670

elements = list(key)

671

# find the subdict whose contents should be returned.

672

try:

673

while len(elements) and elements[0] is not None:

674

key_dict = key_dict[elements[0]]

675

elements.pop(0)

676

except KeyError:

677

# a non-existant lookup.

678

continue

679

if len(elements):

680

dicts = [key_dict]

681

while dicts:

682

key_dict = dicts.pop(-1)

683

# can't be empty or would not exist

684

item, value = key_dict.iteritems().next()

685

if type(value) == dict:

686

# push keys

687

dicts.extend(key_dict.itervalues())

688

else:

689

# yield keys

690

for value in key_dict.itervalues():

691

# each value is the key:value:node refs tuple

692

# ready to yield.

693

yield (self, ) + value

694

else:

695

# the last thing looked up was a terminal element

696

yield (self, ) + key_dict

697

698

def key_count(self):

699

"""Return an estimate of the number of keys in this index.

700

701

For GraphIndex the estimate is exact.

702

"""

703

if self._key_count is None:

704

self._read_and_parse([_HEADER_READV])

705

return self._key_count

706

707

def _lookup_keys_via_location(self, location_keys):
    """Public interface for implementing bisection.

    If _buffer_all has been called, then all the data for the index is in
    memory, and this method should not be called, as it uses a separate
    cache because it cannot pre-resolve all indices, which buffer_all does
    for performance.

    The result paired with each (location, key) is one of:

    * False - the region that would hold the key has been parsed and the
      key is not there.
    * -1 or +1 - the key was not found near the probed location; -1 when
      the key sorts below the first key parsed at that location, +1
      otherwise.
    * (self, key, value) or (self, key, value, refs) - the key is present;
      refs is included only when the index has reference lists.

    :param location_keys: A list of location(byte offset), key tuples.
    :return: A list of (location_key, result) tuples as expected by
        bzrlib.bisect_multi.bisect_multi_bytes.
    """
    # Possible improvements:
    #  - only bisect lookup each key once
    #  - sort the keys first, and use that to reduce the bisection window
    # -----
    # This progresses in three parts:
    #  1. read data
    #  2. parse it
    #  3. attempt to answer the question from the now in-memory data.
    #
    # Part 1: build the readv request.
    # For each location, ask for 800 bytes - much more than rows we've seen
    # anywhere.
    readv_ranges = []
    for location, key in location_keys:
        # can we answer from cache?
        if self._bisect_nodes and key in self._bisect_nodes:
            # We have the key parsed.
            continue
        index = self._parsed_key_index(key)
        if (len(self._parsed_key_map) and
            self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            # the key range has been parsed, so no lookup is needed even
            # if the key is not present.
            continue
        # has this part of the file been examined already?
        index = self._parsed_byte_index(location)
        if (len(self._parsed_byte_map) and
            self._parsed_byte_map[index][0] <= location and
            self._parsed_byte_map[index][1] > location):
            # the byte region has been parsed, so no read is needed.
            continue
        length = 800
        if location + length > self._size:
            # never request bytes past the end of the file
            length = self._size - location
        # todo, trim out parsed locations.
        if length > 0:
            readv_ranges.append((location, length))
    # read the header if needed
    if self._bisect_nodes is None:
        readv_ranges.append(_HEADER_READV)
    self._read_and_parse(readv_ranges)
    result = []
    if self._nodes is not None:
        # _read_and_parse triggered a _buffer_all because we requested the
        # whole data range, so every key can be answered directly from
        # self._nodes.
        for location, key in location_keys:
            if key not in self._nodes: # not present
                result.append(((location, key), False))
            elif self.node_ref_lists:
                value, refs = self._nodes[key]
                result.append(((location, key),
                    (self, key, value, refs)))
            else:
                result.append(((location, key),
                    (self, key, self._nodes[key])))
        return result
    # Part 3: generate results:
    #  - figure out <, >, missing, present
    #  - resolve references of present keys so we can return them.
    # keys that we cannot answer until we resolve references
    pending_references = []
    # byte offsets of referenced nodes that have not been parsed yet
    pending_locations = set()
    for location, key in location_keys:
        # can we answer from cache?
        if key in self._bisect_nodes:
            # the key has been parsed, so no lookup is needed
            if self.node_ref_lists:
                # the references may not have been all parsed.
                value, refs = self._bisect_nodes[key]
                wanted_locations = []
                for ref_list in refs:
                    for ref in ref_list:
                        if ref not in self._keys_by_offset:
                            wanted_locations.append(ref)
                if wanted_locations:
                    # defer this key until the referenced rows are read
                    pending_locations.update(wanted_locations)
                    pending_references.append((location, key))
                    continue
                result.append(((location, key), (self, key,
                    value, self._resolve_references(refs))))
            else:
                result.append(((location, key),
                    (self, key, self._bisect_nodes[key])))
            continue
        else:
            # has the region the key should be in been parsed?
            index = self._parsed_key_index(key)
            if (self._parsed_key_map[index][0] <= key and
                (self._parsed_key_map[index][1] >= key or
                 # end of the file has been parsed
                 self._parsed_byte_map[index][1] == self._size)):
                # parsed but not found: the key is absent
                result.append(((location, key), False))
                continue
        # no, is the key above or below the probed location:
        # get the range of the probed & parsed location
        index = self._parsed_byte_index(location)
        # if the key is below the start of the range, it is below
        if key < self._parsed_key_map[index][0]:
            direction = -1
        else:
            direction = +1
        result.append(((location, key), direction))
    readv_ranges = []
    # lookup data to resolve references
    for location in pending_locations:
        length = 800
        if location + length > self._size:
            length = self._size - location
        # TODO: trim out parsed locations (e.g. if the 800 is into the
        # parsed region trim it, and don't use the adjust_for_latency
        # facility)
        if length > 0:
            readv_ranges.append((location, length))
    self._read_and_parse(readv_ranges)
    if self._nodes is not None:
        # The _read_and_parse triggered a _buffer_all, grab the data and
        # return it
        for location, key in pending_references:
            value, refs = self._nodes[key]
            result.append(((location, key), (self, key, value, refs)))
        return result
    for location, key in pending_references:
        # answer key references we had to look up late.
        value, refs = self._bisect_nodes[key]
        result.append(((location, key), (self, key,
            value, self._resolve_references(refs))))
    return result

848

849

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    The header is the file signature followed by three option lines which
    supply, in this order, the number of reference lists, the key length
    and the key count.  Parsing stores those on self.node_ref_lists,
    self._key_length and self._key_count, marks the header bytes as parsed
    and resets the bisection caches.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data (which may be of length 0).
    :raises BadIndexFormatSignature: If bytes does not start with the
        signature for this index type.
    :raises BadIndexOptions: If an option line is missing, lacks its
        expected prefix, or does not carry an integer value.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if signature != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(expected_signature):].splitlines()
    if len(lines) < 3:
        # A truncated header cannot hold all three option lines; report it
        # as bad options rather than leaking an IndexError to the caller.
        raise errors.BadIndexOptions(self)

    def option_value(line, prefix):
        # Return the integer that follows prefix on an option line.
        if not line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            return int(line[len(prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = option_value(lines[0], _OPTION_NODE_REFS)
    self._key_length = option_value(lines[1], _OPTION_KEY_ELEMENTS)
    self._key_count = option_value(lines[2], _OPTION_LEN)
    # calculate the bytes we have processed; the + 3 accounts for the
    # line terminator that splitlines() removed from each option line.
    header_end = (len(signature) + len(lines[0]) + len(lines[1]) +
        len(lines[2]) + 3)
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

892

893

def _parse_region(self, offset, data):

894

"""Parse node data returned from a readv operation.

895

896

:param offset: The byte offset the data starts at.

897

:param data: The data to parse.

898

"""

899

# trim the data.

900

# end first:

901

end = offset + len(data)

902

high_parsed = offset

903

while True:

904

# Trivial test - if the current index's end is within the

905

# low-matching parsed range, we're done.

906

index = self._parsed_byte_index(high_parsed)

907

if end < self._parsed_byte_map[index][1]:

908

return

909

# print "[%d:%d]" % (offset, end), \

910

# self._parsed_byte_map[index:index + 2]

911

high_parsed, last_segment = self._parse_segment(

912

offset, data, end, index)

913

if last_segment:

914

return

915

916

def _parse_segment(self, offset, data, end, index):
    """Parse one segment of data.

    The segment is the part of data that lies between the parsed byte
    range at index and the next parsed range (if any).  Bytes that were
    already parsed are trimmed off, and where the data does not line up
    with a parsed range or the end of the file it is cut back to a '\\n'
    boundary so only whole lines are parsed.  The parsed nodes are added
    to self._bisect_nodes and the byte range is recorded as parsed.

    :param offset: Where 'data' begins in the file.
    :param data: Some data to parse a segment of.
    :param end: Where data ends
    :param index: The current index into the parsed bytes map.
    :return: high_parsed_byte, last_segment.
        high_parsed_byte is the location of the highest parsed byte in this
        segment, last_segment is True if the parsed segment is the last
        possible one in the data block.
    :raises AssertionError: If no '\\n' is found where one is needed, or if
        nothing is left to parse after trimming.
    """
    # default is to use all data
    trim_end = None
    # accommodate overlap with data before this.
    if offset < self._parsed_byte_map[index][1]:
        # overlaps the lower parsed region
        # skip the parsed data
        trim_start = self._parsed_byte_map[index][1] - offset
        # don't trim the start for \n
        start_adjacent = True
    elif offset == self._parsed_byte_map[index][1]:
        # abuts the lower parsed region
        # use all data
        trim_start = None
        # do not trim anything
        start_adjacent = True
    else:
        # does not overlap the lower parsed region
        # use all data
        trim_start = None
        # but trim the leading \n
        start_adjacent = False
    if end == self._size:
        # lines up to the end of all data:
        # use it all
        trim_end = None
        # do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif index + 1 == len(self._parsed_byte_map):
        # at the end of the parsed data
        # use it all
        trim_end = None
        # but strip to the last \n
        end_adjacent = False
        last_segment = True
    elif end == self._parsed_byte_map[index + 1][0]:
        # butts up against the next parsed region
        # use it all
        trim_end = None
        # do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif end > self._parsed_byte_map[index + 1][0]:
        # overlaps into the next parsed region
        # only consider the unparsed data
        trim_end = self._parsed_byte_map[index + 1][0] - offset
        # do not strip to the last \n as we know it's an entire record
        end_adjacent = True
        # more segments remain if data extends beyond the next region
        last_segment = end < self._parsed_byte_map[index + 1][1]
    else:
        # does not overlap into the next region
        # use it all
        trim_end = None
        # but strip to the last \n
        end_adjacent = False
        last_segment = True
    # now find bytes to discard if needed
    if not start_adjacent:
        # work around python bug in rfind
        # NOTE(review): start_adjacent is only False when trim_start is
        # None, so the else branch below looks unreachable - confirm.
        if trim_start is None:
            trim_start = data.find('\n') + 1
        else:
            trim_start = data.find('\n', trim_start) + 1
        # find() returns -1 when there is no newline, making this 0
        if not (trim_start != 0):
            raise AssertionError('no \n was present')
    if not end_adjacent:
        # work around python bug in rfind
        if trim_end is None:
            trim_end = data.rfind('\n') + 1
        else:
            trim_end = data.rfind('\n', None, trim_end) + 1
        if not (trim_end != 0):
            raise AssertionError('no \n was present')
    # adjust offset and data to the parseable data.
    trimmed_data = data[trim_start:trim_end]
    if not (trimmed_data):
        # NOTE(review): trim_start / trim_end may still be None here, in
        # which case the %d formatting itself would fail - confirm.
        raise AssertionError('read unneeded data [%d:%d] from [%d:%d]'
            % (trim_start, trim_end, offset, offset + len(data)))
    if trim_start:
        offset += trim_start
    # splitlines mangles the \r delimiters.. don't use it.
    lines = trimmed_data.split('\n')
    # drop whatever follows the final '\n' (an empty string when
    # trimmed_data ends with '\n')
    del lines[-1]
    pos = offset
    first_key, last_key, nodes, _ = self._parse_lines(lines, pos)
    for key, value in nodes:
        self._bisect_nodes[key] = value
    self._parsed_bytes(offset, first_key,
        offset + len(trimmed_data), last_key)
    return offset + len(trimmed_data), last_segment

1023

1024

def _parse_lines(self, lines, pos):

1025

key = None

1026

first_key = None

1027

trailers = 0

1028

nodes = []

1029

for line in lines:

1030

if line == '':

1031

# must be at the end

1032

if self._size:

1033

if not (self._size == pos + 1):

1034

raise AssertionError("%s %s" % (self._size, pos))

1035

trailers += 1

1036

continue

1037

elements = line.split('\0')

1038

if len(elements) != self._expected_elements:

1039

raise errors.BadIndexData(self)

1040

# keys are tuples. Each element is a string that may occur many

1041

# times, so we intern them to save space. AB, RC, 200807

1042

key = tuple([intern(element) for element in elements[:self._key_length]])

1043

if first_key is None:

1044

first_key = key

1045

absent, references, value = elements[-3:]

1046

ref_lists = []

1047

for ref_string in references.split('\t'):

1048

ref_lists.append(tuple([

1049

int(ref) for ref in ref_string.split('\r') if ref

1050

]))

1051

ref_lists = tuple(ref_lists)

1052

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

1053

pos += len(line) + 1 # +1 for the \n

1054

if absent:

1055

continue

1056

if self.node_ref_lists:

1057

node_value = (value, ref_lists)

1058

else:

1059

node_value = value

1060

nodes.append((key, node_value))

1061

# print "parsed ", key

1062

return first_key, key, nodes, trailers

1063

1064

def _parsed_bytes(self, start, start_key, end, end_key):

1065

"""Mark the bytes from start to end as parsed.

1066

1067

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

1068

1) as parsed.

1069

1070

:param start: The start of the parsed region.

1071

:param end: The end of the parsed region.

1072

"""

1073

index = self._parsed_byte_index(start)

1074

new_value = (start, end)

1075

new_key = (start_key, end_key)

1076

if index == -1:

1077

# first range parsed is always the beginning.

1078

self._parsed_byte_map.insert(index, new_value)

1079

self._parsed_key_map.insert(index, new_key)

1080

return

1081

# four cases:

1082

# new region

1083

# extend lower region

1084

# extend higher region

1085

# combine two regions

1086

if (index + 1 < len(self._parsed_byte_map) and

1087

self._parsed_byte_map[index][1] == start and

1088

self._parsed_byte_map[index + 1][0] == end):

1089

# combine two regions

1090

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

1091

self._parsed_byte_map[index + 1][1])

1092

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

1093

self._parsed_key_map[index + 1][1])

1094

del self._parsed_byte_map[index + 1]

1095

del self._parsed_key_map[index + 1]

1096

elif self._parsed_byte_map[index][1] == start:

1097

# extend the lower entry

1098

self._parsed_byte_map[index] = (

1099

self._parsed_byte_map[index][0], end)

1100

self._parsed_key_map[index] = (

1101

self._parsed_key_map[index][0], end_key)

1102

elif (index + 1 < len(self._parsed_byte_map) and

1103

self._parsed_byte_map[index + 1][0] == end):

1104

# extend the higher entry

1105

self._parsed_byte_map[index + 1] = (

1106

start, self._parsed_byte_map[index + 1][1])

1107

self._parsed_key_map[index + 1] = (

1108

start_key, self._parsed_key_map[index + 1][1])

1109

else:

1110

# new entry

1111

self._parsed_byte_map.insert(index + 1, new_value)

1112

self._parsed_key_map.insert(index + 1, new_key)

1113

1114

def _read_and_parse(self, readv_ranges):

1115

"""Read the the ranges and parse the resulting data.

1116

1117

:param readv_ranges: A prepared readv range list.

1118

"""

1119

if not readv_ranges:

1120

return

1121

if self._nodes is None and self._bytes_read * 2 >= self._size:

1122

# We've already read more than 50% of the file and we are about to

1123

# request more data, just _buffer_all() and be done

1124

self._buffer_all()

1125

return

1126

1127

readv_data = self._transport.readv(self._name, readv_ranges, True,

1128

self._size)

1129

# parse

1130

for offset, data in readv_data:

1131

self._bytes_read += len(data)

1132

if offset == 0 and len(data) == self._size:

1133

# We read the whole range, most likely because the

1134

# Transport upcast our readv ranges into one long request

1135

# for enough total data to grab the whole index.

1136

self._buffer_all(StringIO(data))

1137

return

1138

if self._bisect_nodes is None:

1139

# this must be the start

1140

if not (offset == 0):

1141

raise AssertionError()

1142

offset, data = self._parse_header_from_bytes(data)

1143

# print readv_ranges, "[%d:%d]" % (offset, offset + len(data))

1144

self._parse_region(offset, data)

1145

1146

def _signature(self):
    """Return the signature that files of this index type begin with."""
    return _SIGNATURE

1149

1150

def validate(self):
    """Check that every entry in the index can be accessed.

    Walking all entries currently validates the index completely, so the
    entries are simply iterated and discarded.
    """
    entries = self.iter_all_entries()
    for _ in entries:
        pass

1155

1156

1157

class CombinedGraphIndex(object):

1158

"""A GraphIndex made up from smaller GraphIndices.

1159

1160

The backing indices must implement GraphIndex, and are presumed to be

1161

static data.

1162

1163

Queries against the combined index will be made against the first index,

1164

and then the second and so on. The order of index's can thus influence

1165

performance significantly. For example, if one index is on local disk and a

1166

second on a remote server, the local disk index should be before the other

1167

in the index list.

1168

"""

1169

1170

def __init__(self, indices, reload_func=None):

1171

"""Create a CombinedGraphIndex backed by indices.

1172

1173

:param indices: An ordered list of indices to query for data.

1174

:param reload_func: A function to call if we find we are missing an

1175

index. Should have the form reload_func() => True/False to indicate

1176

if reloading actually changed anything.

1177

"""

1178

self._indices = indices

1179

self._reload_func = reload_func

1180

1181

def __repr__(self):

1182

return "%s(%s)" % (

1183

self.__class__.__name__,

1184

', '.join(map(repr, self._indices)))

1185

1186

@symbol_versioning.deprecated_method(symbol_versioning.one_one)

1187

def get_parents(self, revision_ids):

1188

"""See graph._StackedParentsProvider.get_parents.

1189

1190

This implementation thunks the graph.Graph.get_parents api across to

1191

GraphIndex.

1192

1193

:param revision_ids: An iterable of graph keys for this graph.

1194

:return: A list of parent details for each key in revision_ids.

1195

Each parent details will be one of:

1196

* None when the key was missing

1197

* (NULL_REVISION,) when the key has no parents.

1198

* (parent_key, parent_key...) otherwise.

1199

"""

1200

parent_map = self.get_parent_map(revision_ids)

1201

return [parent_map.get(r, None) for r in revision_ids]

1202

1203

def get_parent_map(self, keys):

1204

"""See graph._StackedParentsProvider.get_parent_map"""

1205

search_keys = set(keys)

1206

if NULL_REVISION in search_keys:

1207

search_keys.discard(NULL_REVISION)

1208

found_parents = {NULL_REVISION:[]}

1209

else:

1210

found_parents = {}

1211

for index, key, value, refs in self.iter_entries(search_keys):

1212

parents = refs[0]

1213

if not parents:

1214

parents = (NULL_REVISION,)

1215

found_parents[key] = parents

1216

return found_parents

1217

1218

has_key = _has_key_from_parent_map

1219

1220

def insert_index(self, pos, index):

1221

"""Insert a new index in the list of indices to query.

1222

1223

:param pos: The position to insert the index.

1224

:param index: The index to insert.

1225

"""

1226

self._indices.insert(pos, index)

1227

1228

def iter_all_entries(self):

1229

"""Iterate over all keys within the index

1230

1231

Duplicate keys across child indices are presumed to have the same

1232

value and are only reported once.

1233

1234

:return: An iterable of (index, key, reference_lists, value).

1235

There is no defined order for the result iteration - it will be in

1236

the most efficient order for the index.

1237

"""

1238

seen_keys = set()

1239

while True:

1240

try:

1241

for index in self._indices:

1242

for node in index.iter_all_entries():

1243

if node[1] not in seen_keys:

1244

yield node

1245

seen_keys.add(node[1])

1246

return

1247

except errors.NoSuchFile:

1248

self._reload_or_raise()

1249

1250

def iter_entries(self, keys):

1251

"""Iterate over keys within the index.

1252

1253

Duplicate keys across child indices are presumed to have the same

1254

value and are only reported once.

1255

1256

:param keys: An iterable providing the keys to be retrieved.

1257

:return: An iterable of (index, key, reference_lists, value). There is no

1258

defined order for the result iteration - it will be in the most

1259

efficient order for the index.

1260

"""

1261

keys = set(keys)

1262

while True:

1263

try:

1264

for index in self._indices:

1265

if not keys:

1266

return

1267

for node in index.iter_entries(keys):

1268

keys.remove(node[1])

1269

yield node

1270

return

1271

except errors.NoSuchFile:

1272

self._reload_or_raise()

1273

1274

def iter_entries_prefix(self, keys):

1275

"""Iterate over keys within the index using prefix matching.

1276

1277

Duplicate keys across child indices are presumed to have the same

1278

value and are only reported once.

1279

1280

Prefix matching is applied within the tuple of a key, not to within

1281

the bytestring of each key element. e.g. if you have the keys ('foo',

1282

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1283

only the former key is returned.

1284

1285

:param keys: An iterable providing the key prefixes to be retrieved.

1286

Each key prefix takes the form of a tuple the length of a key, but

1287

with the last N elements 'None' rather than a regular bytestring.

1288

The first element cannot be 'None'.

1289

:return: An iterable as per iter_all_entries, but restricted to the

1290

keys with a matching prefix to those supplied. No additional keys

1291

will be returned, and every match that is in the index will be

1292

returned.

1293

"""

1294

keys = set(keys)

1295

if not keys:

1296

return

1297

seen_keys = set()

1298

while True:

1299

try:

1300

for index in self._indices:

1301

for node in index.iter_entries_prefix(keys):

1302

if node[1] in seen_keys:

1303

continue

1304

seen_keys.add(node[1])

1305

yield node

1306

return

1307

except errors.NoSuchFile:

1308

self._reload_or_raise()

1309

1310

def key_count(self):

1311

"""Return an estimate of the number of keys in this index.

1312

1313

For CombinedGraphIndex this is approximated by the sum of the keys of

1314

the child indices. As child indices may have duplicate keys this can

1315

have a maximum error of the number of child indices * largest number of

1316

keys in any index.

1317

"""

1318

while True:

1319

try:

1320

return sum((index.key_count() for index in self._indices), 0)

1321

except errors.NoSuchFile:

1322

self._reload_or_raise()

1323

1324

missing_keys = _missing_keys_from_parent_map

1325

1326

def _reload_or_raise(self):

1327

"""We just got a NoSuchFile exception.

1328

1329

Try to reload the indices, if it fails, just raise the current

1330

exception.

1331

"""

1332

if self._reload_func is None:

1333

raise

1334

exc_type, exc_value, exc_traceback = sys.exc_info()

1335

trace.mutter('Trying to reload after getting exception: %s',

1336

exc_value)

1337

if not self._reload_func():

1338

# We tried to reload, but nothing changed, so we fail anyway

1339

trace.mutter('_reload_func indicated nothing has changed.'

1340

' Raising original exception.')

1341

raise exc_type, exc_value, exc_traceback

1342

1343

def validate(self):

1344

"""Validate that everything in the index can be accessed."""

1345

while True:

1346

try:

1347

for index in self._indices:

1348

index.validate()

1349

return

1350

except errors.NoSuchFile:

1351

self._reload_or_raise()

1352

1353

1354

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during a
    single write operation, where the accumulated entries need to be immediately
    available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add
            when the index has reference lists, otherwise an iterable of
            (key, value) entries.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when the index has no reference lists.
            Nodes flagged absent are skipped. There is no defined order
            for the result iteration - it will be in the most efficient
            order for the index (in this case dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        if self.reference_lists:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value, references
        else:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when the index has no reference lists.
            There is no defined order for the result iteration - it will
            be in the most efficient order for the index (keys iteration
            order in this case).
        """
        keys = set(keys)
        if self.reference_lists:
            for key in keys.intersection(self._keys):
                # each node is stored as (absent, references, value)
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2], node[1]
        else:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        :raises BadIndexKey: If a prefix starts with None or does not have
            the key length of this index.
        """
        # XXX: Too much duplication with the GraphIndex class; consider finding
        # a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                try:
                    node = self._nodes[key]
                except KeyError:
                    # a non-existent lookup matches nothing, exactly as
                    # in the multi-element path below.
                    continue
                if node[0]:
                    # flagged absent
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
            return
        nodes_by_key = self._get_nodes_by_key()
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = nodes_by_key
            elements = list(key)
            # find the subdict to return
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                # Only a prefix was given: walk every subdict below it.
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    item, value = key_dict.iteritems().next()
                    if isinstance(value, dict):
                        # push keys
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield keys
                        for value in key_dict.itervalues():
                            yield (self, ) + value
            else:
                # the last thing looked up was a terminal element
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory indexes have no known corruption at the moment."""

1493

1494

1495

class GraphIndexPrefixAdapter(object):

1496

"""An adapter between GraphIndex with different key lengths.

1497

1498

Queries against this will emit queries against the adapted Graph with the

1499

prefix added, queries for all items use iter_entries_prefix. The returned

1500

nodes will have their keys and node references adjusted to remove the

1501

prefix. Finally, an add_nodes_callback can be supplied - when called the

1502

nodes and references being added will have prefix prepended.

1503

"""

1504

1505

def __init__(self, adapted, prefix, missing_key_length,

1506

add_nodes_callback=None):

1507

"""Construct an adapter against adapted with prefix."""

1508

self.adapted = adapted

1509

self.prefix_key = prefix + (None,)*missing_key_length

1510

self.prefix = prefix

1511

self.prefix_len = len(prefix)

1512

self.add_nodes_callback = add_nodes_callback

1513

1514

def add_nodes(self, nodes):
    """Add nodes to the index, prepending the prefix to every key.

    :param nodes: An iterable of (key, value, node_refs) entries to add,
        or of (key, value) entries when there are no references.  The
        prefix is added to each key and to every key inside node_refs
        before the result is handed to add_nodes_callback.
    """
    # Keep a reusable copy: nodes may be a one-shot iterator and is walked
    # a second time if the entries turn out to be pairs.
    nodes = tuple(nodes)
    prefixed = []
    try:
        for entry in nodes:
            key, value, node_refs = entry
            # node_refs is a sequence of reference lists; prefix each
            # referenced key.
            new_refs = []
            for ref_list in node_refs:
                new_refs.append(
                    tuple([self.prefix + ref for ref in ref_list]))
            prefixed.append((self.prefix + key, value, tuple(new_refs)))
    except ValueError:
        # XXX: TODO add an explicit interface for getting the reference list
        # status, to handle this bit of user-friendliness in the API more
        # explicitly.
        for key, value in nodes:
            prefixed.append((self.prefix + key, value))
    self.add_nodes_callback(prefixed)

1538

1539

def add_node(self, key, value, references=()):
    """Add a single node to the index.

    This is a convenience wrapper that passes a one-entry sequence to
    add_nodes.

    :param key: The key. keys are non-empty tuples containing
        as many whitespace-free utf8 bytestrings as the key length
        defined for this index.
    :param value: The value to associate with the key. It may be any
        bytes as long as it does not contain \\0 or \\n.
    :param references: An iterable of iterables of keys. Each is a
        reference to another key.
    """
    single = (key, value, references)
    self.add_nodes((single,))

1551

1552

def _strip_prefix(self, an_iter):

1553

"""Strip prefix data from nodes and return it."""

1554

for node in an_iter:

1555

# cross checks

1556

if node[1][:self.prefix_len] != self.prefix:

1557

raise errors.BadIndexData(self)

1558

for ref_list in node[3]:

1559

for ref_node in ref_list:

1560

if ref_node[:self.prefix_len] != self.prefix:

1561

raise errors.BadIndexData(self)

1562

yield node[0], node[1][self.prefix_len:], node[2], (

1563

tuple(tuple(ref_node[self.prefix_len:] for ref_node in ref_list)

1564

for ref_list in node[3]))

1565

1566

def iter_all_entries(self):
    """Iterate over all keys within the index

    iter_all_entries is implemented against the adapted index using
    iter_entries_prefix with self.prefix_key, so only entries stored under
    this adapter's prefix are visited.

    :return: An iterable of (index, key, value, reference_lists), with the
        prefix already stripped from key and from the referenced keys.
        There is no defined order for the result iteration - entries come
        back in whatever order the adapted index produces them.
    """
    prefixed_entries = self.adapted.iter_entries_prefix([self.prefix_key])
    return self._strip_prefix(prefixed_entries)

1577

1578

def iter_entries(self, keys):
    """Iterate over the entries for the given keys.

    Each key has self.prefix prepended before it is looked up in the
    adapted index; the prefix is stripped again from what comes back.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable of (index, key, value, reference_lists). There is no
        defined order for the result iteration - it will be in the most
        efficient order for the index (keys iteration order in this case).
    """
    # Kept lazy: the adapted index consumes the prefixed keys as it goes.
    prefixed_keys = (self.prefix + key for key in keys)
    found = self.adapted.iter_entries(prefixed_keys)
    return self._strip_prefix(found)

1588

1589

def iter_entries_prefix(self, keys):
    """Iterate over entries whose keys match the given key prefixes.

    Matching works on whole key elements, not on the bytes inside an
    element. e.g. with the keys ('foo', 'bar') and ('foobar', 'gam'), a
    prefix search for ('foo', None) returns only the former.

    Each supplied key prefix has self.prefix prepended before the search
    is delegated to the adapted index.

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned.
    """
    # Kept lazy: the adapted index consumes the prefixed keys as it goes.
    prefixed_keys = (self.prefix + key for key in keys)
    matches = self.adapted.iter_entries_prefix(prefixed_keys)
    return self._strip_prefix(matches)

1608

1609

def key_count(self):
    """Return the number of keys in this index.

    For GraphIndexPrefixAdapter this is relatively expensive - every entry
    under the prefix is iterated via iter_all_entries and counted.
    """
    total = 0
    for _entry in self.iter_all_entries():
        total += 1
    return total

1616

1617

def validate(self):
    """Validate the adapted index by calling its validate().

    Whatever the adapted index's validate() returns is not passed back.
    """
    adapted_index = self.adapted
    adapted_index.validate()

Older »