~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Martin Pool
Date: 2005-11-04 01:46:31 UTC
mto: (1185.33.49 bzr.dev)
mto: This revision was merged to the branch mainline in revision 1512.
Revision ID: mbp@sourcefrog.net-20051104014631-750e0ad4172c952c

Make biobench directly executable

files added:
NEWS.developers

build-api

bzrlib/basicio.py

bzrlib/clone.py

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/revfile.py

bzrlib/selftest/testbasicio.py

bzrlib/selftest/testreweave.py

bzrlib/store/compressed_text.py

bzrlib/util/configobj/validate.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

files removed:
BRANCH.TODO

COPYING.txt

bzr.ico

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/cmd_version_info.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/hooks.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test__generate_text_key_index.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_find_text_key_references.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_is_write_locked.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transform.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/bencode.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave_commands.py

bzrlib/workingtree_4.py

bzrlib/xml6.py

bzrlib/xml7.py

contrib/bzr_access

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/profiling.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/best_practice_intro.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/revnos.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/index.txt

generate_docs.py

man1

profile_imports.py

tools/__init__.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/package_mf.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

tools/win32/survey.txt

files renamed:
doc/developers/HACKING.txt => HACKING

tools/doc_generate/autodoc_man.py => bzr_man.py

bzrlib/bundle/__init__.py => bzrlib/changeset.py

bzrlib/deprecated_graph.py => bzrlib/graph.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/http_utils.py => bzrlib/selftest/HTTPTestUtil.py

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_commands.py => bzrlib/selftest/test_command.py

bzrlib/tests/branch_implementations/test_parent.py => bzrlib/selftest/test_parent.py

bzrlib/tests/blackbox/test_revision_info.py => bzrlib/selftest/test_revision_info.py

bzrlib/tests/blackbox/test_annotate.py => bzrlib/selftest/testannotate.py

bzrlib/tests/test_api.py => bzrlib/selftest/testapi.py

bzrlib/tests/branch_implementations/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_config.py => bzrlib/selftest/testconfig.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_fetch.py => bzrlib/selftest/testfetch.py

bzrlib/tests/test_gpg.py => bzrlib/selftest/testgpg.py

bzrlib/tests/test_deprecated_graph.py => bzrlib/selftest/testgraph.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_http.py => bzrlib/selftest/testhttp.py

bzrlib/tests/test_identitymap.py => bzrlib/selftest/testidentitymap.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge.py => bzrlib/selftest/testmerge.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_nonascii.py => bzrlib/selftest/testnonascii.py

bzrlib/tests/test_options.py => bzrlib/selftest/testoptions.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/testplugins.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/repository_implementations/test_revision.py => bzrlib/selftest/testrevprops.py

bzrlib/tests/test_sampler.py => bzrlib/selftest/testsampler.py

bzrlib/tests/test_sftp_transport.py => bzrlib/selftest/testsftp.py

bzrlib/tests/blackbox/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/test_store.py => bzrlib/selftest/teststore.py

bzrlib/tests/test_testament.py => bzrlib/selftest/testtestament.py

bzrlib/tests/test_transactions.py => bzrlib/selftest/testtransactions.py

bzrlib/tests/test_transport.py => bzrlib/selftest/testtransport.py

bzrlib/tests/test_tsort.py => bzrlib/selftest/testtsort.py

bzrlib/tests/test_workingtree.py => bzrlib/selftest/testworkingtree.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/versioned/__init__.py => bzrlib/store/weave.py

bzrlib/transport/http/__init__.py => bzrlib/transport/http.py

bzrlib/ui/__init__.py => bzrlib/ui.py

bzrlib/win32utils.py => bzrlib/win32console.py

bzrlib/xml_serializer.py => bzrlib/xml.py

doc/en/tutorials/tutorial.txt => tutorial.txt

files modified:
.bzrignore

.rsyncexclude

INSTALL

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/stub_sftp.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_conflicts.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_upgrade.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/treeshape.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/testament.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transport/__init__.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/upgrade.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/bash/bzr.simple

contrib/newinventory.py

contrib/pwk

setup.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

# Names exported by ``from bzrlib.index import *``.
__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

symbol_versioning,

)

# A (start offset, length) read request used to fetch the start of the index
# file; it is appended to readv request lists alongside (location, length)
# entries. NOTE(review): 200 bytes is presumably chosen to cover the whole
# header - confirm against the largest possible option lines.
_HEADER_READV = (0, 200)

# Prefix of the header option line recording how many elements each key has.
_OPTION_KEY_ELEMENTS = "key_elements="

# Prefix of the header option line recording the number of keys in the index.
_OPTION_LEN = "len="

# Prefix of the header option line recording the reference lists per node.
_OPTION_NODE_REFS = "node_ref_lists="

# First line written to a serialised index.
_SIGNATURE = "Bazaar Graph Index 1\n"

# Matches any character that is not permitted inside a key element.
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

# Matches any character that is not permitted inside a node value.
_newline_null_re = re.compile('[\n\0]')

class GraphIndexBuilder(object):
    """A builder that can build a GraphIndex.

    The resulting graph has the structure:

    _SIGNATURE OPTIONS NODES NEWLINE
    _SIGNATURE     := 'Bazaar Graph Index 1' NEWLINE
    OPTIONS        := 'node_ref_lists=' DIGITS NEWLINE
                      'key_elements=' DIGITS NEWLINE
                      'len=' DIGITS NEWLINE
    NODES          := NODE*
    NODE           := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
    KEY            := KEY_ELEMENT (NULL KEY_ELEMENT){key_elements - 1}
    KEY_ELEMENT    := Not-whitespace-utf8
    ABSENT         := 'a'
    REFERENCES     := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
    REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?
    REFERENCE      := DIGITS  ; digits is the byte offset in the index of the
                              ; referenced key.
    VALUE          := no-newline-no-null-bytes
    """

    def __init__(self, reference_lists=0, key_elements=1):
        """Create a GraphIndex builder.

        :param reference_lists: The number of node references lists for each
            entry.
        :param key_elements: The number of bytestrings in each key.
        """
        self.reference_lists = reference_lists
        # keys of the nodes that were really added (absent placeholders are
        # excluded); its size is written as the 'len=' option.
        self._keys = set()
        # key -> (absent marker, reference lists, value). The marker is 'a'
        # for a key that has only been referenced, '' for a real node.
        self._nodes = {}
        # nested dicts keyed element by element; only filled for keys with
        # more than one element.
        self._nodes_by_key = {}
        self._key_length = key_elements

    def _check_key(self, key):
        """Raise BadIndexKey if key is not a valid key for this index.

        A valid key is a tuple of exactly the configured number of elements,
        each of them non-empty and free of whitespace and NULL bytes.
        """
        if type(key) != tuple:
            raise errors.BadIndexKey(key)
        if self._key_length != len(key):
            raise errors.BadIndexKey(key)
        for element in key:
            if not element or _whitespace_re.search(element) is not None:
                raise errors.BadIndexKey(element)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        All validation happens before the builder is modified, so a call that
        raises leaves the builder exactly as it was.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        :raises BadIndexKey: if key, or any referenced key, is not valid.
        :raises BadIndexValue: if value contains a forbidden byte, or the
            number of reference lists does not match the builder.
        :raises BadIndexDuplicateKey: if key was already added as a real node.
        """
        self._check_key(key)
        if _newline_null_re.search(value) is not None:
            raise errors.BadIndexValue(value)
        if len(references) != self.reference_lists:
            raise errors.BadIndexValue(references)
        node_refs = []
        # referenced keys that are not known yet; they are only registered
        # once the whole call has been validated.
        absent_references = []
        for reference_list in references:
            for reference in reference_list:
                self._check_key(reference)
                if reference not in self._nodes:
                    absent_references.append(reference)
            node_refs.append(tuple(reference_list))
        if key in self._nodes and self._nodes[key][0] == '':
            raise errors.BadIndexDuplicateKey(key, self)
        for reference in absent_references:
            # placeholder so that the reference can be given an address.
            self._nodes[reference] = ('a', (), '')
        # this also replaces a placeholder left by an earlier reference to
        # key (or by a self reference registered just above).
        self._nodes[key] = ('', tuple(node_refs), value)
        self._keys.add(key)
        if self._key_length > 1:
            key_dict = self._nodes_by_key
            if self.reference_lists:
                key_value = key, value, tuple(node_refs)
            else:
                key_value = key, value
            # possibly should do this on-demand, but it seems likely it is
            # always wanted
            # For a key of (foo, bar, baz) create
            # _nodes_by_key[foo][bar][baz] = key_value
            for subkey in key[:-1]:
                key_dict = key_dict.setdefault(subkey, {})
            key_dict[key[-1]] = key_value

    def finish(self):
        """Serialise the added nodes.

        :return: A StringIO, positioned at its start, holding the index.
        :raises BzrError: if reference lists are in use and the serialised
            length differs from the length predicted while assigning
            addresses.
        """
        lines = [_SIGNATURE]
        lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
        lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
        lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')
        prefix_length = sum(len(x) for x in lines)
        # references are byte offsets. To avoid having to do nasty
        # polynomial work to resolve offsets (references to later in the
        # file cannot be determined until all the inbetween references have
        # been calculated too) we pad the offsets with 0's to make them be
        # of consistent length. Using binary offsets would break the trivial
        # file parsing.
        # to calculate the width of zero's needed we do three passes:
        # one to gather all the non-reference data and the number of references.
        # one to pad all the data with reference-length and determine entry
        # addresses.
        # One to serialise.

        # forward sorted by key. In future we may consider topological sorting,
        # at the cost of table scans for direct lookup, or a second index for
        # direct lookup
        nodes = sorted(self._nodes.items())
        # if we do not prepass, we don't know how long it will be up front.
        expected_bytes = None
        # we only need to pre-pass if we have reference lists at all.
        if self.reference_lists:
            key_offset_info = []
            non_ref_bytes = prefix_length
            total_references = 0
            # TODO use simple multiplication for the constants in this loop.
            for key, (absent, references, value) in nodes:
                # record the offset known *so far* for this key:
                # the non reference bytes to date, and the total references to
                # date - saves reaccumulating on the second pass
                key_offset_info.append((key, non_ref_bytes, total_references))
                # key is variable length tuple, \x00 between elements
                non_ref_bytes += sum(len(element) for element in key)
                if self._key_length > 1:
                    non_ref_bytes += self._key_length - 1
                # value is literal bytes, there are 3 null's, 1 NL.
                non_ref_bytes += len(value) + 3 + 1
                if absent:
                    # one byte for absent if set.
                    non_ref_bytes += 1
                else:
                    # (ref_lists -1) tabs
                    non_ref_bytes += self.reference_lists - 1
                    # (ref-1 cr's per ref_list)
                    for ref_list in references:
                        # how many references across the whole file?
                        total_references += len(ref_list)
                        # accrue reference separators
                        if ref_list:
                            non_ref_bytes += len(ref_list) - 1
            # how many digits are needed to represent the total byte count?
            digits = 1
            possible_total_bytes = non_ref_bytes + total_references*digits
            while 10 ** digits < possible_total_bytes:
                digits += 1
                possible_total_bytes = non_ref_bytes + total_references*digits
            expected_bytes = possible_total_bytes + 1 # terminating newline
            # resolve key addresses.
            key_addresses = {}
            for key, non_ref_bytes, total_references in key_offset_info:
                key_addresses[key] = non_ref_bytes + total_references*digits
            # serialise
            format_string = '%%0%sd' % digits
        for key, (absent, references, value) in nodes:
            flattened_references = []
            for ref_list in references:
                ref_addresses = []
                for reference in ref_list:
                    ref_addresses.append(format_string % key_addresses[reference])
                flattened_references.append('\r'.join(ref_addresses))
            string_key = '\x00'.join(key)
            lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,
                '\t'.join(flattened_references), value))
        lines.append('\n')
        # join once and reuse it for both the length check and the result.
        serialised = ''.join(lines)
        if expected_bytes and len(serialised) != expected_bytes:
            raise errors.BzrError('Failed index creation. Internal error:'
                ' mismatched output length and expected length: %d %d' %
                (len(serialised), expected_bytes))
        return StringIO(serialised)

223

224

225

class GraphIndex(object):

226

"""An index for data with embedded graphs.

227

228

The index maps keys to a list of key reference lists, and a value.

229

Each node has the same number of key reference lists. Each key reference

230

list can be empty or an arbitrary length. The value is an opaque NULL

231

terminated string without any newlines. The storage of the index is

232

hidden in the interface: keys and key references are always tuples of

233

bytestrings, never the internal representation (e.g. dictionary offsets).

234

235

It is presumed that the index will not be mutated - it is static data.

236

237

Successive iter_all_entries calls will read the entire index each time.

238

Additionally, iter_entries calls will read the index linearly until the

239

desired keys are found. XXX: This must be fixed before the index is

240

suitable for production use. :XXX

241

"""

242

243

def __init__(self, transport, name, size):

244

"""Open an index called name on transport.

245

246

:param transport: A bzrlib.transport.Transport.

247

:param name: A path to provide to transport API calls.

248

:param size: The size of the index in bytes. This is used for bisection

249

logic to perform partial index reads. While the size could be

250

obtained by statting the file this introduced an additional round

251

trip as well as requiring stat'able transports, both of which are

252

avoided by having it supplied. If size is None, then bisection

253

support will be disabled and accessing the index will just stream

254

all the data.

255

"""

256

self._transport = transport

257

self._name = name

258

# Becomes a dict of key:(value, reference-list-byte-locations) used by

259

# the bisection interface to store parsed but not resolved keys.

260

self._bisect_nodes = None

261

# Becomes a dict of key:(value, reference-list-keys) which are ready to

262

# be returned directly to callers.

263

self._nodes = None

264

# a sorted list of slice-addresses for the parsed bytes of the file.

265

# e.g. (0,1) would mean that byte 0 is parsed.

266

self._parsed_byte_map = []

267

# a sorted list of keys matching each slice address for parsed bytes

268

# e.g. (None, 'foo@bar') would mean that the first byte contained no

269

# key, and the end byte of the slice is the of the data for 'foo@bar'

270

self._parsed_key_map = []

271

self._key_count = None

272

self._keys_by_offset = None

273

self._nodes_by_key = None

274

self._size = size

275

276

def __eq__(self, other):

277

"""Equal when self and other were created with the same parameters."""

278

return (

279

type(self) == type(other) and

280

self._transport == other._transport and

281

self._name == other._name and

282

self._size == other._size)

283

284

def __ne__(self, other):

285

return not self.__eq__(other)

286

287

def _buffer_all(self):
    """Buffer all the index data.

    Reads the whole file, parses every line and resolves every reference.
    On success this sets self._nodes, self._nodes_by_key and self._keys;
    self._keys_by_offset is filled while parsing. The ready-to-return
    mappings are only published once the data has been validated, so a
    failed read does not leave the index looking fully buffered.

    :raises BadIndexData: if the file does not end with exactly one empty
        trailer line.
    """
    if 'index' in debug.debug_flags:
        mutter('Reading entire index %s', self._transport.abspath(self._name))
    stream = self._transport.get(self._name)
    self._read_prefix(stream)
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    pos = stream.tell()
    lines = stream.read().split('\n')
    # the data ends with a newline, so the final split element is empty.
    del lines[-1]
    _, _, _, trailers = self._parse_lines(lines, pos)
    # ready-to-return key:value or key:value, node_ref_lists
    nodes = {}
    nodes_by_key = {}
    for key, absent, references, value in self._keys_by_offset.itervalues():
        if absent:
            continue
        # resolve references:
        if self.node_ref_lists:
            node_value = (value, self._resolve_references(references))
        else:
            node_value = value
        nodes[key] = node_value
        if self._key_length > 1:
            if self.node_ref_lists:
                key_value = key, node_value[0], node_value[1]
            else:
                key_value = key, node_value
            # possibly should do this on-demand, but it seems likely it is
            # always wanted
            # For a key of (foo, bar, baz) create
            # _nodes_by_key[foo][bar][baz] = key_value
            key_dict = nodes_by_key
            for subkey in key[:-1]:
                key_dict = key_dict.setdefault(subkey, {})
            key_dict[key[-1]] = key_value
    if trailers != 1:
        # there must be one line - the empty trailer line.
        raise errors.BadIndexData(self)
    self._nodes = nodes
    self._nodes_by_key = nodes_by_key
    # cache the keys for quick set intersections
    self._keys = set(nodes)

336

337

def iter_all_entries(self):
    """Iterate over all keys within the index.

    The whole index is buffered first if that has not happened yet.

    :return: An iterable of (index, key, value) or (index, key, value, reference_lists).
        The former tuple is used when there are no reference lists in the
        index, making the API compatible with simple key:value index types.
        There is no defined order for the result iteration - it will be in
        the most efficient order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    if not self.node_ref_lists:
        # plain key:value index, the stored node is the value itself.
        for key, value in self._nodes.iteritems():
            yield self, key, value
        return
    for key, (value, node_ref_lists) in self._nodes.iteritems():
        yield self, key, value, node_ref_lists

357

358

def _read_prefix(self, stream):
    """Read and validate the index header from stream.

    Consumes the signature and the three option lines, storing their values
    on self.node_ref_lists, self._key_length and self._key_count.

    :param stream: A file-like object positioned at the start of the index.
    :raises BadIndexFormatSignature: if the signature does not match.
    :raises BadIndexOptions: if an option line is missing, out of order, or
        does not carry an integer.
    """
    signature = stream.read(len(self._signature()))
    if signature != self._signature():
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    # the option lines, in the order they appear, and where each is stored.
    header_fields = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for prefix, attribute in header_fields:
        options_line = stream.readline()
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        # drop the option name and the final character (the newline).
        raw_value = options_line[len(prefix):-1]
        try:
            parsed_value = int(raw_value)
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed_value)

383

384

def _resolve_references(self, references):

385

"""Return the resolved key references for references.

386

387

References are resolved by looking up the location of the key in the

388

_keys_by_offset map and substituting the key name, preserving ordering.

389

390

:param references: An iterable of iterables of key locations. e.g.

391

[[123, 456], [123]]

392

:return: A tuple of tuples of keys.

393

"""

394

node_refs = []

395

for ref_list in references:

396

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

397

return tuple(node_refs)

398

399

def _find_index(self, range_map, key):

400

"""Helper for the _parsed_*_index calls.

401

402

Given a range map - [(start, end), ...], finds the index of the range

403

in the map for key if it is in the map, and if it is not there, the

404

immediately preceeding range in the map.

405

"""

406

result = bisect_right(range_map, key) - 1

407

if result + 1 < len(range_map):

408

# check the border condition, it may be in result + 1

409

if range_map[result + 1][0] == key[0]:

410

return result + 1

411

return result

412

413

def _parsed_byte_index(self, offset):

414

"""Return the index of the entry immediately before offset.

415

416

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

417

there is one unparsed byte (the 11th, addressed as[10]). then:

418

asking for 0 will return 0

419

asking for 10 will return 0

420

asking for 11 will return 1

421

asking for 12 will return 1

422

"""

423

key = (offset, 0)

424

return self._find_index(self._parsed_byte_map, key)

425

426

def _parsed_key_index(self, key):

427

"""Return the index of the entry immediately before key.

428

429

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

430

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

431

have been parsed, then:

432

asking for '' will return 0

433

asking for 'a' will return 0

434

asking for 'b' will return 1

435

asking for 'e' will return 1

436

"""

437

search_key = (key, None)

438

return self._find_index(self._parsed_key_map, search_key)

439

440

def _is_parsed(self, offset):

441

"""Returns True if offset has been parsed."""

442

index = self._parsed_byte_index(offset)

443

if index == len(self._parsed_byte_map):

444

return offset < self._parsed_byte_map[index - 1][1]

445

start, end = self._parsed_byte_map[index]

446

return offset >= start and offset < end

447

448

def _iter_entries_from_total_buffer(self, keys):

449

"""Iterate over keys when the entire index is parsed."""

450

keys = keys.intersection(self._keys)

451

if self.node_ref_lists:

452

for key in keys:

453

value, node_refs = self._nodes[key]

454

yield self, key, value, node_refs

455

else:

456

for key in keys:

457

yield self, key, self._nodes[key]

458

459

def iter_entries(self, keys):

460

"""Iterate over keys within the index.

461

462

:param keys: An iterable providing the keys to be retrieved.

463

:return: An iterable as per iter_all_entries, but restricted to the

464

keys supplied. No additional keys will be returned, and every

465

key supplied that is in the index will be returned.

466

"""

467

# PERFORMANCE TODO: parse and bisect all remaining data at some

468

# threshold of total-index processing/get calling layers that expect to

469

# read the entire index to use the iter_all_entries method instead.

470

keys = set(keys)

471

if not keys:

472

return []

473

if self._size is None and self._nodes is None:

474

self._buffer_all()

475

if self._nodes is not None:

476

return self._iter_entries_from_total_buffer(keys)

477

else:

478

return (result[1] for result in bisect_multi_bytes(

479

self._lookup_keys_via_location, self._size, keys))

480

481

def iter_entries_prefix(self, keys):

482

"""Iterate over keys within the index using prefix matching.

483

484

Prefix matching is applied within the tuple of a key, not to within

485

the bytestring of each key element. e.g. if you have the keys ('foo',

486

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

487

only the former key is returned.

488

489

WARNING: Note that this method currently causes a full index parse

490

unconditionally (which is reasonably appropriate as it is a means for

491

thunking many small indices into one larger one and still supplies

492

iter_all_entries at the thunk layer).

493

494

:param keys: An iterable providing the key prefixes to be retrieved.

495

Each key prefix takes the form of a tuple the length of a key, but

496

with the last N elements 'None' rather than a regular bytestring.

497

The first element cannot be 'None'.

498

:return: An iterable as per iter_all_entries, but restricted to the

499

keys with a matching prefix to those supplied. No additional keys

500

will be returned, and every match that is in the index will be

501

returned.

502

"""

503

keys = set(keys)

504

if not keys:

505

return

506

# load data - also finds key lengths

507

if self._nodes is None:

508

self._buffer_all()

509

if self._key_length == 1:

510

for key in keys:

511

# sanity check

512

if key[0] is None:

513

raise errors.BadIndexKey(key)

514

if len(key) != self._key_length:

515

raise errors.BadIndexKey(key)

516

if self.node_ref_lists:

517

value, node_refs = self._nodes[key]

518

yield self, key, value, node_refs

519

else:

520

yield self, key, self._nodes[key]

521

return

522

for key in keys:

523

# sanity check

524

if key[0] is None:

525

raise errors.BadIndexKey(key)

526

if len(key) != self._key_length:

527

raise errors.BadIndexKey(key)

528

# find what it refers to:

529

key_dict = self._nodes_by_key

530

elements = list(key)

531

# find the subdict whose contents should be returned.

532

try:

533

while len(elements) and elements[0] is not None:

534

key_dict = key_dict[elements[0]]

535

elements.pop(0)

536

except KeyError:

537

# a non-existant lookup.

538

continue

539

if len(elements):

540

dicts = [key_dict]

541

while dicts:

542

key_dict = dicts.pop(-1)

543

# can't be empty or would not exist

544

item, value = key_dict.iteritems().next()

545

if type(value) == dict:

546

# push keys

547

dicts.extend(key_dict.itervalues())

548

else:

549

# yield keys

550

for value in key_dict.itervalues():

551

# each value is the key:value:node refs tuple

552

# ready to yield.

553

yield (self, ) + value

554

else:

555

# the last thing looked up was a terminal element

556

yield (self, ) + key_dict

557

558

def key_count(self):

559

"""Return an estimate of the number of keys in this index.

560

561

For GraphIndex the estimate is exact.

562

"""

563

if self._key_count is None:

564

self._read_and_parse([_HEADER_READV])

565

return self._key_count

566

567

def _lookup_keys_via_location(self, location_keys):
    """Bisection callback: try to answer each key near its probe location.

    If _buffer_all has been called, then all the data for the index is in
    memory, and this method should not be called, as it uses a separate
    cache because it cannot pre-resolve all indices, which buffer_all does
    for performance.

    :param location_keys: A list of location(byte offset), key tuples. It
        is iterated more than once.
    :return: A list of (location_key, result) tuples as expected by
        bzrlib.bisect_multi.bisect_multi_bytes. result is the entry tuple
        when the key was found, False when the key is known to be absent,
        and -1 or +1 when the key lies below or above the probed region.
    """
    # Possible improvements:
    #  - only bisect lookup each key once
    #  - sort the keys first, and use that to reduce the bisection window
    # -----
    # this progresses in three parts:
    # read data
    # parse it
    # attempt to answer the question from the now in memory data.

    def read_request(location):
        # for each location, ask for 800 bytes - much more than rows we've
        # seen anywhere - clamped to the end of the file. Returns None when
        # nothing is left to read.
        length = 800
        if location + length > self._size:
            length = self._size - location
        if length > 0:
            return (location, length)
        return None

    # build the readv request
    readv_ranges = []
    for location, key in location_keys:
        # can we answer from cache?
        if self._bisect_nodes and key in self._bisect_nodes:
            # We have the key parsed.
            continue
        index = self._parsed_key_index(key)
        if (len(self._parsed_key_map) and
            self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            # the key has been parsed, so no lookup is needed even if its
            # not present.
            continue
        # - if we have examined this part of the file already - yes
        index = self._parsed_byte_index(location)
        if (len(self._parsed_byte_map) and
            self._parsed_byte_map[index][0] <= location and
            self._parsed_byte_map[index][1] > location):
            # the byte region has been parsed, so no read is needed.
            continue
        # todo, trim out parsed locations.
        request = read_request(location)
        if request is not None:
            readv_ranges.append(request)
    # read the header if needed
    if self._bisect_nodes is None:
        readv_ranges.append(_HEADER_READV)
    self._read_and_parse(readv_ranges)
    # generate results:
    #  - figure out <, >, missing, present
    #  - result present references so we can return them.
    result = []
    # keys that we cannot answer until we resolve references
    pending_references = []
    pending_locations = set()
    for location, key in location_keys:
        # can we answer from cache?
        if key in self._bisect_nodes:
            # the key has been parsed, so no lookup is needed
            if self.node_ref_lists:
                # the references may not have been all parsed.
                value, refs = self._bisect_nodes[key]
                wanted_locations = []
                for ref_list in refs:
                    for ref in ref_list:
                        if ref not in self._keys_by_offset:
                            wanted_locations.append(ref)
                if wanted_locations:
                    pending_locations.update(wanted_locations)
                    pending_references.append((location, key))
                    continue
                result.append(((location, key), (self, key,
                    value, self._resolve_references(refs))))
            else:
                result.append(((location, key),
                    (self, key, self._bisect_nodes[key])))
            continue
        # has the region the key should be in, been parsed?
        index = self._parsed_key_index(key)
        if (self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            result.append(((location, key), False))
            continue
        # no, is the key above or below the probed location:
        # get the range of the probed & parsed location
        index = self._parsed_byte_index(location)
        # if the key is below the start of the range, its below
        if key < self._parsed_key_map[index][0]:
            direction = -1
        else:
            direction = +1
        result.append(((location, key), direction))
    readv_ranges = []
    # lookup data to resolve references
    for location in pending_locations:
        # TODO: trim out parsed locations (e.g. if the 800 is into the
        # parsed region trim it, and dont use the adjust_for_latency
        # facility)
        request = read_request(location)
        if request is not None:
            readv_ranges.append(request)
    self._read_and_parse(readv_ranges)
    for location, key in pending_references:
        # answer key references we had to look-up-late.
        value, refs = self._bisect_nodes[key]
        result.append(((location, key), (self, key,
            value, self._resolve_references(refs))))
    return result

688

689

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    Stores the option values on self.node_ref_lists, self._key_length and
    self._key_count, records the header bytes as parsed and resets the
    bisection parsing state.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data (which may have length 0).
    :raises BadIndexFormatSignature: if the signature does not match.
    :raises BadIndexOptions: if an option line is missing, out of order, or
        does not carry an integer.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if not signature == expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(expected_signature):].splitlines()
    if len(lines) < 3:
        # a truncated header is bad options, not an IndexError.
        raise errors.BadIndexOptions(self)
    # the option lines, in the order they appear, and where each is stored.
    header_fields = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for options_line, (prefix, attribute) in zip(lines, header_fields):
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            parsed_value = int(options_line[len(prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed_value)
    # calculate the bytes we have processed; the + 3 accounts for the
    # newline that splitlines removed from each option line.
    header_end = (len(signature) + len(lines[0]) + len(lines[1]) +
        len(lines[2]) + 3)
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

732

733

def _parse_region(self, offset, data):

734

"""Parse node data returned from a readv operation.

735

736

:param offset: The byte offset the data starts at.

737

:param data: The data to parse.

738

"""

739

# trim the data.

740

# end first:

741

end = offset + len(data)

742

high_parsed = offset

743

while True:

744

# Trivial test - if the current index's end is within the

745

# low-matching parsed range, we're done.

746

index = self._parsed_byte_index(high_parsed)

747

if end < self._parsed_byte_map[index][1]:

748

return

749

# print "[%d:%d]" % (offset, end), \

750

# self._parsed_byte_map[index:index + 2]

751

high_parsed, last_segment = self._parse_segment(

752

offset, data, end, index)

753

if last_segment:

754

return

755

756

def _parse_segment(self, offset, data, end, index):
    """Parse one segment of data.

    The data is first trimmed so that only complete, not yet parsed lines
    remain; those are parsed, cached in self._bisect_nodes and recorded as
    parsed.

    :param offset: Where 'data' begins in the file.
    :param data: Some data to parse a segment of.
    :param end: Where data ends
    :param index: The current index into the parsed bytes map.
    :return: high_parsed_byte, last_segment.
        high_parsed_byte is the location of the highest parsed byte in this
        segment, last_segment is True if the parsed segment is the last
        possible one in the data block.
    """
    # default is to use all data
    trim_end = None
    # accommodate overlap with data before this.
    lower_region_end = self._parsed_byte_map[index][1]
    if offset < lower_region_end:
        # overlaps the lower parsed region
        # skip the parsed data
        trim_start = lower_region_end - offset
        # don't trim the start for \n
        start_adjacent = True
    elif offset == lower_region_end:
        # abuts the lower parsed region
        # use all data
        trim_start = None
        # do not trim anything
        start_adjacent = True
    else:
        # does not overlap the lower parsed region
        # use all data
        trim_start = None
        # but trim the leading \n
        start_adjacent = False
    if end == self._size:
        # lines up to the end of all data:
        # use it all, do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif index + 1 == len(self._parsed_byte_map):
        # at the end of the parsed data
        # use it all, but strip to the last \n
        end_adjacent = False
        last_segment = True
    elif end == self._parsed_byte_map[index + 1][0]:
        # butts up against the next parsed region
        # use it all, do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif end > self._parsed_byte_map[index + 1][0]:
        # overlaps into the next parsed region
        # only consider the unparsed data
        trim_end = self._parsed_byte_map[index + 1][0] - offset
        # do not strip to the last \n as we know its an entire record
        end_adjacent = True
        last_segment = end < self._parsed_byte_map[index + 1][1]
    else:
        # does not overlap into the next region
        # use it all, but strip to the last \n
        end_adjacent = False
        last_segment = True
    # now find bytes to discard if needed
    if not start_adjacent:
        # trim_start is always None here: it is only set when the data
        # overlaps the lower region, which also makes it start_adjacent.
        # Drop the partial line at the front.
        trim_start = data.find('\n') + 1
        assert trim_start != 0, 'no \n was present'
    if not end_adjacent:
        # trim_end is always None here: it is only set when the data
        # overlaps the next region, which also makes it end_adjacent.
        # Drop the partial line at the back.
        trim_end = data.rfind('\n') + 1
        assert trim_end != 0, 'no \n was present'
    # adjust offset and data to the parseable data.
    trimmed_data = data[trim_start:trim_end]
    # %s rather than %d for the trims: either may still be None here.
    assert trimmed_data, 'read unneeded data [%s:%s] from [%d:%d]' % (
        trim_start, trim_end, offset, offset + len(data))
    if trim_start:
        offset += trim_start
    # splitlines mangles the \r delimiters.. don't use it.
    lines = trimmed_data.split('\n')
    del lines[-1]
    pos = offset
    first_key, last_key, nodes, _ = self._parse_lines(lines, pos)
    for key, value in nodes:
        self._bisect_nodes[key] = value
    self._parsed_bytes(offset, first_key,
        offset + len(trimmed_data), last_key)
    return offset + len(trimmed_data), last_segment

860

861

def _parse_lines(self, lines, pos):

862

key = None

863

first_key = None

864

trailers = 0

865

nodes = []

866

for line in lines:

867

if line == '':

868

# must be at the end

869

if self._size:

870

assert self._size == pos + 1, "%s %s" % (self._size, pos)

871

trailers += 1

872

continue

873

elements = line.split('\0')

874

if len(elements) != self._expected_elements:

875

raise errors.BadIndexData(self)

876

# keys are tuples

877

key = tuple(elements[:self._key_length])

878

if first_key is None:

879

first_key = key

880

absent, references, value = elements[-3:]

881

ref_lists = []

882

for ref_string in references.split('\t'):

883

ref_lists.append(tuple([

884

int(ref) for ref in ref_string.split('\r') if ref

885

]))

886

ref_lists = tuple(ref_lists)

887

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

888

pos += len(line) + 1 # +1 for the \n

889

if absent:

890

continue

891

if self.node_ref_lists:

892

node_value = (value, ref_lists)

893

else:

894

node_value = value

895

nodes.append((key, node_value))

896

# print "parsed ", key

897

return first_key, key, nodes, trailers

898

899

def _parsed_bytes(self, start, start_key, end, end_key):

900

"""Mark the bytes from start to end as parsed.

901

902

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

903

1) as parsed.

904

905

:param start: The start of the parsed region.

906

:param end: The end of the parsed region.

907

"""

908

index = self._parsed_byte_index(start)

909

new_value = (start, end)

910

new_key = (start_key, end_key)

911

if index == -1:

912

# first range parsed is always the beginning.

913

self._parsed_byte_map.insert(index, new_value)

914

self._parsed_key_map.insert(index, new_key)

915

return

916

# four cases:

917

# new region

918

# extend lower region

919

# extend higher region

920

# combine two regions

921

if (index + 1 < len(self._parsed_byte_map) and

922

self._parsed_byte_map[index][1] == start and

923

self._parsed_byte_map[index + 1][0] == end):

924

# combine two regions

925

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

926

self._parsed_byte_map[index + 1][1])

927

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

928

self._parsed_key_map[index + 1][1])

929

del self._parsed_byte_map[index + 1]

930

del self._parsed_key_map[index + 1]

931

elif self._parsed_byte_map[index][1] == start:

932

# extend the lower entry

933

self._parsed_byte_map[index] = (

934

self._parsed_byte_map[index][0], end)

935

self._parsed_key_map[index] = (

936

self._parsed_key_map[index][0], end_key)

937

elif (index + 1 < len(self._parsed_byte_map) and

938

self._parsed_byte_map[index + 1][0] == end):

939

# extend the higher entry

940

self._parsed_byte_map[index + 1] = (

941

start, self._parsed_byte_map[index + 1][1])

942

self._parsed_key_map[index + 1] = (

943

start_key, self._parsed_key_map[index + 1][1])

944

else:

945

# new entry

946

self._parsed_byte_map.insert(index + 1, new_value)

947

self._parsed_key_map.insert(index + 1, new_key)

948

949

def _read_and_parse(self, readv_ranges):
    """Read the ranges and parse the resulting data.

    :param readv_ranges: A prepared readv range list. When it is empty
        nothing is read.
    """
    if not readv_ranges:
        return
    chunks = self._transport.readv(self._name, readv_ranges, True,
        self._size)
    for offset, data in chunks:
        if self._bisect_nodes is None:
            # _bisect_nodes is still unset, so this must be the start of
            # the file: parse the header and carry on with what follows.
            assert offset == 0
            offset, data = self._parse_header_from_bytes(data)
        self._parse_region(offset, data)

965

966

def _signature(self):
    """Return the file signature used by this index type."""
    return _SIGNATURE

969

970

def validate(self):
    """Validate that everything in the index can be accessed.

    iter_all_entries validates completely at the moment, so exhausting it
    and discarding the entries is all that is needed.
    """
    for _ in self.iter_all_entries():
        pass

975

976

977

class CombinedGraphIndex(object):
    """A GraphIndex made up from smaller GraphIndices.

    The backing indices must implement GraphIndex, and are presumed to be
    static data.

    Queries are run against the backing indices one after another, in list
    order, so the order of the indices can influence performance
    significantly. For example, if one index is on local disk and a second
    on a remote server, the local disk index should come first in the list.
    """

    def __init__(self, indices):
        """Create a CombinedGraphIndex backed by indices.

        :param indices: An ordered list of indices to query for data. The
            list itself is kept (not copied) and is modified by
            insert_index.
        """
        self._indices = indices

    def __repr__(self):
        child_reprs = ', '.join([repr(index) for index in self._indices])
        return "%s(%s)" % (self.__class__.__name__, child_reprs)

    @symbol_versioning.deprecated_method(symbol_versioning.one_one)
    def get_parents(self, revision_ids):
        """See graph._StackedParentsProvider.get_parents.

        This implementation thunks the graph.Graph.get_parents api across
        to GraphIndex by way of get_parent_map.

        :param revision_ids: An iterable of graph keys for this graph. It
            is iterated twice.
        :return: A list of parent details for each key in revision_ids.
            Each parent details will be one of:
             * None when the key was missing
             * (NULL_REVISION,) when the key has no parents.
             * (parent_key, parent_key...) otherwise.
        """
        lookup = self.get_parent_map(revision_ids).get
        return [lookup(revision_id, None) for revision_id in revision_ids]

    def get_parent_map(self, keys):
        """See graph._StackedParentsProvider.get_parent_map"""
        search_keys = set(keys)
        found_parents = {}
        if NULL_REVISION in search_keys:
            # NULL_REVISION is never looked up in the indices.
            search_keys.discard(NULL_REVISION)
            found_parents[NULL_REVISION] = []
        for index, key, value, refs in self.iter_entries(search_keys):
            # the first reference list holds the parents; an empty one
            # means the only parent is NULL_REVISION.
            found_parents[key] = refs[0] or (NULL_REVISION,)
        return found_parents

    def insert_index(self, pos, index):
        """Insert a new index in the list of indices to query.

        :param pos: The position to insert the index.
        :param index: The index to insert.
        """
        self._indices.insert(pos, index)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once (the first index that has the key
        wins).

        :return: An iterable of the nodes yielded by the child indices,
            i.e. (index, key, value, reference_lists). There is no defined
            order for the result iteration - it will be in the most
            efficient order for the index.
        """
        reported = set()
        for index in self._indices:
            for node in index.iter_all_entries():
                key = node[1]
                if key in reported:
                    continue
                yield node
                reported.add(key)

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of the nodes yielded by the child indices,
            i.e. (index, key, value, reference_lists). There is no defined
            order for the result iteration - it will be in the most
            efficient order for the index.
        """
        remaining = set(keys)
        for index in self._indices:
            if not remaining:
                # everything asked for has been found already
                break
            for node in index.iter_entries(remaining):
                remaining.remove(node[1])
                yield node

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys
        ('foo', 'bar'), ('foobar', 'gam') and do a prefix search for
        ('foo', None) then only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key,
            but with the last N elements 'None' rather than a regular
            bytestring. The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional
            keys will be returned, and every match that is in the index
            will be returned.
        """
        prefixes = set(keys)
        if not prefixes:
            return
        reported = set()
        for index in self._indices:
            for node in index.iter_entries_prefix(prefixes):
                if node[1] not in reported:
                    reported.add(node[1])
                    yield node

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For CombinedGraphIndex this is approximated by the sum of the keys
        of the child indices. As child indices may have duplicate keys this
        can have a maximum error of the number of child indices * largest
        number of keys in any index.
        """
        total = 0
        for index in self._indices:
            total += index.key_count()
        return total

    def validate(self):
        """Validate that everything in the index can be accessed."""
        for child in self._indices:
            child.validate()

1123

1124

1125

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during
    a single write operation, where the accumulated entries need to be
    immediately available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of entries to add: (key, value, node_refs)
            when this index has reference lists, (key, value) otherwise.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Nodes flagged as absent are skipped.

        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when the index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (in this case
            dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        if self.reference_lists:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value, references
        else:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Keys that are not in the index, or whose node is flagged as absent,
        are silently skipped.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when the index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (keys iteration order
            in this case).
        """
        keys = set(keys)
        if self.reference_lists:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2], node[1]
        else:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys
        ('foo', 'bar'), ('foobar', 'gam') and do a prefix search for
        ('foo', None) then only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key,
            but with the last N elements 'None' rather than a regular
            bytestring. The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional
            keys will be returned, and every match that is in the index
            will be returned. Prefixes that match nothing yield nothing.
        :raises errors.BadIndexKey: When a prefix starts with None or is
            not self._key_length elements long. As this is a generator the
            error is raised when that prefix is reached during iteration.
        """
        # XXX: Too much duplication with the GraphIndex class; consider
        # finding a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            if self._key_length == 1:
                # With one-element keys a valid prefix is a complete key,
                # so look it up directly.
                try:
                    node = self._nodes[key]
                except KeyError:
                    # a non-existent lookup: skip it, exactly as the
                    # multi-element path below does.
                    continue
                if node[0]:
                    # flagged absent
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
                continue
            # find what it refers to:
            key_dict = self._nodes_by_key
            elements = list(key)
            # find the subdict to return
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                # Some trailing elements were None: walk everything stored
                # below the point that was reached.
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    value = key_dict.itervalues().next()
                    if isinstance(value, dict):
                        # push the nested dicts
                        dicts.extend(key_dict.itervalues())
                    else:
                        # the values are the nodes themselves
                        for value in key_dict.itervalues():
                            yield (self, ) + value
            else:
                # the whole key was given, so key_dict is the node itself
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory indices have no known corruption at the moment."""

1263

1264

1265

class GraphIndexPrefixAdapter(object):
    """An adapter between GraphIndex with different key lengths.

    Queries against this will emit queries against the adapted Graph with
    the prefix added, queries for all items use iter_entries_prefix. The
    returned nodes will have their keys and node references adjusted to
    remove the prefix. Finally, an add_nodes_callback can be supplied -
    when called the nodes and references being added will have prefix
    prepended.
    """

    def __init__(self, adapted, prefix, missing_key_length,
        add_nodes_callback=None):
        """Construct an adapter against adapted with prefix.

        :param adapted: The index that queries are forwarded to.
        :param prefix: A tuple prepended to every key handed to adapted and
            stripped from every key it returns.
        :param missing_key_length: How many None elements to append to
            prefix to build the prefix key used by iter_all_entries.
        :param add_nodes_callback: Called by add_nodes with the list of
            prefixed nodes.
        """
        self.adapted = adapted
        self.prefix_key = prefix + (None,)*missing_key_length
        self.prefix = prefix
        self.prefix_len = len(prefix)
        self.add_nodes_callback = add_nodes_callback

    def add_nodes(self, nodes):
        """Add nodes to the index.

        The prefix is prepended to every key and to every reference, and
        the result is handed to add_nodes_callback as a single list.

        :param nodes: An iterable of (key, value, node_refs) entries to
            add; (key, value) entries are accepted as well.
        """
        # save nodes in case its an iterator
        nodes = tuple(nodes)
        translated_nodes = []
        try:
            # Add prefix_key to each reference node_refs is a tuple of
            # tuples, so split it apart, and add prefix_key to the internal
            # reference
            for (key, value, node_refs) in nodes:
                adjusted_references = (
                    tuple(tuple(self.prefix + ref_node for ref_node in ref_list)
                        for ref_list in node_refs))
                translated_nodes.append((self.prefix + key, value,
                    adjusted_references))
        except ValueError:
            # XXX: TODO add an explicit interface for getting the reference
            # list status, to handle this bit of user-friendliness in the
            # API more explicitly.
            # Unpacking failed, so the nodes are (key, value) pairs.
            for (key, value) in nodes:
                translated_nodes.append((self.prefix + key, value))
        self.add_nodes_callback(translated_nodes)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain NUL or newline.
        """
        self.add_nodes(((key, value, references), ))

    def _strip_prefix(self, an_iter):
        """Strip prefix data from nodes and return it.

        :param an_iter: An iterable of nodes from the adapted index, either
            (index, key, value, reference_lists) or (index, key, value).
        :return: An iterable of the same nodes with the prefix removed from
            the key and from every reference.
        :raises errors.BadIndexData: When a key or a reference does not
            start with the prefix.
        """
        prefix = self.prefix
        prefix_len = self.prefix_len
        for node in an_iter:
            # cross checks
            if node[1][:prefix_len] != prefix:
                raise errors.BadIndexData(self)
            if len(node) < 4:
                # A node from an index without reference lists: there is
                # nothing beyond the key to strip.
                yield node[0], node[1][prefix_len:], node[2]
                continue
            stripped_refs = []
            for ref_list in node[3]:
                for ref_node in ref_list:
                    if ref_node[:prefix_len] != prefix:
                        raise errors.BadIndexData(self)
                stripped_refs.append(
                    tuple([ref_node[prefix_len:] for ref_node in ref_list]))
            yield (node[0], node[1][prefix_len:], node[2],
                tuple(stripped_refs))

    def iter_all_entries(self):
        """Iterate over all keys within the index

        iter_all_entries is implemented against the adapted index using
        iter_entries_prefix.

        :return: An iterable of (index, key, value, reference_lists). There
            is no defined order for the result iteration - it is whatever
            order the adapted index uses.
        """
        return self._strip_prefix(
            self.adapted.iter_entries_prefix([self.prefix_key]))

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There
            is no defined order for the result iteration - it is whatever
            order the adapted index uses.
        """
        return self._strip_prefix(self.adapted.iter_entries(
            self.prefix + key for key in keys))

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys
        ('foo', 'bar'), ('foobar', 'gam') and do a prefix search for
        ('foo', None) then only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key,
            but with the last N elements 'None' rather than a regular
            bytestring. The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional
            keys will be returned, and every match that is in the index
            will be returned.
        """
        return self._strip_prefix(self.adapted.iter_entries_prefix(
            self.prefix + key for key in keys))

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndexPrefixAdapter this is relatively expensive - key
        iteration with the prefix is done.
        """
        # count as we go rather than building a list of every node
        return sum(1 for _ in self.iter_all_entries())

    def validate(self):
        """Call the adapted's validate."""
        self.adapted.validate()

Older »