~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: John Arbash Meinel
Date: 2007-11-13 20:37:09 UTC
mto: This revision was merged to the branch mainline in revision 3001.
Revision ID: john@arbash-meinel.com-20071113203709-kysdte0emqv84pnj

https://launchpad.net/bugs/162486

Fix bug #162486, by having RemoteBranch properly initialize self._revision_id_to_revno_map.

files added:
COPYING.txt

bzr.ico

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/cmd_version_info.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/help_topics.py

bzrlib/hooks.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/multiparent.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned

bzrlib/strace.py

bzrlib/tag.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HttpServer.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/ftp_server.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_is_write_locked.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transform.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/tuned_gzip.py

bzrlib/urlutils.py

bzrlib/util/bencode.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave_commands.py

bzrlib/workingtree_4.py

bzrlib/xml6.py

bzrlib/xml7.py

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/knitpack.txt

doc/developers/last-modified.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/profiling.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/user-guide

doc/en/user-guide/authentication_conf.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/centralized_workflow.txt

doc/en/user-guide/configuration.txt

doc/en/user-guide/conflicts.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/index.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/version_info.txt

doc/en/user-reference

doc/en/user-reference/hooks.txt

doc/en/user-reference/index.txt

doc/index.txt

generate_docs.py

man1

profile_imports.py

tools/__init__.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

tools/win32/survey.txt

files removed:
NEWS.developers

build-api

bzrlib/clone.py

bzrlib/merge_core.py

bzrlib/tests/test_remove.py

bzrlib/tests/test_reweave.py

bzrlib/util/configobj/validate.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

files renamed:
bzrlib/changeset.py => bzrlib/bundle/__init__.py

bzrlib/graph.py => bzrlib/deprecated_graph.py

bzrlib/store/weave.py => bzrlib/store/versioned/__init__.py

bzrlib/tests/test_annotate.py => bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/test_status.py => bzrlib/tests/blackbox/test_status.py

bzrlib/tests/test_uncommit.py => bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/test_branch.py => bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/test_parent.py => bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/test_revprops.py => bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/test_command.py => bzrlib/tests/test_commands.py

bzrlib/tests/test_graph.py => bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_basis_inventory.py => bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/transport/http.py => bzrlib/transport/http/__init__.py

bzrlib/win32console.py => bzrlib/win32utils.py

bzrlib/xml.py => bzrlib/xml_serializer.py

HACKING => doc/developers/HACKING.txt

tutorial.txt => doc/en/user-guide/tutorial.txt

bzr_man.py => tools/doc_generate/autodoc_man.py

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py *

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/bash/bzr.simple

contrib/newinventory.py

contrib/pwk

setup.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/trace-revisions

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.trace import mutter

""")

from bzrlib import debug, errors

# Prefixes of the option lines in a serialised index. GraphIndexBuilder.finish()
# writes each prefix followed by a decimal number and a newline: the number of
# elements per key, the number of keys added, and the number of reference
# lists per node, respectively.
_OPTION_KEY_ELEMENTS = "key_elements="

_OPTION_LEN = "len="

_OPTION_NODE_REFS = "node_ref_lists="

# Signature line; GraphIndexBuilder.finish() emits it before anything else.
_SIGNATURE = "Bazaar Graph Index 1\n"

# Characters that may not appear in a key element: tab, newline, vertical tab,
# form feed, carriage return, NUL and space.
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

# Characters that may not appear in a node value: newline and NUL.
_newline_null_re = re.compile('[\n\0]')

class GraphIndexBuilder(object):

"""A builder that can build a GraphIndex.

The resulting graph has the structure:

_SIGNATURE OPTIONS NODES NEWLINE

_SIGNATURE := 'Bazaar Graph Index 1' NEWLINE

OPTIONS := 'node_ref_lists=' DIGITS NEWLINE 'key_elements=' DIGITS NEWLINE 'len=' DIGITS NEWLINE

NODES := NODE*

NODE := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

KEY := Not-whitespace-utf8

ABSENT := 'a'

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

REFERENCE := DIGITS ; digits is the byte offset in the index of the

; referenced key.

VALUE := no-newline-no-null-bytes

"""

def __init__(self, reference_lists=0, key_elements=1):
    """Set up an empty builder.

    :param reference_lists: How many reference lists every node added to
        this builder must supply.
    :param key_elements: How many bytestrings make up each key tuple.
    """
    # Shape of the index being built.
    self._key_length = key_elements
    self.reference_lists = reference_lists
    # Everything below is filled in by add_node().
    # key -> (absent marker, reference lists, value)
    self._nodes = {}
    # Nested dicts, one level per key element; only populated when keys
    # have more than one element.
    self._nodes_by_key = {}
    # Keys that were explicitly added (placeholders for referenced-only
    # keys are not recorded here).
    self._keys = set()

def _check_key(self, key):
    """Validate ``key`` against this index's key rules.

    A valid key is exactly a ``tuple`` (subclasses are rejected) holding
    ``self._key_length`` elements, each of which is non-empty and free of
    the characters matched by ``_whitespace_re``.

    :param key: The candidate key.
    :raises errors.BadIndexKey: With the whole key when its type or length
        is wrong, or with the offending element when an element is empty
        or contains a forbidden character.
    """
    # Whole-key checks: the type test runs first, so len() is only ever
    # called on a real tuple.
    if type(key) != tuple or self._key_length != len(key):
        raise errors.BadIndexKey(key)
    # Per-element checks; the first bad element is the one reported.
    for part in key:
        if not part:
            raise errors.BadIndexKey(part)
        if _whitespace_re.search(part) is not None:
            raise errors.BadIndexKey(part)

def add_node(self, key, value, references=()):
    """Add a node to the index.

    All validation happens before the builder is modified, so a call that
    raises leaves the builder exactly as it was.

    :param key: The key. keys are non-empty tuples containing
        as many whitespace-free utf8 bytestrings as the key length
        defined for this index.
    :param value: The value to associate with the key. It may be any
        bytes as long as it does not contain a NUL (\\0) or newline (\\n).
    :param references: A sized collection holding exactly
        ``self.reference_lists`` iterables of keys. Each key is a
        reference to another key. The inner iterables may be one-shot
        iterators; each is consumed exactly once.
    :raises errors.BadIndexKey: If ``key`` or any referenced key is
        rejected by ``_check_key``.
    :raises errors.BadIndexValue: If ``value`` contains NUL or newline, or
        if the number of reference lists is wrong.
    :raises errors.BadIndexDuplicateKey: If ``key`` was already added as a
        present (non-placeholder) node.
    """
    self._check_key(key)
    if _newline_null_re.search(value) is not None:
        raise errors.BadIndexValue(value)
    if len(references) != self.reference_lists:
        raise errors.BadIndexValue(references)

    # Validation pass: collect what needs recording without touching self.
    node_refs = []
    absent_references = []
    for reference_list in references:
        # Materialise once so a one-shot iterator is not exhausted by the
        # validation loop before it is stored.
        reference_list = tuple(reference_list)
        for reference in reference_list:
            self._check_key(reference)
            if reference not in self._nodes:
                absent_references.append(reference)
        node_refs.append(reference_list)
    node_refs = tuple(node_refs)
    # An existing entry marked 'a' is only a placeholder created by an
    # earlier reference, so it may be replaced by the real node.
    if key in self._nodes and self._nodes[key][0] == '':
        raise errors.BadIndexDuplicateKey(key, self)

    # Commit pass: every check has succeeded. Placeholders go in first so
    # that a self-reference is overwritten by the real node below.
    for reference in absent_references:
        self._nodes[reference] = ('a', (), '')
    self._nodes[key] = ('', node_refs, value)
    self._keys.add(key)
    if self._key_length > 1:
        if self.reference_lists:
            key_value = key, value, node_refs
        else:
            key_value = key, value
        # possibly should do this on-demand, but it seems likely it is
        # always wanted
        # For a key of (foo, bar, baz) create
        # _nodes_by_key[foo][bar][baz] = key_value
        key_dict = self._nodes_by_key
        for subkey in key[:-1]:
            key_dict = key_dict.setdefault(subkey, {})
        key_dict[key[-1]] = key_value

131

132

def finish(self):
    """Serialise the accumulated nodes and return them as a file-like.

    The output is the signature, three option lines (number of reference
    lists, key length, number of keys), one line per node sorted by key
    of the form key\\0absent\\0references\\0value\\n, and a final empty
    line. References are written as zero-padded decimal byte offsets of
    the referenced node's line, \\r separated within a list and \\t
    separated between lists.

    :return: A StringIO holding the serialised index.
    :raises errors.BzrError: If reference lists are in use and the
        produced length differs from the pre-computed one.
    """
    lines = [_SIGNATURE]
    lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
    lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
    lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')
    prefix_length = sum(len(x) for x in lines)
    # references are byte offsets. To avoid having to do nasty
    # polynomial work to resolve offsets (references to later in the
    # file cannot be determined until all the inbetween references have
    # been calculated too) we pad the offsets with 0's to make them be
    # of consistent length. Using binary offsets would break the trivial
    # file parsing.
    # to calculate the width of zero's needed we do three passes:
    # one to gather all the non-reference data and the number of references.
    # one to pad all the data with reference-length and determine entry
    # addresses.
    # One to serialise.

    # forward sorted by key. In future we may consider topological sorting,
    # at the cost of table scans for direct lookup, or a second index for
    # direct lookup
    nodes = sorted(self._nodes.items())
    # if we do not prepass, we don't know how long it will be up front.
    expected_bytes = None
    # we only need to pre-pass if we have reference lists at all.
    if self.reference_lists:
        key_offset_info = []
        non_ref_bytes = prefix_length
        total_references = 0
        # TODO use simple multiplication for the constants in this loop.
        for key, (absent, references, value) in nodes:
            # record the offset known *so far* for this key:
            # the non reference bytes to date, and the total references to
            # date - saves reaccumulating on the second pass
            key_offset_info.append((key, non_ref_bytes, total_references))
            # key is literal, value is literal, there are 3 null's, 1 NL
            # key is variable length tuple, \x00 between elements
            non_ref_bytes += sum(len(element) for element in key)
            if self._key_length > 1:
                non_ref_bytes += self._key_length - 1
            # value is literal bytes, there are 3 null's, 1 NL.
            non_ref_bytes += len(value) + 3 + 1
            # one byte for absent if set.
            if absent:
                non_ref_bytes += 1
            else:
                # (ref_lists -1) tabs
                non_ref_bytes += self.reference_lists - 1
                # (ref-1 cr's per ref_list)
                for ref_list in references:
                    # how many references across the whole file?
                    total_references += len(ref_list)
                    # accrue reference separators
                    if ref_list:
                        non_ref_bytes += len(ref_list) - 1
        # how many digits are needed to represent the total byte count?
        digits = 1
        possible_total_bytes = non_ref_bytes + total_references*digits
        while 10 ** digits < possible_total_bytes:
            digits += 1
            possible_total_bytes = non_ref_bytes + total_references*digits
        expected_bytes = possible_total_bytes + 1 # terminating newline
        # resolve key addresses.
        key_addresses = {}
        for key, non_ref_bytes, total_references in key_offset_info:
            key_addresses[key] = non_ref_bytes + total_references*digits
        # serialise
        format_string = '%%0%sd' % digits
    for key, (absent, references, value) in nodes:
        flattened_references = []
        for ref_list in references:
            ref_addresses = []
            for reference in ref_list:
                ref_addresses.append(format_string % key_addresses[reference])
            flattened_references.append('\r'.join(ref_addresses))
        string_key = '\x00'.join(key)
        lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,
            '\t'.join(flattened_references), value))
    lines.append('\n')
    result = StringIO(''.join(lines))
    if expected_bytes and len(result.getvalue()) != expected_bytes:
        raise errors.BzrError('Failed index creation. Internal error:'
            ' mismatched output length and expected length: %d %d' %
            (len(result.getvalue()), expected_bytes))
    # getvalue() does not move the read position, so the buffer that was
    # just checked can be handed out directly instead of joining every
    # line and building a second buffer.
    return result

217

218

219

class GraphIndex(object):

220

"""An index for data with embedded graphs.

221

222

The index maps keys to a list of key reference lists, and a value.

223

Each node has the same number of key reference lists. Each key reference

224

list can be empty or an arbitrary length. The value is an opaque NULL

225

terminated string without any newlines. The storage of the index is

226

hidden in the interface: keys and key references are always tuples of

227

bytestrings, never the internal representation (e.g. dictionary offsets).

228

229

It is presumed that the index will not be mutated - it is static data.

230

231

Successive iter_all_entries calls will read the entire index each time.

232

Additionally, iter_entries calls will read the index linearly until the

233

desired keys are found. XXX: This must be fixed before the index is

234

suitable for production use. :XXX

235

"""

236

237

def __init__(self, transport, name, size):
    """Open an index called name on transport.

    Nothing is read here; every cache starts out empty or None.

    :param transport: A bzrlib.transport.Transport.
    :param name: A path to provide to transport API calls.
    :param size: The size of the index in bytes. This is used for bisection
        logic to perform partial index reads. While the size could be
        obtained by statting the file this introduced an additional round
        trip as well as requiring stat'able transports, both of which are
        avoided by having it supplied. If size is None, then bisection
        support will be disabled and accessing the index will just stream
        all the data.
    """
    # Where the index lives.
    self._transport = transport
    self._name = name
    self._size = size
    # Header-derived and fully-buffered state, filled in on demand.
    self._key_count = None
    self._keys_by_offset = None
    self._nodes_by_key = None
    # Becomes a dict of key:(value, reference-list-keys) which are ready to
    # be returned directly to callers.
    self._nodes = None
    # Becomes a dict of key:(value, reference-list-byte-locations) used by
    # the bisection interface to store parsed but not resolved keys.
    self._bisect_nodes = None
    # a sorted list of slice-addresses for the parsed bytes of the file.
    # e.g. (0,1) would mean that byte 0 is parsed.
    self._parsed_byte_map = []
    # a sorted list of keys matching each slice address for parsed bytes
    # e.g. (None, 'foo@bar') would mean that the first byte contained no
    # key, and the end byte of the slice is the end of the data for
    # 'foo@bar'
    self._parsed_key_map = []

269

270

def __eq__(self, other):
    """Equal when self and other were created with the same parameters.

    That is: both are of exactly the same type and their transport, name
    and size compare equal.
    """
    if type(self) != type(other):
        return False
    return (self._transport == other._transport
            and self._name == other._name
            and self._size == other._size)

277

278

def __ne__(self, other):
    """Return the logical negation of self.__eq__(other)."""
    equal = self.__eq__(other)
    return not equal

280

281

def _buffer_all(self):
    """Buffer all the index data.

    Reads the whole file through the transport, parses the header and
    every line, and resolves all references.

    Mutates self._nodes, self._nodes_by_key, self._keys and
    self._keys_by_offset (plus the header attributes set by _read_prefix
    and self._expected_elements).

    :raises errors.BadIndexData: If the data does not end with exactly one
        empty trailer line.
    """
    if 'index' in debug.debug_flags:
        mutter('Reading entire index %s', self._transport.abspath(self._name))
    stream = self._transport.get(self._name)
    self._read_prefix(stream)
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # ready-to-return key:value or key:value, node_ref_lists
    self._nodes = {}
    self._nodes_by_key = {}
    # offsets recorded by _parse_lines are absolute, so start counting
    # from where the header ended.
    pos = stream.tell()
    lines = stream.read().split('\n')
    # the text after the final \n is not a line.
    del lines[-1]
    _, _, _, trailers = self._parse_lines(lines, pos)
    for key, absent, references, value in self._keys_by_offset.itervalues():
        if absent:
            continue
        # resolve references:
        if self.node_ref_lists:
            node_value = (value, self._resolve_references(references))
        else:
            node_value = value
        self._nodes[key] = node_value
        if self._key_length > 1:
            key_dict = self._nodes_by_key
            if self.node_ref_lists:
                key_value = key, node_value[0], node_value[1]
            else:
                key_value = key, node_value
            # possibly should do this on-demand, but it seems likely it is
            # always wanted
            # For a key of (foo, bar, baz) create
            # _nodes_by_key[foo][bar][baz] = key_value
            for subkey in key[:-1]:
                key_dict = key_dict.setdefault(subkey, {})
            key_dict[key[-1]] = key_value
    # cache the keys for quick set intersections
    self._keys = set(self._nodes)
    if trailers != 1:
        # there must be one line - the empty trailer line.
        raise errors.BadIndexData(self)

330

331

def iter_all_entries(self):
    """Iterate over all keys within the index.

    The whole index is buffered first if that has not happened yet.

    :return: An iterable of (index, key, value) or (index, key, value, reference_lists).
        The former tuple is used when there are no reference lists in the
        index, making the API compatible with simple key:value index types.
        There is no defined order for the result iteration - it will be in
        the most efficient order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    if not self.node_ref_lists:
        # plain key:value index
        for key, value in self._nodes.iteritems():
            yield self, key, value
        return
    for key, node in self._nodes.iteritems():
        value, ref_lists = node
        yield self, key, value, ref_lists

351

352

def _read_prefix(self, stream):
    """Read and check the signature and the three option lines.

    Sets self.node_ref_lists, self._key_length and self._key_count, in
    that order, from the integer found on each option line.

    :param stream: A file-like object positioned at the start of the
        index.
    :raises errors.BadIndexFormatSignature: If the signature is wrong.
    :raises errors.BadIndexOptions: If an option line has the wrong
        prefix or a non-integer value.
    """
    expected_signature = self._signature()
    if stream.read(len(expected_signature)) != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)

    def read_option(option_prefix):
        # Consume one option line and return its integer payload; the
        # final character (the newline) is not part of the value.
        options_line = stream.readline()
        if not options_line.startswith(option_prefix):
            raise errors.BadIndexOptions(self)
        try:
            return int(options_line[len(option_prefix):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = read_option(_OPTION_NODE_REFS)
    self._key_length = read_option(_OPTION_KEY_ELEMENTS)
    self._key_count = read_option(_OPTION_LEN)

377

378

def _resolve_references(self, references):
    """Return the resolved key references for references.

    Each location is looked up in the _keys_by_offset map and replaced by
    the key stored there (the first item of the stored record); ordering
    is preserved.

    :param references: An iterable of iterables of key locations. e.g.
        [[123, 456], [123]]
    :return: A tuple of tuples of keys.
    """
    return tuple([
        tuple([self._keys_by_offset[location][0] for location in ref_list])
        for ref_list in references])

392

393

def _find_index(self, range_map, key):
    """Helper for the _parsed_*_index calls.

    Given a range map - [(start, end), ...], finds the index of the range
    in the map for key if it is in the map, and if it is not there, the
    immediately preceding range in the map (-1 when there is none).

    :param range_map: A sorted list of (start, end) tuples.
    :param key: A tuple to bisect with; its first item is compared with
        the start of the following range.
    """
    following = bisect_right(range_map, key)
    # border condition: key may sort just before a range that starts
    # exactly at key[0], in which case that range is the answer.
    if following < len(range_map) and range_map[following][0] == key[0]:
        return following
    return following - 1

406

407

def _parsed_byte_index(self, offset):
    """Return the index of the entry immediately before offset.

    e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that
    there is one unparsed byte (the 11th, addressed as[10]). then:
    asking for 0 will return 0
    asking for 10 will return 0
    asking for 11 will return 1
    asking for 12 will return 1
    """
    # (offset, 0) is the bisection probe handed to _find_index.
    return self._find_index(self._parsed_byte_map, (offset, 0))

419

420

def _parsed_key_index(self, key):
    """Return the index of the entry immediately before key.

    e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,
    meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive
    have been parsed, then:
    asking for '' will return 0
    asking for 'a' will return 0
    asking for 'b' will return 1
    asking for 'e' will return 1
    """
    # (key, None) is the bisection probe handed to _find_index.
    return self._find_index(self._parsed_key_map, (key, None))

433

434

def _is_parsed(self, offset):
    """Returns True if offset has been parsed.

    :param offset: A byte offset into the index file.
    :return: True when offset lies inside one of the (start, end) ranges
        of self._parsed_byte_map (end exclusive), False otherwise -
        including when nothing has been parsed yet.
    """
    parsed = self._parsed_byte_map
    index = self._parsed_byte_index(offset)
    if index < 0 or not parsed:
        # offset precedes every parsed range, or nothing is parsed at all;
        # indexing the map here would either fail or wrap around to the
        # last range.
        return False
    if index >= len(parsed):
        # defensive: an index past the end is judged against the last range.
        return offset < parsed[-1][1]
    start, end = parsed[index]
    return start <= offset < end

441

442

def _iter_entries_from_total_buffer(self, keys):
    """Iterate over keys when the entire index is parsed.

    :param keys: A set of keys; only those also present in self._keys
        produce a result.
    :return: An iterable of (index, key, value, reference_lists) when the
        index has reference lists, otherwise of (index, key, value).
    """
    wanted = keys.intersection(self._keys)
    if not self.node_ref_lists:
        for key in wanted:
            yield self, key, self._nodes[key]
        return
    for key in wanted:
        value, node_refs = self._nodes[key]
        yield self, key, value, node_refs

452

453

def iter_entries(self, keys):
    """Iterate over keys within the index.

    When no size was supplied the whole index is buffered on first use;
    once the index is fully buffered, answers come from memory. Otherwise
    the keys are located by bisection over the file.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys supplied. No additional keys will be returned, and every
        key supplied that is in the index will be returned.
    """
    # PERFORMANCE TODO: parse and bisect all remaining data at some
    # threshold of total-index processing/get calling layers that expect to
    # read the entire index to use the iter_all_entries method instead.
    wanted = set(keys)
    if not wanted:
        return []
    if self._size is None and self._nodes is None:
        # bisection is impossible without a size: stream everything.
        self._buffer_all()
    if self._nodes is not None:
        return self._iter_entries_from_total_buffer(wanted)
    # each bisection hit is a (location_key, entry) pair; callers only
    # want the entry.
    return (hit[1] for hit in bisect_multi_bytes(
        self._lookup_keys_via_location, self._size, wanted))

474

475

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    WARNING: Note that this method currently causes a full index parse
    unconditionally (which is reasonably appropriate as it is a means for
    thunking many small indices into one larger one and still supplies
    iter_all_entries at the thunk layer).

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned. Prefixes that match nothing produce no output.
    :raises errors.BadIndexKey: If a prefix starts with None or does not
        have the key length of this index.
    """
    keys = set(keys)
    if not keys:
        return
    # load data - also finds key lengths
    if self._nodes is None:
        self._buffer_all()
    if self._key_length == 1:
        # with one element per key a "prefix" is simply the whole key.
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            try:
                node = self._nodes[key]
            except KeyError:
                # a non-existent lookup: nothing matches, as in the
                # multi-element case below.
                continue
            if self.node_ref_lists:
                value, node_refs = node
                yield self, key, value, node_refs
            else:
                yield self, key, node
        return
    for key in keys:
        # sanity check
        if key[0] is None:
            raise errors.BadIndexKey(key)
        if len(key) != self._key_length:
            raise errors.BadIndexKey(key)
        # find what it refers to:
        key_dict = self._nodes_by_key
        elements = list(key)
        # find the subdict whose contents should be returned.
        try:
            while len(elements) and elements[0] is not None:
                key_dict = key_dict[elements[0]]
                elements.pop(0)
        except KeyError:
            # a non-existent lookup.
            continue
        if len(elements):
            # a real prefix: walk every dict below the one reached.
            dicts = [key_dict]
            while dicts:
                key_dict = dicts.pop(-1)
                # can't be empty or would not exist
                item, value = key_dict.iteritems().next()
                if type(value) == dict:
                    # push keys
                    dicts.extend(key_dict.itervalues())
                else:
                    # yield keys
                    for value in key_dict.itervalues():
                        # each value is the key:value:node refs tuple
                        # ready to yield.
                        yield (self, ) + value
        else:
            # the last thing looked up was a terminal element
            yield (self, ) + key_dict

551

552

def key_count(self):
    """Return an estimate of the number of keys in this index.

    For GraphIndex the estimate is exact. If the count is not known yet
    the whole index is buffered to obtain it.
    """
    if self._key_count is not None:
        return self._key_count
    # really this should just read the prefix
    self._buffer_all()
    return self._key_count

561

562

def _lookup_keys_via_location(self, location_keys):
    """Public interface for implementing bisection.

    If _buffer_all has been called, then all the data for the index is in
    memory, and this method should not be called, as it uses a separate
    cache because it cannot pre-resolve all indices, which buffer_all does
    for performance.

    For every (location, key) probe the result is one of:
      * an entry tuple (self, key, value) or
        (self, key, value, reference_lists) when the key was found;
      * False when the region the key would live in has been parsed and
        the key is not there;
      * -1 or +1 when the key must be before or after the parsed region
        around the probed location.

    :param location_keys: A list of location(byte offset), key tuples.
    :return: A list of (location_key, result) tuples as expected by
        bzrlib.bisect_multi.bisect_multi_bytes.
    """
    # Possible improvements:
    #  - only bisect lookup each key once
    #  - sort the keys first, and use that to reduce the bisection window
    # -----
    # this progresses in three parts:
    # read data
    # parse it
    # attempt to answer the question from the now in memory data.
    # build the readv request
    # for each location, ask for 800 bytes - much more than rows we've seen
    # anywhere.
    readv_ranges = []
    for location, key in location_keys:
        # can we answer from cache?
        if self._bisect_nodes and key in self._bisect_nodes:
            # We have the key parsed.
            continue
        index = self._parsed_key_index(key)
        if (len(self._parsed_key_map) and
            self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            # the key has been parsed, so no lookup is needed even if its
            # not present.
            continue
        # - if we have examined this part of the file already - yes
        index = self._parsed_byte_index(location)
        if (len(self._parsed_byte_map) and
            self._parsed_byte_map[index][0] <= location and
            self._parsed_byte_map[index][1] > location):
            # the byte region has been parsed, so no read is needed.
            continue
        length = 800
        # never request bytes beyond the end of the file.
        if location + length > self._size:
            length = self._size - location
        # todo, trim out parsed locations.
        if length > 0:
            readv_ranges.append((location, length))
    # read the header if needed
    if self._bisect_nodes is None:
        readv_ranges.append((0, 200))
    self._read_and_parse(readv_ranges)
    # generate results:
    #  - figure out <, >, missing, present
    #  - result present references so we can return them.
    result = []
    # keys that we cannot answer until we resolve references
    pending_references = []
    # byte offsets of referenced nodes that have not been parsed yet
    pending_locations = set()
    for location, key in location_keys:
        # can we answer from cache?
        if key in self._bisect_nodes:
            # the key has been parsed, so no lookup is needed
            if self.node_ref_lists:
                # the references may not have been all parsed.
                value, refs = self._bisect_nodes[key]
                wanted_locations = []
                for ref_list in refs:
                    for ref in ref_list:
                        if ref not in self._keys_by_offset:
                            wanted_locations.append(ref)
                if wanted_locations:
                    # defer this key until the referenced lines are read.
                    pending_locations.update(wanted_locations)
                    pending_references.append((location, key))
                    continue
                result.append(((location, key), (self, key,
                    value, self._resolve_references(refs))))
            else:
                result.append(((location, key),
                    (self, key, self._bisect_nodes[key])))
            continue
        else:
            # has the region the key should be in, been parsed?
            index = self._parsed_key_index(key)
            if (self._parsed_key_map[index][0] <= key and
                (self._parsed_key_map[index][1] >= key or
                 # end of the file has been parsed
                 self._parsed_byte_map[index][1] == self._size)):
                # parsed and not found: the key is not in the index.
                result.append(((location, key), False))
                continue
        # no, is the key above or below the probed location:
        # get the range of the probed & parsed location
        index = self._parsed_byte_index(location)
        # if the key is below the start of the range, its below
        if key < self._parsed_key_map[index][0]:
            direction = -1
        else:
            direction = +1
        result.append(((location, key), direction))
    readv_ranges = []
    # lookup data to resolve references
    for location in pending_locations:
        length = 800
        if location + length > self._size:
            length = self._size - location
        # TODO: trim out parsed locations (e.g. if the 800 is into the
        # parsed region trim it, and dont use the adjust_for_latency
        # facility)
        if length > 0:
            readv_ranges.append((location, length))
    self._read_and_parse(readv_ranges)
    for location, key in pending_references:
        # answer key references we had to look-up-late.
        # NOTE(review): index is computed here but never used.
        index = self._parsed_key_index(key)
        value, refs = self._bisect_nodes[key]
        result.append(((location, key), (self, key,
            value, self._resolve_references(refs))))
    return result

683

684

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    Checks the signature, reads the three option lines into
    self.node_ref_lists, self._key_length and self._key_count, records
    the header as parsed and initialises the bisection parsing state.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data. (which may be of length 0).
    :raises errors.BadIndexFormatSignature: If the signature is wrong.
    :raises errors.BadIndexOptions: If an option line has the wrong
        prefix or a non-integer value.
    """
    expected_signature = self._signature()
    signature = bytes[0:len(expected_signature)]
    if signature != expected_signature:
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(expected_signature):].splitlines()

    def option_value(line_number, option_prefix):
        # Return the integer that follows option_prefix on the given line.
        options_line = lines[line_number]
        if not options_line.startswith(option_prefix):
            raise errors.BadIndexOptions(self)
        try:
            return int(options_line[len(option_prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = option_value(0, _OPTION_NODE_REFS)
    self._key_length = option_value(1, _OPTION_KEY_ELEMENTS)
    self._key_count = option_value(2, _OPTION_LEN)
    # calculate the bytes we have processed: the signature, the three
    # option lines and the newline that ended each of them.
    header_end = len(signature) + sum(len(line) for line in lines[:3]) + 3
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

727

728

def _parse_region(self, offset, data):
    """Parse node data returned from a readv operation.

    The data is handed to _parse_segment one segment at a time until
    either a segment reports that it was the last one, or the data ends
    before the end of the parsed range found for the current position.

    :param offset: The byte offset the data starts at.
    :param data: The data to parse.
    """
    data_end = offset + len(data)
    resume_at = offset
    finished = False
    while not finished:
        region = self._parsed_byte_index(resume_at)
        # Trivial test - if the data ends within the low-matching parsed
        # range, there is nothing left to do.
        if data_end < self._parsed_byte_map[region][1]:
            break
        resume_at, finished = self._parse_segment(
            offset, data, data_end, region)

750

751

def _parse_segment(self, offset, data, end, index):
    """Parse one segment of data.

    The part of data that is already covered by the parsed region at
    index (and by the following parsed region, if data reaches into it) is
    trimmed away. Where the remaining data does not abut parsed data or
    the end of the file, it is further trimmed to whole lines. What is
    left is parsed and recorded as parsed.

    :param offset: Where 'data' begins in the file.
    :param data: Some data to parse a segment of.
    :param end: Where data ends
    :param index: The current index into the parsed bytes map.
    :return: high_parsed_byte, last_segment.
        high_parsed_byte is the location of the highest parsed byte in this
        segment, last_segment is True if the parsed segment is the last
        possible one in the data block.
    """
    # default is to use all data
    trim_end = None
    # accommodate overlap with data before this.
    if offset < self._parsed_byte_map[index][1]:
        # overlaps the lower parsed region
        # skip the parsed data
        trim_start = self._parsed_byte_map[index][1] - offset
        # don't trim the start for \n
        start_adjacent = True
    elif offset == self._parsed_byte_map[index][1]:
        # abuts the lower parsed region
        # use all data
        trim_start = None
        # do not trim anything
        start_adjacent = True
    else:
        # does not overlap the lower parsed region
        # use all data
        trim_start = None
        # but trim the leading \n
        start_adjacent = False
    if end == self._size:
        # lines up to the end of all data:
        # use it all
        trim_end = None
        # do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif index + 1 == len(self._parsed_byte_map):
        # at the end of the parsed data
        # use it all
        trim_end = None
        # but strip to the last \n
        end_adjacent = False
        last_segment = True
    elif end == self._parsed_byte_map[index + 1][0]:
        # butts up against the next parsed region
        # use it all
        trim_end = None
        # do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif end > self._parsed_byte_map[index + 1][0]:
        # overlaps into the next parsed region
        # only consider the unparsed data
        trim_end = self._parsed_byte_map[index + 1][0] - offset
        # do not strip to the last \n as we know its an entire record
        end_adjacent = True
        # more data may remain beyond the next parsed region.
        last_segment = end < self._parsed_byte_map[index + 1][1]
    else:
        # does not overlap into the next region
        # use it all
        trim_end = None
        # but strip to the last \n
        end_adjacent = False
        last_segment = True
    # now find bytes to discard if needed
    if not start_adjacent:
        # the data starts mid-line: skip to just after the first \n.
        # work around python bug in rfind
        if trim_start is None:
            trim_start = data.find('\n') + 1
        else:
            trim_start = data.find('\n', trim_start) + 1
        assert trim_start != 0, 'no \n was present'
    if not end_adjacent:
        # the data may end mid-line: keep up to and including the last \n.
        # work around python bug in rfind
        if trim_end is None:
            trim_end = data.rfind('\n') + 1
        else:
            trim_end = data.rfind('\n', None, trim_end) + 1
        assert trim_end != 0, 'no \n was present'
    # adjust offset and data to the parseable data.
    trimmed_data = data[trim_start:trim_end]
    assert trimmed_data, 'read unneeded data [%d:%d] from [%d:%d]' % (
        trim_start, trim_end, offset, offset + len(data))
    if trim_start:
        offset += trim_start
    # splitlines mangles the \r delimiters.. don't use it.
    lines = trimmed_data.split('\n')
    # the text after the final \n is not a line.
    del lines[-1]
    pos = offset
    first_key, last_key, nodes, _ = self._parse_lines(lines, pos)
    for key, value in nodes:
        self._bisect_nodes[key] = value
    self._parsed_bytes(offset, first_key,
        offset + len(trimmed_data), last_key)
    return offset + len(trimmed_data), last_segment

855

856

def _parse_lines(self, lines, pos):
    """Parse node lines, recording each one in self._keys_by_offset.

    Every non-empty line is split on \\0 into the key elements followed by
    the absent marker, the references and the value. References are \\t
    separated lists of \\r separated integers. An empty line is counted as
    a trailer.

    :param lines: The lines to parse, without their trailing newline.
    :param pos: The byte offset of the first line in the file.
    :return: first_key, last_key, nodes, trailers. nodes is a list of
        (key, value) or (key, (value, reference_lists)) for the lines that
        are not marked absent; trailers is the number of empty lines seen.
    :raises errors.BadIndexData: If a line does not have
        self._expected_elements elements.
    """
    first_key = None
    last_key = None
    trailer_count = 0
    parsed_nodes = []
    for line in lines:
        if line == '':
            # must be at the end
            if self._size:
                assert self._size == pos + 1, "%s %s" % (self._size, pos)
            trailer_count += 1
            continue
        fields = line.split('\0')
        if len(fields) != self._expected_elements:
            raise errors.BadIndexData(self)
        # keys are tuples
        last_key = tuple(fields[:self._key_length])
        if first_key is None:
            first_key = last_key
        absent, references, value = fields[-3:]
        ref_lists = tuple([
            tuple([int(ref) for ref in ref_string.split('\r') if ref])
            for ref_string in references.split('\t')])
        self._keys_by_offset[pos] = (last_key, absent, ref_lists, value)
        pos += len(line) + 1 # +1 for the \n
        if absent:
            # absent nodes are known by offset only.
            continue
        if self.node_ref_lists:
            parsed_nodes.append((last_key, (value, ref_lists)))
        else:
            parsed_nodes.append((last_key, value))
    return first_key, last_key, parsed_nodes, trailer_count

893

894

def _parsed_bytes(self, start, start_key, end, end_key):
    """Mark the bytes from start to end as parsed.

    Calling self._parsed_bytes(1, k1, 2, k2) will mark one byte (the one
    at offset 1) as parsed. self._parsed_byte_map and
    self._parsed_key_map are updated in step, merging the new range with
    any existing range it abuts.

    :param start: The start of the parsed region.
    :param start_key: The first key found in the region (or None).
    :param end: The end of the parsed region.
    :param end_key: The last key found in the region (or None).
    """
    index = self._parsed_byte_index(start)
    new_value = (start, end)
    new_key = (start_key, end_key)
    if index == -1:
        # No existing range precedes start, so the new range belongs at
        # the front. (list.insert(-1, ...) would only be right for an
        # empty list: on a populated one it inserts before the *last*
        # item and breaks the sort order.)
        if self._parsed_byte_map and self._parsed_byte_map[0][0] == end:
            # abuts the first existing range: extend it downwards
            self._parsed_byte_map[0] = (
                start, self._parsed_byte_map[0][1])
            self._parsed_key_map[0] = (
                start_key, self._parsed_key_map[0][1])
        else:
            self._parsed_byte_map.insert(0, new_value)
            self._parsed_key_map.insert(0, new_key)
        return
    # four cases:
    # new region
    # extend lower region
    # extend higher region
    # combine two regions
    if (index + 1 < len(self._parsed_byte_map) and
        self._parsed_byte_map[index][1] == start and
        self._parsed_byte_map[index + 1][0] == end):
        # combine two regions
        self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],
            self._parsed_byte_map[index + 1][1])
        self._parsed_key_map[index] = (self._parsed_key_map[index][0],
            self._parsed_key_map[index + 1][1])
        del self._parsed_byte_map[index + 1]
        del self._parsed_key_map[index + 1]
    elif self._parsed_byte_map[index][1] == start:
        # extend the lower entry
        self._parsed_byte_map[index] = (
            self._parsed_byte_map[index][0], end)
        self._parsed_key_map[index] = (
            self._parsed_key_map[index][0], end_key)
    elif (index + 1 < len(self._parsed_byte_map) and
        self._parsed_byte_map[index + 1][0] == end):
        # extend the higher entry
        self._parsed_byte_map[index + 1] = (
            start, self._parsed_byte_map[index + 1][1])
        self._parsed_key_map[index + 1] = (
            start_key, self._parsed_key_map[index + 1][1])
    else:
        # new entry
        self._parsed_byte_map.insert(index + 1, new_value)
        self._parsed_key_map.insert(index + 1, new_key)

943

944

def _read_and_parse(self, readv_ranges):
    """Read the requested ranges and parse the data that comes back.

    Nothing is read when readv_ranges is empty.

    :param readv_ranges: A prepared readv range list.
    """
    if not readv_ranges:
        return
    chunks = self._transport.readv(self._name, readv_ranges, True,
        self._size)
    for offset, data in chunks:
        if self._bisect_nodes is None:
            # Nothing has been parsed yet, so this chunk must be the start
            # of the file: consume the header before parsing the region.
            assert offset == 0
            offset, data = self._parse_header_from_bytes(data)
        self._parse_region(offset, data)

960

961

def _signature(self):
    """Return the file signature used by this index type."""
    signature = _SIGNATURE
    return signature

964

965

def validate(self):
    """Validate that everything in the index can be accessed.

    Validation is done by walking every entry: iter_all_entries validates
    completely at the moment, so draining it is sufficient.
    """
    entries = self.iter_all_entries()
    for _entry in entries:
        # The entries themselves are not needed, only the traversal.
        continue

970

971

972

class CombinedGraphIndex(object):
    """A GraphIndex made up from smaller GraphIndices.

    The backing indices must implement GraphIndex, and are presumed to be
    static data.

    Queries against the combined index are made against the first index,
    then the second and so on, so the order of the indices can influence
    performance significantly. For example, if one index is on local disk
    and a second on a remote server, the local disk index should come
    before the other in the index list.
    """

    def __init__(self, indices):
        """Create a CombinedGraphIndex backed by indices.

        :param indices: An ordered list of indices to query for data. The
            list object itself is kept, not copied.
        """
        self._indices = indices

    def __repr__(self):
        child_reprs = [repr(child) for child in self._indices]
        return "%s(%s)" % (self.__class__.__name__, ', '.join(child_reprs))

    def insert_index(self, pos, index):
        """Insert a new index in the list of indices to query.

        :param pos: The position to insert the index.
        :param index: The index to insert.
        """
        self._indices.insert(pos, index)

    def iter_all_entries(self):
        """Iterate over all keys within the index.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once (the first child wins).

        :return: An iterable of the nodes produced by the child indices;
            element 1 of each node is its key. There is no defined order
            for the result iteration - it will be in the most efficient
            order for the index.
        """
        reported = set()
        for child in self._indices:
            for node in child.iter_all_entries():
                key = node[1]
                if key in reported:
                    continue
                yield node
                reported.add(key)

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of the nodes produced by the child indices;
            element 1 of each node is its key. There is no defined order
            for the result iteration - it will be in the most efficient
            order for the index.
        """
        remaining = set(keys)
        for child in self._indices:
            if not remaining:
                # Every requested key has been found already.
                break
            for node in child.iter_entries(remaining):
                # Found keys are dropped so later children are not asked
                # for them again.
                remaining.remove(node[1])
                yield node

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None)
        then only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key,
            but with the last N elements 'None' rather than a regular
            bytestring. The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional
            keys will be returned, and every match that is in the index
            will be returned.
        """
        prefixes = set(keys)
        if not prefixes:
            return
        reported = set()
        for child in self._indices:
            for node in child.iter_entries_prefix(prefixes):
                if node[1] not in reported:
                    reported.add(node[1])
                    yield node

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For CombinedGraphIndex this is approximated by the sum of the keys
        of the child indices. As child indices may have duplicate keys this
        can have a maximum error of the number of child indices * largest
        number of keys in any index.
        """
        total = 0
        for child in self._indices:
            total += child.key_count()
        return total

    def validate(self):
        """Validate that everything in the index can be accessed."""
        for child in self._indices:
            child.validate()

1086

1087

1088

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during
    a single write operation, where the accumulated entries need to be
    immediately available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add
            when this index has reference lists, otherwise an iterable of
            (key, value) entries.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index.

        :return: An iterable of (index, key, value, reference_lists) when
            this index has reference lists, otherwise of (index, key,
            value). Entries flagged absent are skipped. There is no defined
            order for the result iteration - it will be in the most
            efficient order for the index (in this case dictionary hash
            order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        with_references = self.reference_lists
        for key, (absent, references, value) in self._nodes.iteritems():
            if absent:
                continue
            if with_references:
                yield self, key, value, references
            else:
                yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists) when
            this index has reference lists, otherwise of (index, key,
            value). There is no defined order for the result iteration - it
            will be in the most efficient order for the index (keys
            iteration order in this case).
        """
        keys = set(keys)
        with_references = self.reference_lists
        for key in keys.intersection(self._keys):
            # Each stored node is (absent, references, value).
            node = self._nodes[key]
            if node[0]:
                continue
            if with_references:
                yield self, key, node[2], node[1]
            else:
                yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None)
        then only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key,
            but with the last N elements 'None' rather than a regular
            bytestring. The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional
            keys will be returned, and every match that is in the index
            will be returned. Prefixes that match nothing yield nothing.
        :raises errors.BadIndexKey: If a prefix starts with None or does
            not have the key length of this index.
        """
        # XXX: Too much duplication with the GraphIndex class; consider
        # finding a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            if self._key_length == 1:
                # With one-element keys a prefix is a complete key, so this
                # is a plain lookup. A key that is not in the index is
                # skipped, matching the multi-element branch below, rather
                # than escaping as a KeyError.
                node = self._nodes.get(key)
                if node is None or node[0]:
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
                continue
            # find what it refers to:
            key_dict = self._nodes_by_key
            elements = list(key)
            # find the subdict to return
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                # Trailing None elements remain: walk everything stored
                # beneath the matched prefix.
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    sample = key_dict.itervalues().next()
                    if isinstance(sample, dict):
                        # push keys
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield keys
                        for stored in key_dict.itervalues():
                            yield (self, ) + stored
            else:
                # The prefix was a complete key; key_dict is now the stored
                # entry itself.
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory indices have no known corruption at the moment."""

1226

1227

1228

class GraphIndexPrefixAdapter(object):
    """An adapter between GraphIndex with different key lengths.

    Queries against this will emit queries against the adapted Graph with
    the prefix added, queries for all items use iter_entries_prefix. The
    returned nodes will have their keys and node references adjusted to
    remove the prefix. Finally, an add_nodes_callback can be supplied - when
    called the nodes and references being added will have prefix prepended.
    """

    def __init__(self, adapted, prefix, missing_key_length,
        add_nodes_callback=None):
        """Construct an adapter against adapted with prefix.

        :param adapted: The index that queries are forwarded to.
        :param prefix: The key tuple prepended to every key and reference.
        :param missing_key_length: How many None elements to append to
            prefix to build the prefix query used by iter_all_entries.
        :param add_nodes_callback: Optional callable that receives the list
            of prefixed nodes built by add_nodes.
        """
        self.adapted = adapted
        self.prefix = prefix
        self.prefix_len = len(prefix)
        self.prefix_key = prefix + (None,) * missing_key_length
        self.add_nodes_callback = add_nodes_callback

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add,
            or of (key, value) entries when there are no reference lists.
        """
        # Materialise nodes in case it is an iterator: it may be walked
        # twice below.
        nodes = tuple(nodes)
        prefix = self.prefix
        translated = []
        try:
            # node_refs is a tuple of tuples of keys, so take it apart and
            # prepend the prefix to every referenced key.
            for key, value, node_refs in nodes:
                prefixed_refs = tuple(
                    tuple(prefix + ref_node for ref_node in ref_list)
                    for ref_list in node_refs)
                translated.append((prefix + key, value, prefixed_refs))
        except ValueError:
            # XXX: TODO add an explicit interface for getting the reference
            # list status, to handle this bit of user-friendliness in the
            # API more explicitly.
            # The unpack failed, so treat the nodes as (key, value) pairs.
            for key, value in nodes:
                translated.append((prefix + key, value))
        self.add_nodes_callback(translated)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        """
        single_node = (key, value, references)
        self.add_nodes((single_node, ))

    def _strip_prefix(self, an_iter):
        """Strip prefix data from nodes and return it.

        :param an_iter: An iterable of nodes whose element 1 is the key and
            whose element 3 holds the reference lists.
        :return: An iterable of nodes with the prefix removed from the key
            and from every referenced key; elements 0 and 2 pass through.
        :raises errors.BadIndexData: If a key or a referenced key does not
            start with the prefix.
        """
        prefix = self.prefix
        strip = self.prefix_len
        for node in an_iter:
            key = node[1]
            # cross checks
            if key[:strip] != prefix:
                raise errors.BadIndexData(self)
            stripped_refs = []
            for ref_list in node[3]:
                stripped_list = []
                for ref_node in ref_list:
                    if ref_node[:strip] != prefix:
                        raise errors.BadIndexData(self)
                    stripped_list.append(ref_node[strip:])
                stripped_refs.append(tuple(stripped_list))
            yield node[0], key[strip:], node[2], tuple(stripped_refs)

    def iter_all_entries(self):
        """Iterate over all keys within the index.

        iter_all_entries is implemented against the adapted index using
        iter_entries_prefix.

        :return: An iterable of nodes as produced by _strip_prefix. There
            is no defined order for the result iteration - it follows the
            order used by the adapted index.
        """
        everything = self.adapted.iter_entries_prefix([self.prefix_key])
        return self._strip_prefix(everything)

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of nodes as produced by _strip_prefix. There
            is no defined order for the result iteration - it follows the
            order used by the adapted index.
        """
        prefixed = (self.prefix + key for key in keys)
        return self._strip_prefix(self.adapted.iter_entries(prefixed))

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None)
        then only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key,
            but with the last N elements 'None' rather than a regular
            bytestring. The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional
            keys will be returned, and every match that is in the index
            will be returned.
        """
        prefixed = (self.prefix + key for key in keys)
        return self._strip_prefix(self.adapted.iter_entries_prefix(prefixed))

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndexPrefixAdapter this is relatively expensive - key
        iteration with the prefix is done.
        """
        count = 0
        for _node in self.iter_all_entries():
            count += 1
        return count

    def validate(self):
        """Call the adapted's validate."""
        self.adapted.validate()

Older »