~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Robert Collins
Date: 2005-09-28 05:25:54 UTC
mfrom: (1185.1.42)
mto: (1092.2.18)
mto: This revision was merged to the branch mainline in revision 1397.
Revision ID: robertc@robertcollins.net-20050928052554-beb985505f77ea6a

update symlink branch to integration

files added:
build-api

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/selftest/testremotebranch.py

bzrlib/upgrade.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

testbzr

testsweet.py

files removed:
BRANCH.TODO

COPYING.txt

INSTALL

bzr.ico

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/cmd_version_info.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/email_message.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test__generate_text_key_index.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_find_text_key_references.py

bzrlib/tests/repository_implementations/test_get_parent_map.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_is_write_locked.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave_commands.py

bzrlib/win32utils.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

contrib/bzr_access

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/revnos.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

generate_docs.py

man1

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/package_mf.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

tools/win32/survey.txt

files renamed:
doc/developers/HACKING.txt => HACKING

tools/doc_generate/autodoc_man.py => bzr-man.py

bzrlib/bundle/__init__.py => bzrlib/changeset.py

bzrlib/deprecated_graph.py => bzrlib/graph.py

contrib/newinventory.py => bzrlib/newinventory.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/http_utils.py => bzrlib/selftest/HTTPTestUtil.py

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/branch_implementations/test_parent.py => bzrlib/selftest/test_parent.py

bzrlib/tests/blackbox/test_revision_info.py => bzrlib/selftest/test_revision_info.py

bzrlib/tests/branch_implementations/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_fetch.py => bzrlib/selftest/testfetch.py

bzrlib/tests/test_deprecated_graph.py => bzrlib/selftest/testgraph.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge.py => bzrlib/selftest/testmerge.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionspec.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/blackbox/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/test_store.py => bzrlib/selftest/teststore.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/__init__.py => bzrlib/store.py

bzrlib/ui/__init__.py => bzrlib/ui.py

bzrlib/xml_serializer.py => bzrlib/xml.py

bzrlib/upgrade.py => tools/history2weaves.py

bzrlib/tests/test_weave.py => tools/testweave.py

doc/en/tutorials/tutorial.txt => tutorial.txt

files modified:
.bzrignore

.rsyncexclude

Makefile

NEWS

README

TODO

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_xml.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib/bash/bzr.simple

contrib/pwk

contrib/zsh/_bzr

setup.py *

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

# Names exported by a star-import of this module.
__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

symbol_versioning,

)

# readv request, as an (offset, length) pair, used to fetch the index header.
_HEADER_READV = (0, 200)
# Prefixes of the three option lines that follow the signature line.
_OPTION_KEY_ELEMENTS = "key_elements="
_OPTION_LEN = "len="
_OPTION_NODE_REFS = "node_ref_lists="
# First line of every serialised index.
_SIGNATURE = "Bazaar Graph Index 1\n"
# Characters that may not appear in a key element (used by _check_key).
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')
# Characters that may not appear in a node value (used by add_node).
_newline_null_re = re.compile('[\n\0]')

class GraphIndexBuilder(object):
    """A builder that can build a GraphIndex.

    The resulting graph has the structure:

    _SIGNATURE OPTIONS NODES NEWLINE
    _SIGNATURE     := 'Bazaar Graph Index 1' NEWLINE
    OPTIONS        := 'node_ref_lists=' DIGITS NEWLINE
                      'key_elements=' DIGITS NEWLINE
                      'len=' DIGITS NEWLINE
    NODES          := NODE*
    NODE           := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE
    KEY            := KEY_ELEMENT (NULL KEY_ELEMENT){key_elements - 1}
    KEY_ELEMENT    := Not-whitespace-utf8
    ABSENT         := 'a'
    REFERENCES     := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}
    REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?
    REFERENCE      := DIGITS  ; digits is the byte offset in the index of the
                              ; referenced key.
    VALUE          := no-newline-no-null-bytes
    """

    def __init__(self, reference_lists=0, key_elements=1):
        """Create a GraphIndex builder.

        :param reference_lists: The number of node references lists for each
            entry.
        :param key_elements: The number of bytestrings in each key.
        """
        self.reference_lists = reference_lists
        # keys explicitly added with add_node (absent placeholders excluded).
        self._keys = set()
        # key -> (absent marker, reference lists, value); also holds 'absent'
        # placeholders for keys that were referenced but never added.
        self._nodes = {}
        # nested dicts keyed by successive key elements; only maintained when
        # keys have more than one element.
        self._nodes_by_key = {}
        self._key_length = key_elements

    def _check_key(self, key):
        """Raise BadIndexKey if key is not a valid key for this index."""
        if type(key) is not tuple:
            raise errors.BadIndexKey(key)
        if self._key_length != len(key):
            raise errors.BadIndexKey(key)
        for element in key:
            if not element or _whitespace_re.search(element) is not None:
                raise errors.BadIndexKey(element)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        :raises BadIndexKey: if key, or any referenced key, is invalid.
        :raises BadIndexValue: if value contains a forbidden byte, or the
            number of reference lists differs from self.reference_lists.
        :raises BadIndexDuplicateKey: if key has already been added.
        """
        self._check_key(key)
        if _newline_null_re.search(value) is not None:
            raise errors.BadIndexValue(value)
        if len(references) != self.reference_lists:
            raise errors.BadIndexValue(references)
        node_refs = []
        for reference_list in references:
            # Materialise first: the list is walked here and then stored, so
            # a one-shot iterator would otherwise be recorded as empty.
            reference_list = tuple(reference_list)
            for reference in reference_list:
                self._check_key(reference)
                if reference not in self._nodes:
                    # placeholder so the reference can be given an address.
                    self._nodes[reference] = ('a', (), '')
            node_refs.append(reference_list)
        node_refs = tuple(node_refs)
        # An 'absent' placeholder may be replaced; a real node may not.
        if key in self._nodes and self._nodes[key][0] == '':
            raise errors.BadIndexDuplicateKey(key, self)
        self._nodes[key] = ('', node_refs, value)
        self._keys.add(key)
        if self._key_length > 1:
            key_dict = self._nodes_by_key
            if self.reference_lists:
                key_value = key, value, node_refs
            else:
                key_value = key, value
            # possibly should do this on-demand, but it seems likely it is
            # always wanted
            # For a key of (foo, bar, baz) create
            # _nodes_by_key[foo][bar][baz] = key_value
            for subkey in key[:-1]:
                key_dict = key_dict.setdefault(subkey, {})
            key_dict[key[-1]] = key_value

    def finish(self):
        """Serialise the index.

        :return: A StringIO containing the complete serialised index.
        :raises BzrError: if the serialised length differs from the length
            predicted while computing the reference offsets.
        """
        lines = [_SIGNATURE]
        lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')
        lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')
        lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')
        prefix_length = sum(len(x) for x in lines)
        # references are byte offsets. To avoid having to do nasty
        # polynomial work to resolve offsets (references to later in the
        # file cannot be determined until all the inbetween references have
        # been calculated too) we pad the offsets with 0's to make them be
        # of consistent length. Using binary offsets would break the trivial
        # file parsing.
        # to calculate the width of zero's needed we do three passes:
        # one to gather all the non-reference data and the number of references.
        # one to pad all the data with reference-length and determine entry
        # addresses.
        # One to serialise.

        # forward sorted by key. In future we may consider topological sorting,
        # at the cost of table scans for direct lookup, or a second index for
        # direct lookup
        nodes = sorted(self._nodes.items())
        # if we do not prepass, we don't know how long it will be up front.
        expected_bytes = None
        # we only need to pre-pass if we have reference lists at all.
        if self.reference_lists:
            key_offset_info = []
            non_ref_bytes = prefix_length
            total_references = 0
            # TODO use simple multiplication for the constants in this loop.
            for key, (absent, references, value) in nodes:
                # record the offset known *so far* for this key:
                # the non reference bytes to date, and the total references to
                # date - saves reaccumulating on the second pass
                key_offset_info.append((key, non_ref_bytes, total_references))
                # key is variable length tuple, \x00 between elements
                non_ref_bytes += sum(len(element) for element in key)
                if self._key_length > 1:
                    non_ref_bytes += self._key_length - 1
                # value is literal bytes, there are 3 null's, 1 NL.
                non_ref_bytes += len(value) + 3 + 1
                # one byte for absent if set.
                if absent:
                    non_ref_bytes += 1
                else:
                    # (ref_lists -1) tabs
                    non_ref_bytes += self.reference_lists - 1
                    # (ref-1 cr's per ref_list)
                    for ref_list in references:
                        # how many references across the whole file?
                        total_references += len(ref_list)
                        # accrue reference separators
                        if ref_list:
                            non_ref_bytes += len(ref_list) - 1
            # how many digits are needed to represent the total byte count?
            digits = 1
            possible_total_bytes = non_ref_bytes + total_references*digits
            while 10 ** digits < possible_total_bytes:
                digits += 1
                possible_total_bytes = non_ref_bytes + total_references*digits
            expected_bytes = possible_total_bytes + 1 # terminating newline
            # resolve key addresses.
            key_addresses = {}
            for key, non_ref_bytes, total_references in key_offset_info:
                key_addresses[key] = non_ref_bytes + total_references*digits
            # serialise
            format_string = '%%0%sd' % digits
        for key, (absent, references, value) in nodes:
            flattened_references = []
            for ref_list in references:
                ref_addresses = []
                for reference in ref_list:
                    ref_addresses.append(format_string % key_addresses[reference])
                flattened_references.append('\r'.join(ref_addresses))
            string_key = '\x00'.join(key)
            lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,
                '\t'.join(flattened_references), value))
        lines.append('\n')
        # Join once and reuse it for both the length check and the result.
        serialised = ''.join(lines)
        if expected_bytes and len(serialised) != expected_bytes:
            raise errors.BzrError('Failed index creation. Internal error:'
                ' mismatched output length and expected length: %d %d' %
                (len(serialised), expected_bytes))
        return StringIO(serialised)

223

224

225

class GraphIndex(object):

226

"""An index for data with embedded graphs.

227

228

The index maps keys to a list of key reference lists, and a value.

229

Each node has the same number of key reference lists. Each key reference

230

list can be empty or an arbitrary length. The value is an opaque NULL

231

terminated string without any newlines. The storage of the index is

232

hidden in the interface: keys and key references are always tuples of

233

bytestrings, never the internal representation (e.g. dictionary offsets).

234

235

It is presumed that the index will not be mutated - it is static data.

236

237

Successive iter_all_entries calls will read the entire index each time.

238

Additionally, iter_entries calls will read the index linearly until the

239

desired keys are found. XXX: This must be fixed before the index is

240

suitable for production use. :XXX

241

"""

242

243

def __init__(self, transport, name, size):

244

"""Open an index called name on transport.

245

246

:param transport: A bzrlib.transport.Transport.

247

:param name: A path to provide to transport API calls.

248

:param size: The size of the index in bytes. This is used for bisection

249

logic to perform partial index reads. While the size could be

250

obtained by statting the file this introduced an additional round

251

trip as well as requiring stat'able transports, both of which are

252

avoided by having it supplied. If size is None, then bisection

253

support will be disabled and accessing the index will just stream

254

all the data.

255

"""

256

self._transport = transport

257

self._name = name

258

# Becomes a dict of key:(value, reference-list-byte-locations) used by

259

# the bisection interface to store parsed but not resolved keys.

260

self._bisect_nodes = None

261

# Becomes a dict of key:(value, reference-list-keys) which are ready to

262

# be returned directly to callers.

263

self._nodes = None

264

# a sorted list of slice-addresses for the parsed bytes of the file.

265

# e.g. (0,1) would mean that byte 0 is parsed.

266

self._parsed_byte_map = []

267

# a sorted list of keys matching each slice address for parsed bytes

268

# e.g. (None, 'foo@bar') would mean that the first byte contained no

269

# key, and the end byte of the slice is the of the data for 'foo@bar'

270

self._parsed_key_map = []

271

self._key_count = None

272

self._keys_by_offset = None

273

self._nodes_by_key = None

274

self._size = size

275

276

def __eq__(self, other):

277

"""Equal when self and other were created with the same parameters."""

278

return (

279

type(self) == type(other) and

280

self._transport == other._transport and

281

self._name == other._name and

282

self._size == other._size)

283

284

def __ne__(self, other):

285

return not self.__eq__(other)

286

287

def _buffer_all(self):
    """Buffer all the index data.

    Reads the whole file from the transport, parses every line and resolves
    all references to keys.

    Mutates self._keys_by_offset, self._nodes, self._nodes_by_key and
    self._keys (and, via _read_prefix, the header-derived attributes).

    :raises BadIndexData: if the data does not end with exactly one empty
        trailer line. Note that the attributes above have already been
        populated when this is raised.
    """
    if 'index' in debug.debug_flags:
        mutter('Reading entire index %s', self._transport.abspath(self._name))
    stream = self._transport.get(self._name)
    self._read_prefix(stream)
    # a node line is the key elements followed by absent, references, value.
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # ready-to-return key:value or key:value, node_ref_lists
    self._nodes = {}
    self._nodes_by_key = {}
    pos = stream.tell()
    lines = stream.read().split('\n')
    # split leaves an empty string after the final newline; drop it.
    del lines[-1]
    _, _, _, trailers = self._parse_lines(lines, pos)
    for key, absent, references, value in self._keys_by_offset.itervalues():
        if absent:
            continue
        # resolve references:
        if self.node_ref_lists:
            node_value = (value, self._resolve_references(references))
        else:
            node_value = value
        self._nodes[key] = node_value
        if self._key_length > 1:
            key_dict = self._nodes_by_key
            if self.node_ref_lists:
                key_value = key, node_value[0], node_value[1]
            else:
                key_value = key, node_value
            # possibly should do this on-demand, but it seems likely it is
            # always wanted
            # For a key of (foo, bar, baz) create
            # _nodes_by_key[foo][bar][baz] = key_value
            for subkey in key[:-1]:
                key_dict = key_dict.setdefault(subkey, {})
            key_dict[key[-1]] = key_value
    # cache the keys for quick set intersections
    self._keys = set(self._nodes)
    if trailers != 1:
        # there must be one line - the empty trailer line.
        raise errors.BadIndexData(self)

336

337

def iter_all_entries(self):
    """Iterate over every entry in the index.

    The whole index is buffered first if that has not already happened.

    :return: An iterable of (index, key, value) or
        (index, key, value, reference_lists). The three-element form is
        used when the index has no reference lists, making the API
        compatible with simple key:value index types. Iteration order is
        undefined - it is whatever is most efficient for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    if not self.node_ref_lists:
        # plain key:value index.
        for key, value in self._nodes.iteritems():
            yield self, key, value
        return
    for key, node in self._nodes.iteritems():
        value, reference_lists = node
        yield self, key, value, reference_lists

357

358

def _read_prefix(self, stream):
    """Read and validate the signature and option lines from stream.

    Sets self.node_ref_lists, self._key_length and self._key_count from the
    three option lines, in that order.

    :param stream: A file-like object positioned at the start of the index.
    :raises BadIndexFormatSignature: if the signature does not match.
    :raises BadIndexOptions: if an option line has the wrong prefix or a
        non-integer value.
    """
    signature = stream.read(len(self._signature()))
    if signature != self._signature():
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    # (option line prefix, attribute that receives the parsed integer)
    expected_options = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    for prefix, attribute in expected_options:
        options_line = stream.readline()
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            # the slice drops the prefix and the trailing newline.
            parsed = int(options_line[len(prefix):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed)

383

384

def _resolve_references(self, references):

385

"""Return the resolved key references for references.

386

387

References are resolved by looking up the location of the key in the

388

_keys_by_offset map and substituting the key name, preserving ordering.

389

390

:param references: An iterable of iterables of key locations. e.g.

391

[[123, 456], [123]]

392

:return: A tuple of tuples of keys.

393

"""

394

node_refs = []

395

for ref_list in references:

396

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

397

return tuple(node_refs)

398

399

def _find_index(self, range_map, key):

400

"""Helper for the _parsed_*_index calls.

401

402

Given a range map - [(start, end), ...], finds the index of the range

403

in the map for key if it is in the map, and if it is not there, the

404

immediately preceeding range in the map.

405

"""

406

result = bisect_right(range_map, key) - 1

407

if result + 1 < len(range_map):

408

# check the border condition, it may be in result + 1

409

if range_map[result + 1][0] == key[0]:

410

return result + 1

411

return result

412

413

def _parsed_byte_index(self, offset):

414

"""Return the index of the entry immediately before offset.

415

416

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

417

there is one unparsed byte (the 11th, addressed as[10]). then:

418

asking for 0 will return 0

419

asking for 10 will return 0

420

asking for 11 will return 1

421

asking for 12 will return 1

422

"""

423

key = (offset, 0)

424

return self._find_index(self._parsed_byte_map, key)

425

426

def _parsed_key_index(self, key):

427

"""Return the index of the entry immediately before key.

428

429

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

430

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

431

have been parsed, then:

432

asking for '' will return 0

433

asking for 'a' will return 0

434

asking for 'b' will return 1

435

asking for 'e' will return 1

436

"""

437

search_key = (key, None)

438

return self._find_index(self._parsed_key_map, search_key)

439

440

def _is_parsed(self, offset):

441

"""Returns True if offset has been parsed."""

442

index = self._parsed_byte_index(offset)

443

if index == len(self._parsed_byte_map):

444

return offset < self._parsed_byte_map[index - 1][1]

445

start, end = self._parsed_byte_map[index]

446

return offset >= start and offset < end

447

448

def _iter_entries_from_total_buffer(self, keys):

449

"""Iterate over keys when the entire index is parsed."""

450

keys = keys.intersection(self._keys)

451

if self.node_ref_lists:

452

for key in keys:

453

value, node_refs = self._nodes[key]

454

yield self, key, value, node_refs

455

else:

456

for key in keys:

457

yield self, key, self._nodes[key]

458

459

def iter_entries(self, keys):

460

"""Iterate over keys within the index.

461

462

:param keys: An iterable providing the keys to be retrieved.

463

:return: An iterable as per iter_all_entries, but restricted to the

464

keys supplied. No additional keys will be returned, and every

465

key supplied that is in the index will be returned.

466

"""

467

# PERFORMANCE TODO: parse and bisect all remaining data at some

468

# threshold of total-index processing/get calling layers that expect to

469

# read the entire index to use the iter_all_entries method instead.

470

keys = set(keys)

471

if not keys:

472

return []

473

if self._size is None and self._nodes is None:

474

self._buffer_all()

475

if self._nodes is not None:

476

return self._iter_entries_from_total_buffer(keys)

477

else:

478

return (result[1] for result in bisect_multi_bytes(

479

self._lookup_keys_via_location, self._size, keys))

480

481

def iter_entries_prefix(self, keys):

482

"""Iterate over keys within the index using prefix matching.

483

484

Prefix matching is applied within the tuple of a key, not to within

485

the bytestring of each key element. e.g. if you have the keys ('foo',

486

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

487

only the former key is returned.

488

489

WARNING: Note that this method currently causes a full index parse

490

unconditionally (which is reasonably appropriate as it is a means for

491

thunking many small indices into one larger one and still supplies

492

iter_all_entries at the thunk layer).

493

494

:param keys: An iterable providing the key prefixes to be retrieved.

495

Each key prefix takes the form of a tuple the length of a key, but

496

with the last N elements 'None' rather than a regular bytestring.

497

The first element cannot be 'None'.

498

:return: An iterable as per iter_all_entries, but restricted to the

499

keys with a matching prefix to those supplied. No additional keys

500

will be returned, and every match that is in the index will be

501

returned.

502

"""

503

keys = set(keys)

504

if not keys:

505

return

506

# load data - also finds key lengths

507

if self._nodes is None:

508

self._buffer_all()

509

if self._key_length == 1:

510

for key in keys:

511

# sanity check

512

if key[0] is None:

513

raise errors.BadIndexKey(key)

514

if len(key) != self._key_length:

515

raise errors.BadIndexKey(key)

516

if self.node_ref_lists:

517

value, node_refs = self._nodes[key]

518

yield self, key, value, node_refs

519

else:

520

yield self, key, self._nodes[key]

521

return

522

for key in keys:

523

# sanity check

524

if key[0] is None:

525

raise errors.BadIndexKey(key)

526

if len(key) != self._key_length:

527

raise errors.BadIndexKey(key)

528

# find what it refers to:

529

key_dict = self._nodes_by_key

530

elements = list(key)

531

# find the subdict whose contents should be returned.

532

try:

533

while len(elements) and elements[0] is not None:

534

key_dict = key_dict[elements[0]]

535

elements.pop(0)

536

except KeyError:

537

# a non-existant lookup.

538

continue

539

if len(elements):

540

dicts = [key_dict]

541

while dicts:

542

key_dict = dicts.pop(-1)

543

# can't be empty or would not exist

544

item, value = key_dict.iteritems().next()

545

if type(value) == dict:

546

# push keys

547

dicts.extend(key_dict.itervalues())

548

else:

549

# yield keys

550

for value in key_dict.itervalues():

551

# each value is the key:value:node refs tuple

552

# ready to yield.

553

yield (self, ) + value

554

else:

555

# the last thing looked up was a terminal element

556

yield (self, ) + key_dict

557

558

def key_count(self):

559

"""Return an estimate of the number of keys in this index.

560

561

For GraphIndex the estimate is exact.

562

"""

563

if self._key_count is None:

564

self._read_and_parse([_HEADER_READV])

565

return self._key_count

566

567

def _lookup_keys_via_location(self, location_keys):
    """Bisection callback: probe the index at the given locations.

    This is the function iter_entries hands to bisect_multi_bytes.

    If _buffer_all has been called, then all the data for the index is in
    memory, and this method should not be called, as it uses a separate
    cache because it cannot pre-resolve all indices, which buffer_all does
    for performance.

    :param location_keys: A list of location(byte offset), key tuples.
    :return: A list of (location_key, result) tuples as expected by
        bzrlib.bisect_multi.bisect_multi_bytes. result is the entry tuple
        (index, key, value[, references]) when the key was found, False
        when the region that would hold the key has been parsed and the key
        is not there, and otherwise -1 or +1 to say the key sorts before or
        after the probed location.
    """
    # Possible improvements:
    #  - only bisect lookup each key once
    #  - sort the keys first, and use that to reduce the bisection window
    # -----
    # this progresses in three parts:
    # read data
    # parse it
    # attempt to answer the question from the now in memory data.
    # build the readv request
    # for each location, ask for 800 bytes - much more than rows we've seen
    # anywhere.
    readv_ranges = []
    for location, key in location_keys:
        # can we answer from cache?
        if self._bisect_nodes and key in self._bisect_nodes:
            # We have the key parsed.
            continue
        index = self._parsed_key_index(key)
        if (len(self._parsed_key_map) and
            self._parsed_key_map[index][0] <= key and
            (self._parsed_key_map[index][1] >= key or
             # end of the file has been parsed
             self._parsed_byte_map[index][1] == self._size)):
            # the key has been parsed, so no lookup is needed even if its
            # not present.
            continue
        # - if we have examined this part of the file already - yes
        index = self._parsed_byte_index(location)
        if (len(self._parsed_byte_map) and
            self._parsed_byte_map[index][0] <= location and
            self._parsed_byte_map[index][1] > location):
            # the byte region has been parsed, so no read is needed.
            continue
        length = 800
        if location + length > self._size:
            length = self._size - location
        # todo, trim out parsed locations.
        if length > 0:
            readv_ranges.append((location, length))
    # read the header if needed
    if self._bisect_nodes is None:
        readv_ranges.append(_HEADER_READV)
    self._read_and_parse(readv_ranges)
    # generate results:
    #  - figure out <, >, missing, present
    #  - result present references so we can return them.
    result = []
    # keys that we cannot answer until we resolve references
    pending_references = []
    pending_locations = set()
    for location, key in location_keys:
        # can we answer from cache?
        if key in self._bisect_nodes:
            # the key has been parsed, so no lookup is needed
            if self.node_ref_lists:
                # the references may not have been all parsed.
                value, refs = self._bisect_nodes[key]
                wanted_locations = []
                for ref_list in refs:
                    for ref in ref_list:
                        if ref not in self._keys_by_offset:
                            wanted_locations.append(ref)
                if wanted_locations:
                    pending_locations.update(wanted_locations)
                    pending_references.append((location, key))
                    continue
                result.append(((location, key), (self, key,
                    value, self._resolve_references(refs))))
            else:
                result.append(((location, key),
                    (self, key, self._bisect_nodes[key])))
            continue
        else:
            # has the region the key should be in, been parsed?
            index = self._parsed_key_index(key)
            if (self._parsed_key_map[index][0] <= key and
                (self._parsed_key_map[index][1] >= key or
                 # end of the file has been parsed
                 self._parsed_byte_map[index][1] == self._size)):
                result.append(((location, key), False))
                continue
        # no, is the key above or below the probed location:
        # get the range of the probed & parsed location
        index = self._parsed_byte_index(location)
        # if the key is below the start of the range, its below
        if key < self._parsed_key_map[index][0]:
            direction = -1
        else:
            direction = +1
        result.append(((location, key), direction))
    readv_ranges = []
    # lookup data to resolve references
    for location in pending_locations:
        length = 800
        if location + length > self._size:
            length = self._size - location
        # TODO: trim out parsed locations (e.g. if the 800 is into the
        # parsed region trim it, and dont use the adjust_for_latency
        # facility)
        if length > 0:
            readv_ranges.append((location, length))
    self._read_and_parse(readv_ranges)
    for location, key in pending_references:
        # answer key references we had to look-up-late.
        value, refs = self._bisect_nodes[key]
        result.append(((location, key), (self, key,
            value, self._resolve_references(refs))))
    return result

688

689

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    Sets self.node_ref_lists, self._key_length and self._key_count, records
    the header as parsed, and initialises the bisection parsing state.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data. (which may be of length 0).
    :raises BadIndexFormatSignature: if the signature does not match.
    :raises BadIndexOptions: if an option line has the wrong prefix or a
        non-integer value.
    """
    signature = bytes[0:len(self._signature())]
    if signature != self._signature():
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(self._signature()):].splitlines()
    # (option line prefix, attribute that receives the parsed integer)
    expected_options = (
        (_OPTION_NODE_REFS, 'node_ref_lists'),
        (_OPTION_KEY_ELEMENTS, '_key_length'),
        (_OPTION_LEN, '_key_count'),
        )
    # running total of the bytes consumed by the header.
    header_end = len(signature)
    for line_number, (prefix, attribute) in enumerate(expected_options):
        options_line = lines[line_number]
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            parsed = int(options_line[len(prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)
        setattr(self, attribute, parsed)
        # +1 for the newline that splitlines removed.
        header_end += len(options_line) + 1
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

732

733

def _parse_region(self, offset, data):

734

"""Parse node data returned from a readv operation.

735

736

:param offset: The byte offset the data starts at.

737

:param data: The data to parse.

738

"""

739

# trim the data.

740

# end first:

741

end = offset + len(data)

742

high_parsed = offset

743

while True:

744

# Trivial test - if the current index's end is within the

745

# low-matching parsed range, we're done.

746

index = self._parsed_byte_index(high_parsed)

747

if end < self._parsed_byte_map[index][1]:

748

return

749

# print "[%d:%d]" % (offset, end), \

750

# self._parsed_byte_map[index:index + 2]

751

high_parsed, last_segment = self._parse_segment(

752

offset, data, end, index)

753

if last_segment:

754

return

755

756

def _parse_segment(self, offset, data, end, index):
    """Parse one segment of data.

    The unparsed part of data lying after parsed range ``index`` is trimmed
    to whole lines, parsed with _parse_lines, stored in self._bisect_nodes
    and recorded as parsed with _parsed_bytes.

    :param offset: Where 'data' begins in the file.
    :param data: Some data to parse a segment of.
    :param end: Where data ends
    :param index: The current index into the parsed bytes map.
    :return: high_parsed_byte, last_segment.
        high_parsed_byte is the location of the highest parsed byte in this
        segment, last_segment is True if the parsed segment is the last
        possible one in the data block.
    :raises AssertionError: if a newline needed for trimming is missing, or
        if nothing is left to parse after trimming.
    """
    # default is to use all data
    trim_end = None
    # accommodate overlap with data before this.
    if offset < self._parsed_byte_map[index][1]:
        # overlaps the lower parsed region
        # skip the parsed data
        trim_start = self._parsed_byte_map[index][1] - offset
        # don't trim the start for \n
        start_adjacent = True
    elif offset == self._parsed_byte_map[index][1]:
        # abuts the lower parsed region
        # use all data
        trim_start = None
        # do not trim anything
        start_adjacent = True
    else:
        # does not overlap the lower parsed region
        # use all data
        trim_start = None
        # but trim the leading \n
        start_adjacent = False
    if end == self._size:
        # lines up to the end of all data:
        # use it all
        trim_end = None
        # do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif index + 1 == len(self._parsed_byte_map):
        # at the end of the parsed data
        # use it all
        trim_end = None
        # but strip to the last \n
        end_adjacent = False
        last_segment = True
    elif end == self._parsed_byte_map[index + 1][0]:
        # butts up against the next parsed region
        # use it all
        trim_end = None
        # do not strip to the last \n
        end_adjacent = True
        last_segment = True
    elif end > self._parsed_byte_map[index + 1][0]:
        # overlaps into the next parsed region
        # only consider the unparsed data
        trim_end = self._parsed_byte_map[index + 1][0] - offset
        # do not strip to the last \n as we know its an entire record
        end_adjacent = True
        # more unparsed data may follow the next parsed region.
        last_segment = end < self._parsed_byte_map[index + 1][1]
    else:
        # does not overlap into the next region
        # use it all
        trim_end = None
        # but strip to the last \n
        end_adjacent = False
        last_segment = True
    # now find bytes to discard if needed
    if not start_adjacent:
        # The data starts mid-line: skip to just past the first newline.
        # work around python bug in rfind
        # NOTE(review): start_adjacent is only False in the branch above
        # that sets trim_start to None, so the else arm looks unreachable.
        if trim_start is None:
            trim_start = data.find('\n') + 1
        else:
            trim_start = data.find('\n', trim_start) + 1
        if not (trim_start != 0):
            raise AssertionError('no \n was present')
    if not end_adjacent:
        # The data may end mid-line: cut back to just past the last newline.
        # work around python bug in rfind
        # NOTE(review): end_adjacent is only False in branches above that
        # set trim_end to None, so the else arm looks unreachable.
        if trim_end is None:
            trim_end = data.rfind('\n') + 1
        else:
            trim_end = data.rfind('\n', None, trim_end) + 1
        if not (trim_end != 0):
            raise AssertionError('no \n was present')
    # adjust offset and data to the parseable data.
    trimmed_data = data[trim_start:trim_end]
    if not (trimmed_data):
        raise AssertionError('read unneeded data [%d:%d] from [%d:%d]'
            % (trim_start, trim_end, offset, offset + len(data)))
    if trim_start:
        offset += trim_start
    # splitlines mangles the \r delimiters.. don't use it.
    lines = trimmed_data.split('\n')
    # split leaves the text after the final newline as the last item; it is
    # not a complete line, so drop it.
    del lines[-1]
    pos = offset
    first_key, last_key, nodes, _ = self._parse_lines(lines, pos)
    for key, value in nodes:
        self._bisect_nodes[key] = value
    self._parsed_bytes(offset, first_key,
        offset + len(trimmed_data), last_key)
    return offset + len(trimmed_data), last_segment

863

864

def _parse_lines(self, lines, pos):

865

key = None

866

first_key = None

867

trailers = 0

868

nodes = []

869

for line in lines:

870

if line == '':

871

# must be at the end

872

if self._size:

873

if not (self._size == pos + 1):

874

raise AssertionError("%s %s" % (self._size, pos))

875

trailers += 1

876

continue

877

elements = line.split('\0')

878

if len(elements) != self._expected_elements:

879

raise errors.BadIndexData(self)

880

# keys are tuples

881

key = tuple(elements[:self._key_length])

882

if first_key is None:

883

first_key = key

884

absent, references, value = elements[-3:]

885

ref_lists = []

886

for ref_string in references.split('\t'):

887

ref_lists.append(tuple([

888

int(ref) for ref in ref_string.split('\r') if ref

889

]))

890

ref_lists = tuple(ref_lists)

891

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

892

pos += len(line) + 1 # +1 for the \n

893

if absent:

894

continue

895

if self.node_ref_lists:

896

node_value = (value, ref_lists)

897

else:

898

node_value = value

899

nodes.append((key, node_value))

900

# print "parsed ", key

901

return first_key, key, nodes, trailers

902

903

def _parsed_bytes(self, start, start_key, end, end_key):

904

"""Mark the bytes from start to end as parsed.

905

906

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

907

1) as parsed.

908

909

:param start: The start of the parsed region.

910

:param end: The end of the parsed region.

911

"""

912

index = self._parsed_byte_index(start)

913

new_value = (start, end)

914

new_key = (start_key, end_key)

915

if index == -1:

916

# first range parsed is always the beginning.

917

self._parsed_byte_map.insert(index, new_value)

918

self._parsed_key_map.insert(index, new_key)

919

return

920

# four cases:

921

# new region

922

# extend lower region

923

# extend higher region

924

# combine two regions

925

if (index + 1 < len(self._parsed_byte_map) and

926

self._parsed_byte_map[index][1] == start and

927

self._parsed_byte_map[index + 1][0] == end):

928

# combine two regions

929

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

930

self._parsed_byte_map[index + 1][1])

931

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

932

self._parsed_key_map[index + 1][1])

933

del self._parsed_byte_map[index + 1]

934

del self._parsed_key_map[index + 1]

935

elif self._parsed_byte_map[index][1] == start:

936

# extend the lower entry

937

self._parsed_byte_map[index] = (

938

self._parsed_byte_map[index][0], end)

939

self._parsed_key_map[index] = (

940

self._parsed_key_map[index][0], end_key)

941

elif (index + 1 < len(self._parsed_byte_map) and

942

self._parsed_byte_map[index + 1][0] == end):

943

# extend the higher entry

944

self._parsed_byte_map[index + 1] = (

945

start, self._parsed_byte_map[index + 1][1])

946

self._parsed_key_map[index + 1] = (

947

start_key, self._parsed_key_map[index + 1][1])

948

else:

949

# new entry

950

self._parsed_byte_map.insert(index + 1, new_value)

951

self._parsed_key_map.insert(index + 1, new_key)

952

953

def _read_and_parse(self, readv_ranges):

954

"""Read the the ranges and parse the resulting data.

955

956

:param readv_ranges: A prepared readv range list.

957

"""

958

if readv_ranges:

959

readv_data = self._transport.readv(self._name, readv_ranges, True,

960

self._size)

961

# parse

962

for offset, data in readv_data:

963

if self._bisect_nodes is None:

964

# this must be the start

965

if not (offset == 0):

966

raise AssertionError()

967

offset, data = self._parse_header_from_bytes(data)

968

# print readv_ranges, "[%d:%d]" % (offset, offset + len(data))

969

self._parse_region(offset, data)

970

971

def _signature(self):
    """Return the file signature used by this index type.

    :return: The module level _SIGNATURE constant.
    """
    return _SIGNATURE

974

975

def validate(self):
    """Validate that everything in the index can be accessed.

    Validation is done by exhausting self.iter_all_entries(); any error it
    raises propagates to the caller.
    """
    # iter_all_entries validates completely at the moment, so draining it
    # is all that is needed.
    for _ in self.iter_all_entries():
        pass

980

981

982

class CombinedGraphIndex(object):
    """A GraphIndex made up from smaller GraphIndices.

    The backing indices must implement GraphIndex, and are presumed to be
    static data.

    Queries are answered by asking the first index, then the second, and
    so on, so the order of the indices can influence performance
    significantly. For example, an index on local disk should be listed
    before one that lives on a remote server.
    """

    def __init__(self, indices):
        """Create a CombinedGraphIndex backed by indices.

        :param indices: An ordered list of indices to query for data. The
            list is kept by reference, not copied.
        """
        self._indices = indices

    def __repr__(self):
        child_reprs = ', '.join([repr(index) for index in self._indices])
        return "%s(%s)" % (self.__class__.__name__, child_reprs)

    @symbol_versioning.deprecated_method(symbol_versioning.one_one)
    def get_parents(self, revision_ids):
        """See graph._StackedParentsProvider.get_parents.

        This implementation thunks the graph.Graph.get_parents api across
        to GraphIndex by way of get_parent_map.

        :param revision_ids: An iterable of graph keys for this graph.
        :return: A list of parent details for each key in revision_ids.
            Each parent details will be one of:
             * None when the key was missing
             * (NULL_REVISION,) when the key has no parents.
             * (parent_key, parent_key...) otherwise.
        """
        parent_map = self.get_parent_map(revision_ids)
        return [parent_map.get(revision_id) for revision_id in revision_ids]

    def get_parent_map(self, keys):
        """See graph._StackedParentsProvider.get_parent_map"""
        wanted = set(keys)
        found = {}
        if NULL_REVISION in wanted:
            # NULL_REVISION is answered directly and never looked up.
            wanted.discard(NULL_REVISION)
            found[NULL_REVISION] = []
        for _index, key, _value, refs in self.iter_entries(wanted):
            # The first reference list holds the parents; an empty one
            # means the only parent is NULL_REVISION.
            found[key] = refs[0] or (NULL_REVISION,)
        return found

    def insert_index(self, pos, index):
        """Insert a new index in the list of indices to query.

        :param pos: The position to insert the index.
        :param index: The index to insert.
        """
        self._indices.insert(pos, index)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :return: An iterable of the nodes produced by the child indices,
            (index, key, value, reference_lists). There is no defined
            order for the result iteration - it will be in the most
            efficient order for the index.
        """
        reported = set()
        for index in self._indices:
            for node in index.iter_all_entries():
                key = node[1]
                if key in reported:
                    continue
                yield node
                reported.add(key)

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of the nodes produced by the child indices,
            (index, key, value, reference_lists). There is no defined
            order for the result iteration - it will be in the most
            efficient order for the index.
        """
        remaining = set(keys)
        for index in self._indices:
            if not remaining:
                # Everything has been found; later indices are not asked.
                break
            for node in index.iter_entries(remaining):
                remaining.remove(node[1])
                yield node

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys
        ('foo', 'bar'), ('foobar', 'gam') and do a prefix search for
        ('foo', None) then only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key,
            but with the last N elements 'None' rather than a regular
            bytestring. The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional
            keys will be returned, and every match that is in the index
            will be returned.
        """
        prefixes = set(keys)
        if not prefixes:
            return
        reported = set()
        for index in self._indices:
            for node in index.iter_entries_prefix(prefixes):
                key = node[1]
                if key not in reported:
                    reported.add(key)
                    yield node

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For CombinedGraphIndex this is approximated by the sum of the keys
        of the child indices. As child indices may have duplicate keys this
        can have a maximum error of the number of child indices * largest
        number of keys in any index.
        """
        total = 0
        for index in self._indices:
            total += index.key_count()
        return total

    def validate(self):
        """Validate that everything in the index can be accessed."""
        for index in self._indices:
            index.validate()

1128

1129

1130

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during
    a single write operation, where the accumulated entries need to be
    immediately available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add
            when this index has reference lists, or of (key, value) entries
            when it does not.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when this index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (in this case
            dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        if self.reference_lists:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value, references
        else:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists), or of
            (index, key, value) when this index has no reference lists.
            There is no defined order for the result iteration - it will be
            in the most efficient order for the index (keys iteration order
            in this case).
        """
        keys = set(keys)
        if self.reference_lists:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2], node[1]
        else:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys
        ('foo', 'bar'), ('foobar', 'gam') and do a prefix search for
        ('foo', None) then only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key,
            but with the last N elements 'None' rather than a regular
            bytestring. The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional
            keys will be returned, and every match that is in the index
            will be returned. A prefix that matches nothing yields nothing.
        :raises errors.BadIndexKey: If a prefix starts with None or is not
            the same length as the keys of this index.
        """
        # XXX: Too much duplication with the GraphIndex class; consider
        # finding a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                try:
                    node = self._nodes[key]
                except KeyError:
                    # A key this index does not hold is simply not a match,
                    # exactly as in the multi-element path below.
                    continue
                if node[0]:
                    # Recorded as absent: not a real entry.
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
            return
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = self._nodes_by_key
            elements = list(key)
            # Walk down the nested dicts for every leading non-None
            # element to find the subdict to return.
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                # Trailing None elements remain: emit every entry found
                # below this point.
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    sample = key_dict.itervalues().next()
                    if isinstance(sample, dict):
                        # Still an intermediate level: push its children.
                        dicts.extend(key_dict.itervalues())
                    else:
                        # Leaf level: the values are the entries to yield.
                        for value in key_dict.itervalues():
                            yield (self, ) + value
            else:
                # The prefix was a complete key, so key_dict is the entry.
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory index's have no known corruption at the moment."""

1268

1269

1270

class GraphIndexPrefixAdapter(object):
    """An adapter between GraphIndex with different key lengths.

    Queries against this will emit queries against the adapted Graph with
    the prefix added, queries for all items use iter_entries_prefix. The
    returned nodes will have their keys and node references adjusted to
    remove the prefix. Finally, an add_nodes_callback can be supplied - when
    called the nodes and references being added will have prefix prepended.
    """

    def __init__(self, adapted, prefix, missing_key_length,
        add_nodes_callback=None):
        """Construct an adapter against adapted with prefix.

        :param adapted: The index that queries are forwarded to.
        :param prefix: A tuple of key elements prepended to every key sent
            to adapted and stripped from every key it returns.
        :param missing_key_length: The number of None elements appended to
            prefix to build the prefix key used by iter_all_entries.
        :param add_nodes_callback: Called by add_nodes with the list of
            translated nodes.
        """
        self.adapted = adapted
        self.prefix_key = prefix + (None,)*missing_key_length
        self.prefix = prefix
        self.prefix_len = len(prefix)
        self.add_nodes_callback = add_nodes_callback

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add,
            or of (key, value) entries for an index without reference
            lists.
        """
        # save nodes in case its an iterator
        nodes = tuple(nodes)
        try:
            # node_refs is a tuple of tuples of keys, so take it apart and
            # put the prefix in front of every referenced key.
            translated_nodes = [
                (self.prefix + key, value,
                 tuple(tuple(self.prefix + ref_node for ref_node in ref_list)
                       for ref_list in node_refs))
                for (key, value, node_refs) in nodes]
        except ValueError:
            # Unpacking failed, so these are (key, value) nodes.
            # XXX: TODO add an explicit interface for getting the reference
            # list status, to handle this bit of user-friendliness in the
            # API more explicitly.
            translated_nodes = [
                (self.prefix + key, value) for (key, value) in nodes]
        self.add_nodes_callback(translated_nodes)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain \\0 or \\n.
        """
        self.add_nodes(((key, value, references), ))

    def _strip_prefix(self, an_iter):
        """Strip prefix data from nodes and return it.

        :param an_iter: An iterable of (index, key, value, reference_lists)
            nodes, or of (index, key, value) nodes from an index without
            reference lists.
        :return: A generator of the same nodes with the prefix removed from
            the key and from every referenced key.
        :raises errors.BadIndexData: If a key or a referenced key does not
            start with the prefix.
        """
        prefix = self.prefix
        prefix_len = self.prefix_len
        for node in an_iter:
            # cross checks
            if node[1][:prefix_len] != prefix:
                raise errors.BadIndexData(self)
            stripped_key = node[1][prefix_len:]
            if len(node) < 4:
                # No reference lists on this node, so only the key needs
                # adjusting.
                yield node[0], stripped_key, node[2]
                continue
            for ref_list in node[3]:
                for ref_node in ref_list:
                    if ref_node[:prefix_len] != prefix:
                        raise errors.BadIndexData(self)
            yield node[0], stripped_key, node[2], tuple(
                tuple(ref_node[prefix_len:] for ref_node in ref_list)
                for ref_list in node[3])

    def iter_all_entries(self):
        """Iterate over all keys within the index

        iter_all_entries is implemented against the adapted index using
        iter_entries_prefix.

        :return: An iterable of (index, key, value, reference_lists). There
            is no defined order for the result iteration - it follows the
            order in which the adapted index returns its nodes.
        """
        return self._strip_prefix(
            self.adapted.iter_entries_prefix([self.prefix_key]))

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There
            is no defined order for the result iteration - it follows the
            order in which the adapted index returns its nodes.
        """
        return self._strip_prefix(self.adapted.iter_entries(
            self.prefix + key for key in keys))

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys
        ('foo', 'bar'), ('foobar', 'gam') and do a prefix search for
        ('foo', None) then only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key,
            but with the last N elements 'None' rather than a regular
            bytestring. The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional
            keys will be returned, and every match that is in the index
            will be returned.
        """
        return self._strip_prefix(self.adapted.iter_entries_prefix(
            self.prefix + key for key in keys))

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndexPrefixAdapter this is relatively expensive - key
        iteration with the prefix is done.
        """
        # Count while iterating rather than building a list of every node.
        return sum(1 for _ in self.iter_all_entries())

    def validate(self):
        """Call the adapted's validate."""
        self.adapted.validate()

Older »