~bzr-pqm/bzr/bzr.dev

Committer: John Arbash Meinel
Date: 2008-08-18 22:34:21 UTC
mto: (3606.5.6 1.6)
mto: This revision was merged to the branch mainline in revision 3641.
Revision ID: john@arbash-meinel.com-20080818223421-todjny24vj4faj4t

Add tests for the fetching behavior.

The proper parameter to pass is 'unordered'; add an assert for it, and
fix callers that were passing 'unsorted' instead.
Add tests that we make the right get_record_stream call based
on the value of _fetch_uses_deltas.
Fix the fetch request for signatures.

files added:
COPYING.txt

bzr.ico

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_walkdirs_win32.h

bzrlib/_walkdirs_win32.pyx

bzrlib/api.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/cache_utf8.py

bzrlib/cmd_version_info.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/email_message.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/pack.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/push.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/revisiontree.py

bzrlib/rules.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/tag.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test__generate_text_key_index.py

bzrlib/tests/repository_implementations/test_add_fallback_repository.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_find_text_key_references.py

bzrlib/tests/repository_implementations/test_get_parent_map.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_is_write_locked.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/timestamp.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/nosmart.py

bzrlib/transport/remote.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/util/bencode.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/workingtree_4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/packrepo.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/index.txt

man1

profile_imports.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/package_mf.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

tools/win32/survey.txt

files removed:
NEWS.developers

build-api

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_escaped_store.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/README.1st

files renamed:
bzrlib/patiencediff.py => bzrlib/_patiencediff_py.py

bzrlib/bundle/read_bundle.py => bzrlib/bundle/bundle_data.py

bzrlib/bundle/serializer/v07.py => bzrlib/bundle/serializer/v08.py

bzrlib/graph.py => bzrlib/deprecated_graph.py

doc/configuration.txt => bzrlib/help_topics/en/configuration.txt

bzrlib/tests/HTTPTestUtil.py => bzrlib/tests/http_utils.py

bzrlib/tests/test_revprops.py => bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/test_command.py => bzrlib/tests/test_commands.py

bzrlib/tests/test_graph.py => bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/tests/test_revisionspec.py

bzrlib/win32console.py => bzrlib/win32utils.py

bzrlib/xml5.py => bzrlib/xml8.py

HACKING => doc/developers/HACKING.txt

doc/tutorial.txt => doc/en/tutorials/tutorial.txt

doc/plugins.txt => doc/en/user-guide/plugins.txt

doc/setting_up_email.txt => doc/en/user-guide/setting_up_email.txt

doc/specifying_revisions.txt => doc/en/user-guide/specifying_revisions.txt

doc/using_aliases.txt => doc/en/user-guide/using_aliases.txt

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/elementtree/ElementTree.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml_serializer.py

contrib/bash/bzr.simple

contrib/newinventory.py

generate_docs.py

setup.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/trace-revisions

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

symbol_versioning,

)

# NOTE(review): presumably the (offset, length) range read to fetch the
# index header -- confirm against the code that consumes it.
_HEADER_READV = (0, 200)

# Literal text of header option lines. 'node_ref_lists=' appears in the
# OPTIONS grammar documented on GraphIndexBuilder; the other two are
# presumably parallel option prefixes -- confirm against finish().
_OPTION_KEY_ELEMENTS = "key_elements="

_OPTION_LEN = "len="

_OPTION_NODE_REFS = "node_ref_lists="

# First line of a serialised index (see the _SIGNATURE rule in the
# GraphIndexBuilder docstring).
_SIGNATURE = "Bazaar Graph Index 1\n"

# Matches any single whitespace or NUL byte; _check_key uses it to reject
# key elements containing such bytes.
_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

# Matches a newline or NUL byte; add_node uses it to reject values
# containing either.
_newline_null_re = re.compile('[\n\0]')

class GraphIndexBuilder(object):

"""A builder that can build a GraphIndex.

The resulting graph has the structure:

_SIGNATURE OPTIONS NODES NEWLINE

_SIGNATURE := 'Bazaar Graph Index 1' NEWLINE

OPTIONS := 'node_ref_lists=' DIGITS NEWLINE

NODES := NODE*

NODE := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

KEY := Not-whitespace-utf8

ABSENT := 'a'

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

REFERENCE := DIGITS ; digits is the byte offset in the index of the

; referenced key.

VALUE := no-newline-no-null-bytes

"""

def __init__(self, reference_lists=0, key_elements=1):
    """Set up an empty builder.

    :param reference_lists: How many reference lists every node added to
        this builder must supply.
    :param key_elements: How many bytestrings make up each key tuple.
    """
    # Shape of the index being built.
    self._key_length = key_elements
    self.reference_lists = reference_lists
    # Accumulated content; everything starts out empty.
    # _nodes maps key -> (absent marker, reference lists, value).
    self._nodes = dict()
    # Nested dicts keyed by successive key elements; only filled in by
    # add_node when keys have more than one element.
    self._nodes_by_key = dict()
    # Keys that have been added as real (non-placeholder) nodes.
    self._keys = set()

def _check_key(self, key):

"""Raise BadIndexKey if key is not a valid key for this index."""

if type(key) != tuple:

raise errors.BadIndexKey(key)

if self._key_length != len(key):

raise errors.BadIndexKey(key)

for element in key:

if not element or _whitespace_re.search(element) is not None:

raise errors.BadIndexKey(element)

def add_node(self, key, value, references=()):

"""Add a node to the index.

100

:param key: The key. keys are non-empty tuples containing

101

as many whitespace-free utf8 bytestrings as the key length

102

defined for this index.

103

:param references: An iterable of iterables of keys. Each is a

104

reference to another key.

105

:param value: The value to associate with the key. It may be any

106

bytes as long as it does not contain \0 or \n.

107

"""

108

self._check_key(key)

109

if _newline_null_re.search(value) is not None:

110

raise errors.BadIndexValue(value)

111

if len(references) != self.reference_lists:

112

raise errors.BadIndexValue(references)

113

node_refs = []

114

for reference_list in references:

115

for reference in reference_list:

116

self._check_key(reference)

117

if reference not in self._nodes:

118

self._nodes[reference] = ('a', (), '')

119

node_refs.append(tuple(reference_list))

120

if key in self._nodes and self._nodes[key][0] == '':

121

raise errors.BadIndexDuplicateKey(key, self)

122

self._nodes[key] = ('', tuple(node_refs), value)

123

self._keys.add(key)

124

if self._key_length > 1:

125

key_dict = self._nodes_by_key

126

if self.reference_lists:

127

key_value = key, value, tuple(node_refs)

128

else:

129

key_value = key, value

130

# possibly should do this on-demand, but it seems likely it is

131

# always wanted

132

# For a key of (foo, bar, baz) create

133

# _nodes_by_key[foo][bar][baz] = key_value

134

for subkey in key[:-1]:

135

key_dict = key_dict.setdefault(subkey, {})

136

key_dict[key[-1]] = key_value

137

138

def finish(self):

139

lines = [_SIGNATURE]

140

lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')

141

lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')

142

lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')

143

prefix_length = sum(len(x) for x in lines)

144

# references are byte offsets. To avoid having to do nasty

145

# polynomial work to resolve offsets (references to later in the

146

# file cannot be determined until all the inbetween references have

147

# been calculated too) we pad the offsets with 0's to make them be

148

# of consistent length. Using binary offsets would break the trivial

149

# file parsing.

150

# to calculate the width of zero's needed we do three passes:

151

# one to gather all the non-reference data and the number of references.

152

# one to pad all the data with reference-length and determine entry

153

# addresses.

154

# One to serialise.

155

156

# forward sorted by key. In future we may consider topological sorting,

157

# at the cost of table scans for direct lookup, or a second index for

158

# direct lookup

159

nodes = sorted(self._nodes.items())

160

# if we do not prepass, we don't know how long it will be up front.

161

expected_bytes = None

162

# we only need to pre-pass if we have reference lists at all.

163

if self.reference_lists:

164

key_offset_info = []

165

non_ref_bytes = prefix_length

166

total_references = 0

167

# TODO use simple multiplication for the constants in this loop.

168

for key, (absent, references, value) in nodes:

169

# record the offset known *so far* for this key:

170

# the non reference bytes to date, and the total references to

171

# date - saves reaccumulating on the second pass

172

key_offset_info.append((key, non_ref_bytes, total_references))

173

# key is literal, value is literal, there are 3 null's, 1 NL

174

# key is variable length tuple, \x00 between elements

175

non_ref_bytes += sum(len(element) for element in key)

176

if self._key_length > 1:

177

non_ref_bytes += self._key_length - 1

178

# value is literal bytes, there are 3 null's, 1 NL.

179

non_ref_bytes += len(value) + 3 + 1

180

# one byte for absent if set.

181

if absent:

182

non_ref_bytes += 1

183

elif self.reference_lists:

184

# (ref_lists -1) tabs

185

non_ref_bytes += self.reference_lists - 1

186

# (ref-1 cr's per ref_list)

187

for ref_list in references:

188

# how many references across the whole file?

189

total_references += len(ref_list)

190

# accrue reference separators

191

if ref_list:

192

non_ref_bytes += len(ref_list) - 1

193

# how many digits are needed to represent the total byte count?

194

digits = 1

195

possible_total_bytes = non_ref_bytes + total_references*digits

196

while 10 ** digits < possible_total_bytes:

197

digits += 1

198

possible_total_bytes = non_ref_bytes + total_references*digits

199

expected_bytes = possible_total_bytes + 1 # terminating newline

200

# resolve key addresses.

201

key_addresses = {}

202

for key, non_ref_bytes, total_references in key_offset_info:

203

key_addresses[key] = non_ref_bytes + total_references*digits

204

# serialise

205

format_string = '%%0%sd' % digits

206

for key, (absent, references, value) in nodes:

207

flattened_references = []

208

for ref_list in references:

209

ref_addresses = []

210

for reference in ref_list:

211

ref_addresses.append(format_string % key_addresses[reference])

212

flattened_references.append('\r'.join(ref_addresses))

213

string_key = '\x00'.join(key)

214

lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,

215

'\t'.join(flattened_references), value))

216

lines.append('\n')

217

result = StringIO(''.join(lines))

218

if expected_bytes and len(result.getvalue()) != expected_bytes:

219

raise errors.BzrError('Failed index creation. Internal error:'

220

' mismatched output length and expected length: %d %d' %

221

(len(result.getvalue()), expected_bytes))

222

return result

223

224

225

class GraphIndex(object):

226

"""An index for data with embedded graphs.

227

228

The index maps keys to a list of key reference lists, and a value.

229

Each node has the same number of key reference lists. Each key reference

230

list can be empty or an arbitrary length. The value is an opaque NULL

231

terminated string without any newlines. The storage of the index is

232

hidden in the interface: keys and key references are always tuples of

233

bytestrings, never the internal representation (e.g. dictionary offsets).

234

235

It is presumed that the index will not be mutated - it is static data.

236

237

Successive iter_all_entries calls will read the entire index each time.

238

Additionally, iter_entries calls will read the index linearly until the

239

desired keys are found. XXX: This must be fixed before the index is

240

suitable for production use. :XXX

241

"""

242

243

def __init__(self, transport, name, size):

244

"""Open an index called name on transport.

245

246

:param transport: A bzrlib.transport.Transport.

247

:param name: A path to provide to transport API calls.

248

:param size: The size of the index in bytes. This is used for bisection

249

logic to perform partial index reads. While the size could be

250

obtained by statting the file this introduced an additional round

251

trip as well as requiring stat'able transports, both of which are

252

avoided by having it supplied. If size is None, then bisection

253

support will be disabled and accessing the index will just stream

254

all the data.

255

"""

256

self._transport = transport

257

self._name = name

258

# Becomes a dict of key:(value, reference-list-byte-locations) used by

259

# the bisection interface to store parsed but not resolved keys.

260

self._bisect_nodes = None

261

# Becomes a dict of key:(value, reference-list-keys) which are ready to

262

# be returned directly to callers.

263

self._nodes = None

264

# a sorted list of slice-addresses for the parsed bytes of the file.

265

# e.g. (0,1) would mean that byte 0 is parsed.

266

self._parsed_byte_map = []

267

# a sorted list of keys matching each slice address for parsed bytes

268

# e.g. (None, 'foo@bar') would mean that the first byte contained no

269

# key, and the end byte of the slice is the of the data for 'foo@bar'

270

self._parsed_key_map = []

271

self._key_count = None

272

self._keys_by_offset = None

273

self._nodes_by_key = None

274

self._size = size

275

276

def __eq__(self, other):

277

"""Equal when self and other were created with the same parameters."""

278

return (

279

type(self) == type(other) and

280

self._transport == other._transport and

281

self._name == other._name and

282

self._size == other._size)

283

284

def __ne__(self, other):

285

return not self.__eq__(other)

286

287

def __repr__(self):

288

return "%s(%r)" % (self.__class__.__name__,

289

self._transport.abspath(self._name))

290

291

def _buffer_all(self):
    """Buffer all the index data.

    Reads the whole index from the transport, parses it, and resolves
    every reference into a key.

    Mutates self._nodes, self._nodes_by_key, self._keys and
    self._keys_by_offset.

    :raises BadIndexData: if the data does not end with exactly one empty
        trailer line.
    """
    if 'index' in debug.debug_flags:
        mutter('Reading entire index %s', self._transport.abspath(self._name))
    stream = self._transport.get(self._name)
    self._read_prefix(stream)
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # ready-to-return key:value or key:value, node_ref_lists
    self._nodes = {}
    self._nodes_by_key = {}
    pos = stream.tell()
    lines = stream.read().split('\n')
    # the data ends with a newline, so the final split element is empty.
    del lines[-1]
    _, _, _, trailers = self._parse_lines(lines, pos)
    for key, absent, references, value in self._keys_by_offset.itervalues():
        if absent:
            continue
        # resolve references:
        if self.node_ref_lists:
            node_value = (value, self._resolve_references(references))
        else:
            node_value = value
        self._nodes[key] = node_value
        if self._key_length > 1:
            key_dict = self._nodes_by_key
            if self.node_ref_lists:
                key_value = key, node_value[0], node_value[1]
            else:
                key_value = key, node_value
            # possibly should do this on-demand, but it seems likely it is
            # always wanted
            # For a key of (foo, bar, baz) create
            # _nodes_by_key[foo][bar][baz] = key_value
            for subkey in key[:-1]:
                key_dict = key_dict.setdefault(subkey, {})
            key_dict[key[-1]] = key_value
    # cache the keys for quick set intersections
    self._keys = set(self._nodes)
    if trailers != 1:
        # there must be one line - the empty trailer line.
        raise errors.BadIndexData(self)

340

341

def iter_all_entries(self):
    """Iterate over all keys within the index.

    The whole index is buffered first if that has not happened yet.

    :return: An iterable of (index, key, value) or (index, key, value,
        reference_lists). The former tuple is used when there are no
        reference lists in the index, making the API compatible with simple
        key:value index types. There is no defined order for the result
        iteration - it will be in the most efficient order for the index.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if self._nodes is None:
        self._buffer_all()
    if not self.node_ref_lists:
        # plain key:value index
        for key, value in self._nodes.iteritems():
            yield self, key, value
        return
    for key, node in self._nodes.iteritems():
        value, node_ref_lists = node
        yield self, key, value, node_ref_lists

361

362

def _read_prefix(self, stream):
    """Read the signature and the three option lines from stream.

    Sets self.node_ref_lists, self._key_length and self._key_count.

    :param stream: A file-like object positioned at the start of the index.
    :raises BadIndexFormatSignature: if the signature does not match.
    :raises BadIndexOptions: if an option line has the wrong prefix or a
        non-integer value.
    """
    signature = stream.read(len(self._signature()))
    if not signature == self._signature():
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)

    def read_option(prefix):
        # Consume one option line and return its integer value.
        options_line = stream.readline()
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            # the slice drops the prefix and the trailing newline
            return int(options_line[len(prefix):-1])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = read_option(_OPTION_NODE_REFS)
    self._key_length = read_option(_OPTION_KEY_ELEMENTS)
    self._key_count = read_option(_OPTION_LEN)

387

388

def _resolve_references(self, references):

389

"""Return the resolved key references for references.

390

391

References are resolved by looking up the location of the key in the

392

_keys_by_offset map and substituting the key name, preserving ordering.

393

394

:param references: An iterable of iterables of key locations. e.g.

395

[[123, 456], [123]]

396

:return: A tuple of tuples of keys.

397

"""

398

node_refs = []

399

for ref_list in references:

400

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

401

return tuple(node_refs)

402

403

def _find_index(self, range_map, key):

404

"""Helper for the _parsed_*_index calls.

405

406

Given a range map - [(start, end), ...], finds the index of the range

407

in the map for key if it is in the map, and if it is not there, the

408

immediately preceeding range in the map.

409

"""

410

result = bisect_right(range_map, key) - 1

411

if result + 1 < len(range_map):

412

# check the border condition, it may be in result + 1

413

if range_map[result + 1][0] == key[0]:

414

return result + 1

415

return result

416

417

def _parsed_byte_index(self, offset):

418

"""Return the index of the entry immediately before offset.

419

420

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

421

there is one unparsed byte (the 11th, addressed as[10]). then:

422

asking for 0 will return 0

423

asking for 10 will return 0

424

asking for 11 will return 1

425

asking for 12 will return 1

426

"""

427

key = (offset, 0)

428

return self._find_index(self._parsed_byte_map, key)

429

430

def _parsed_key_index(self, key):

431

"""Return the index of the entry immediately before key.

432

433

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

434

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

435

have been parsed, then:

436

asking for '' will return 0

437

asking for 'a' will return 0

438

asking for 'b' will return 1

439

asking for 'e' will return 1

440

"""

441

search_key = (key, None)

442

return self._find_index(self._parsed_key_map, search_key)

443

444

def _is_parsed(self, offset):

445

"""Returns True if offset has been parsed."""

446

index = self._parsed_byte_index(offset)

447

if index == len(self._parsed_byte_map):

448

return offset < self._parsed_byte_map[index - 1][1]

449

start, end = self._parsed_byte_map[index]

450

return offset >= start and offset < end

451

452

def _iter_entries_from_total_buffer(self, keys):

453

"""Iterate over keys when the entire index is parsed."""

454

keys = keys.intersection(self._keys)

455

if self.node_ref_lists:

456

for key in keys:

457

value, node_refs = self._nodes[key]

458

yield self, key, value, node_refs

459

else:

460

for key in keys:

461

yield self, key, self._nodes[key]

462

463

def iter_entries(self, keys):

464

"""Iterate over keys within the index.

465

466

:param keys: An iterable providing the keys to be retrieved.

467

:return: An iterable as per iter_all_entries, but restricted to the

468

keys supplied. No additional keys will be returned, and every

469

key supplied that is in the index will be returned.

470

"""

471

keys = set(keys)

472

if not keys:

473

return []

474

if self._size is None and self._nodes is None:

475

self._buffer_all()

476

# We fit about 20 keys per minimum-read (4K), so if we are looking for

477

# more than 1/20th of the index its likely (assuming homogenous key

478

# spread) that we'll read the entire index. If we're going to do that,

479

# buffer the whole thing. A better analysis might take key spread into

480

# account - but B+Tree indices are better anyway.

481

# We could look at all data read, and use a threshold there, which will

482

# trigger on ancestry walks, but that is not yet fully mapped out.

483

if self._nodes is None and len(keys) * 20 > self.key_count():

484

self._buffer_all()

485

if self._nodes is not None:

486

return self._iter_entries_from_total_buffer(keys)

487

else:

488

return (result[1] for result in bisect_multi_bytes(

489

self._lookup_keys_via_location, self._size, keys))

490

491

def iter_entries_prefix(self, keys):

492

"""Iterate over keys within the index using prefix matching.

493

494

Prefix matching is applied within the tuple of a key, not to within

495

the bytestring of each key element. e.g. if you have the keys ('foo',

496

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

497

only the former key is returned.

498

499

WARNING: Note that this method currently causes a full index parse

500

unconditionally (which is reasonably appropriate as it is a means for

501

thunking many small indices into one larger one and still supplies

502

iter_all_entries at the thunk layer).

503

504

:param keys: An iterable providing the key prefixes to be retrieved.

505

Each key prefix takes the form of a tuple the length of a key, but

506

with the last N elements 'None' rather than a regular bytestring.

507

The first element cannot be 'None'.

508

:return: An iterable as per iter_all_entries, but restricted to the

509

keys with a matching prefix to those supplied. No additional keys

510

will be returned, and every match that is in the index will be

511

returned.

512

"""

513

keys = set(keys)

514

if not keys:

515

return

516

# load data - also finds key lengths

517

if self._nodes is None:

518

self._buffer_all()

519

if self._key_length == 1:

520

for key in keys:

521

# sanity check

522

if key[0] is None:

523

raise errors.BadIndexKey(key)

524

if len(key) != self._key_length:

525

raise errors.BadIndexKey(key)

526

if self.node_ref_lists:

527

value, node_refs = self._nodes[key]

528

yield self, key, value, node_refs

529

else:

530

yield self, key, self._nodes[key]

531

return

532

for key in keys:

533

# sanity check

534

if key[0] is None:

535

raise errors.BadIndexKey(key)

536

if len(key) != self._key_length:

537

raise errors.BadIndexKey(key)

538

# find what it refers to:

539

key_dict = self._nodes_by_key

540

elements = list(key)

541

# find the subdict whose contents should be returned.

542

try:

543

while len(elements) and elements[0] is not None:

544

key_dict = key_dict[elements[0]]

545

elements.pop(0)

546

except KeyError:

547

# a non-existant lookup.

548

continue

549

if len(elements):

550

dicts = [key_dict]

551

while dicts:

552

key_dict = dicts.pop(-1)

553

# can't be empty or would not exist

554

item, value = key_dict.iteritems().next()

555

if type(value) == dict:

556

# push keys

557

dicts.extend(key_dict.itervalues())

558

else:

559

# yield keys

560

for value in key_dict.itervalues():

561

# each value is the key:value:node refs tuple

562

# ready to yield.

563

yield (self, ) + value

564

else:

565

# the last thing looked up was a terminal element

566

yield (self, ) + key_dict

567

568

def key_count(self):

569

"""Return an estimate of the number of keys in this index.

570

571

For GraphIndex the estimate is exact.

572

"""

573

if self._key_count is None:

574

self._read_and_parse([_HEADER_READV])

575

return self._key_count

576

577

def _lookup_keys_via_location(self, location_keys):

578

"""Public interface for implementing bisection.

579

580

If _buffer_all has been called, then all the data for the index is in

581

memory, and this method should not be called, as it uses a separate

582

cache because it cannot pre-resolve all indices, which buffer_all does

583

for performance.

584

585

:param location_keys: A list of location(byte offset), key tuples.

586

:return: A list of (location_key, result) tuples as expected by

587

bzrlib.bisect_multi.bisect_multi_bytes.

588

"""

589

# Possible improvements:

590

# - only bisect lookup each key once

591

# - sort the keys first, and use that to reduce the bisection window

592

# -----

593

# this progresses in three parts:

594

# read data

595

# parse it

596

# attempt to answer the question from the now in memory data.

597

# build the readv request

598

# for each location, ask for 800 bytes - much more than rows we've seen

599

# anywhere.

600

readv_ranges = []

601

for location, key in location_keys:

602

# can we answer from cache?

603

if self._bisect_nodes and key in self._bisect_nodes:

604

# We have the key parsed.

605

continue

606

index = self._parsed_key_index(key)

607

if (len(self._parsed_key_map) and

608

self._parsed_key_map[index][0] <= key and

609

(self._parsed_key_map[index][1] >= key or

610

# end of the file has been parsed

611

self._parsed_byte_map[index][1] == self._size)):

612

# the key has been parsed, so no lookup is needed even if its

613

# not present.

614

continue

615

# - if we have examined this part of the file already - yes

616

index = self._parsed_byte_index(location)

617

if (len(self._parsed_byte_map) and

618

self._parsed_byte_map[index][0] <= location and

619

self._parsed_byte_map[index][1] > location):

620

# the byte region has been parsed, so no read is needed.

621

continue

622

length = 800

623

if location + length > self._size:

624

length = self._size - location

625

# todo, trim out parsed locations.

626

if length > 0:

627

readv_ranges.append((location, length))

628

# read the header if needed

629

if self._bisect_nodes is None:

630

readv_ranges.append(_HEADER_READV)

631

self._read_and_parse(readv_ranges)

632

# generate results:

633

# - figure out <, >, missing, present

634

# - result present references so we can return them.

635

result = []

636

# keys that we cannot answer until we resolve references

637

pending_references = []

638

pending_locations = set()

639

for location, key in location_keys:

640

# can we answer from cache?

641

if key in self._bisect_nodes:

642

# the key has been parsed, so no lookup is needed

643

if self.node_ref_lists:

644

# the references may not have been all parsed.

645

value, refs = self._bisect_nodes[key]

646

wanted_locations = []

647

for ref_list in refs:

648

for ref in ref_list:

649

if ref not in self._keys_by_offset:

650

wanted_locations.append(ref)

651

if wanted_locations:

652

pending_locations.update(wanted_locations)

653

pending_references.append((location, key))

654

continue

655

result.append(((location, key), (self, key,

656

value, self._resolve_references(refs))))

657

else:

658

result.append(((location, key),

659

(self, key, self._bisect_nodes[key])))

660

continue

661

else:

662

# has the region the key should be in, been parsed?

663

index = self._parsed_key_index(key)

664

if (self._parsed_key_map[index][0] <= key and

665

(self._parsed_key_map[index][1] >= key or

666

# end of the file has been parsed

667

self._parsed_byte_map[index][1] == self._size)):

668

result.append(((location, key), False))

669

continue

670

# no, is the key above or below the probed location:

671

# get the range of the probed & parsed location

672

index = self._parsed_byte_index(location)

673

# if the key is below the start of the range, its below

674

if key < self._parsed_key_map[index][0]:

675

direction = -1

676

else:

677

direction = +1

678

result.append(((location, key), direction))

679

readv_ranges = []

680

# lookup data to resolve references

681

for location in pending_locations:

682

length = 800

683

if location + length > self._size:

684

length = self._size - location

685

# TODO: trim out parsed locations (e.g. if the 800 is into the

686

# parsed region trim it, and dont use the adjust_for_latency

687

# facility)

688

if length > 0:

689

readv_ranges.append((location, length))

690

self._read_and_parse(readv_ranges)

691

for location, key in pending_references:

692

# answer key references we had to look-up-late.

693

index = self._parsed_key_index(key)

694

value, refs = self._bisect_nodes[key]

695

result.append(((location, key), (self, key,

696

value, self._resolve_references(refs))))

697

return result

698

699

def _parse_header_from_bytes(self, bytes):
    """Parse the header from a region of bytes.

    Sets self.node_ref_lists, self._key_length and self._key_count, marks
    the header bytes as parsed and resets the bisection parsing state.

    :param bytes: The data to parse.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data. (which may be of length 0).
    :raises BadIndexFormatSignature: if the signature does not match.
    :raises BadIndexOptions: if an option line has the wrong prefix or a
        non-integer value.
    """
    signature = bytes[0:len(self._signature())]
    if not signature == self._signature():
        raise errors.BadIndexFormatSignature(self._name, GraphIndex)
    lines = bytes[len(self._signature()):].splitlines()

    def option_value(options_line, prefix):
        # Return the integer that follows prefix on options_line.
        if not options_line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        try:
            return int(options_line[len(prefix):])
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = option_value(lines[0], _OPTION_NODE_REFS)
    self._key_length = option_value(lines[1], _OPTION_KEY_ELEMENTS)
    self._key_count = option_value(lines[2], _OPTION_LEN)
    # calculate the bytes we have processed: the signature plus the three
    # option lines, each of which lost one line terminator to splitlines.
    header_end = len(signature) + sum(len(line) for line in lines[:3]) + 3
    self._parsed_bytes(0, None, header_end, None)
    # setup parsing state
    self._expected_elements = 3 + self._key_length
    # raw data keyed by offset
    self._keys_by_offset = {}
    # keys with the value and node references
    self._bisect_nodes = {}
    return header_end, bytes[header_end:]

742

743

def _parse_region(self, offset, data):

744

"""Parse node data returned from a readv operation.

745

746

:param offset: The byte offset the data starts at.

747

:param data: The data to parse.

748

"""

749

# trim the data.

750

# end first:

751

end = offset + len(data)

752

high_parsed = offset

753

while True:

754

# Trivial test - if the current index's end is within the

755

# low-matching parsed range, we're done.

756

index = self._parsed_byte_index(high_parsed)

757

if end < self._parsed_byte_map[index][1]:

758

return

759

# print "[%d:%d]" % (offset, end), \

760

# self._parsed_byte_map[index:index + 2]

761

high_parsed, last_segment = self._parse_segment(

762

offset, data, end, index)

763

if last_segment:

764

return

765

766

def _parse_segment(self, offset, data, end, index):
    """Parse one segment of data.

    :param offset: Where 'data' begins in the file.
    :param data: Some data to parse a segment of.
    :param end: Where data ends
    :param index: The current index into the parsed bytes map.
    :return: high_parsed_byte, last_segment.
        high_parsed_byte is the location of the highest parsed byte in this
        segment, last_segment is True if the parsed segment is the last
        possible one in the data block.
    """
    parsed = self._parsed_byte_map
    # --- relation to the parsed region below this data ---
    lower_end = parsed[index][1]
    trim_start = None
    start_adjacent = True
    if offset < lower_end:
        # overlaps the lower parsed region: skip the parsed data, and do
        # not search for a leading \n.
        trim_start = lower_end - offset
    elif offset != lower_end:
        # neither overlaps nor abuts the lower parsed region: use all the
        # data, but trim up to the first \n.
        start_adjacent = False
    # --- relation to the end of file / the parsed region above ---
    # default is to use all data
    trim_end = None
    if end == self._size:
        # lines up to the end of all data: use it all and do not strip to
        # the last \n
        end_adjacent = True
        last_segment = True
    elif index + 1 == len(parsed):
        # at the end of the parsed data: use it all but strip to the last
        # \n
        end_adjacent = False
        last_segment = True
    else:
        next_start, next_end = parsed[index + 1]
        if end == next_start:
            # buts up against the next parsed region: use it all and do not
            # strip to the last \n
            end_adjacent = True
            last_segment = True
        elif end > next_start:
            # overlaps into the next parsed region: only consider the
            # unparsed data, and do not strip to the last \n as we know its
            # an entire record
            trim_end = next_start - offset
            end_adjacent = True
            last_segment = end < next_end
        else:
            # does not overlap into the next region: use it all but strip
            # to the last \n
            end_adjacent = False
            last_segment = True
    # now find bytes to discard if needed
    if not start_adjacent:
        # work around python bug in rfind
        if trim_start is None:
            trim_start = data.find('\n') + 1
        else:
            trim_start = data.find('\n', trim_start) + 1
        if trim_start == 0:
            raise AssertionError('no \n was present')
    if not end_adjacent:
        # work around python bug in rfind
        if trim_end is None:
            trim_end = data.rfind('\n') + 1
        else:
            trim_end = data.rfind('\n', None, trim_end) + 1
        if trim_end == 0:
            raise AssertionError('no \n was present')
    # adjust offset and data to the parseable data.
    trimmed_data = data[trim_start:trim_end]
    if not trimmed_data:
        raise AssertionError('read unneeded data [%d:%d] from [%d:%d]'
            % (trim_start, trim_end, offset, offset + len(data)))
    if trim_start:
        offset += trim_start
    # splitlines mangles the \r delimiters.. don't use it.
    lines = trimmed_data.split('\n')
    del lines[-1]
    first_key, last_key, nodes, _ = self._parse_lines(lines, offset)
    for key, value in nodes:
        self._bisect_nodes[key] = value
    segment_end = offset + len(trimmed_data)
    self._parsed_bytes(offset, first_key, segment_end, last_key)
    return segment_end, last_segment

873

874

def _parse_lines(self, lines, pos):

875

key = None

876

first_key = None

877

trailers = 0

878

nodes = []

879

for line in lines:

880

if line == '':

881

# must be at the end

882

if self._size:

883

if not (self._size == pos + 1):

884

raise AssertionError("%s %s" % (self._size, pos))

885

trailers += 1

886

continue

887

elements = line.split('\0')

888

if len(elements) != self._expected_elements:

889

raise errors.BadIndexData(self)

890

# keys are tuples. Each element is a string that may occur many

891

# times, so we intern them to save space. AB, RC, 200807

892

key = tuple(intern(element) for element in elements[:self._key_length])

893

if first_key is None:

894

first_key = key

895

absent, references, value = elements[-3:]

896

ref_lists = []

897

for ref_string in references.split('\t'):

898

ref_lists.append(tuple([

899

int(ref) for ref in ref_string.split('\r') if ref

900

]))

901

ref_lists = tuple(ref_lists)

902

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

903

pos += len(line) + 1 # +1 for the \n

904

if absent:

905

continue

906

if self.node_ref_lists:

907

node_value = (value, ref_lists)

908

else:

909

node_value = value

910

nodes.append((key, node_value))

911

# print "parsed ", key

912

return first_key, key, nodes, trailers

913

914

def _parsed_bytes(self, start, start_key, end, end_key):

915

"""Mark the bytes from start to end as parsed.

916

917

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

918

1) as parsed.

919

920

:param start: The start of the parsed region.

921

:param end: The end of the parsed region.

922

"""

923

index = self._parsed_byte_index(start)

924

new_value = (start, end)

925

new_key = (start_key, end_key)

926

if index == -1:

927

# first range parsed is always the beginning.

928

self._parsed_byte_map.insert(index, new_value)

929

self._parsed_key_map.insert(index, new_key)

930

return

931

# four cases:

932

# new region

933

# extend lower region

934

# extend higher region

935

# combine two regions

936

if (index + 1 < len(self._parsed_byte_map) and

937

self._parsed_byte_map[index][1] == start and

938

self._parsed_byte_map[index + 1][0] == end):

939

# combine two regions

940

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

941

self._parsed_byte_map[index + 1][1])

942

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

943

self._parsed_key_map[index + 1][1])

944

del self._parsed_byte_map[index + 1]

945

del self._parsed_key_map[index + 1]

946

elif self._parsed_byte_map[index][1] == start:

947

# extend the lower entry

948

self._parsed_byte_map[index] = (

949

self._parsed_byte_map[index][0], end)

950

self._parsed_key_map[index] = (

951

self._parsed_key_map[index][0], end_key)

952

elif (index + 1 < len(self._parsed_byte_map) and

953

self._parsed_byte_map[index + 1][0] == end):

954

# extend the higher entry

955

self._parsed_byte_map[index + 1] = (

956

start, self._parsed_byte_map[index + 1][1])

957

self._parsed_key_map[index + 1] = (

958

start_key, self._parsed_key_map[index + 1][1])

959

else:

960

# new entry

961

self._parsed_byte_map.insert(index + 1, new_value)

962

self._parsed_key_map.insert(index + 1, new_key)

963

964

def _read_and_parse(self, readv_ranges):

965

"""Read the the ranges and parse the resulting data.

966

967

:param readv_ranges: A prepared readv range list.

968

"""

969

if readv_ranges:

970

readv_data = self._transport.readv(self._name, readv_ranges, True,

971

self._size)

972

# parse

973

for offset, data in readv_data:

974

if self._bisect_nodes is None:

975

# this must be the start

976

if not (offset == 0):

977

raise AssertionError()

978

offset, data = self._parse_header_from_bytes(data)

979

# print readv_ranges, "[%d:%d]" % (offset, offset + len(data))

980

self._parse_region(offset, data)

981

982

def _signature(self):
    """Return the file signature used by this index type.

    :return: The module-level _SIGNATURE constant.
    """
    return _SIGNATURE

985

986

def validate(self):
    """Validate that everything in the index can be accessed.

    This walks every entry produced by iter_all_entries and discards it,
    relying on that iteration to do the validation.
    """
    for _entry in self.iter_all_entries():
        continue

991

992

993

class CombinedGraphIndex(object):
    """Several GraphIndex objects presented as a single index.

    The backing indices must implement GraphIndex, and are presumed to be
    static data.

    Queries are sent to the backing indices in list order: the first index
    is asked first, then the second and so on. The order of the indices can
    therefore influence performance significantly. For example, if one
    index is on local disk and another on a remote server, the local disk
    index should come first in the list.
    """

    def __init__(self, indices):
        """Create a CombinedGraphIndex backed by indices.

        :param indices: An ordered list of indices to query for data. The
            list is kept by reference, not copied.
        """
        self._indices = indices

    def __repr__(self):
        child_reprs = [repr(child) for child in self._indices]
        return "%s(%s)" % (self.__class__.__name__, ', '.join(child_reprs))

    @symbol_versioning.deprecated_method(symbol_versioning.one_one)
    def get_parents(self, revision_ids):
        """See graph._StackedParentsProvider.get_parents.

        This is a thin wrapper that answers the graph.Graph.get_parents api
        from get_parent_map.

        :param revision_ids: An iterable of graph keys for this graph.
        :return: A list of parent details for each key in revision_ids.
            Each parent details will be one of:
             * None when the key was missing
             * (NULL_REVISION,) when the key has no parents.
             * (parent_key, parent_key...) otherwise.
        """
        known = self.get_parent_map(revision_ids)
        details = []
        for revision_id in revision_ids:
            details.append(known.get(revision_id, None))
        return details

    def get_parent_map(self, keys):
        """See graph._StackedParentsProvider.get_parent_map.

        :param keys: An iterable of keys to look up.
        :return: A dict mapping each key that was found to its first
            reference list, or to (NULL_REVISION,) when that list is empty.
            NULL_REVISION itself, when asked for, maps to an empty list.
        """
        wanted = set(keys)
        parent_map = {}
        if NULL_REVISION in wanted:
            # NULL_REVISION is answered here and never sent to the indices.
            wanted.discard(NULL_REVISION)
            parent_map[NULL_REVISION] = []
        for _index, key, _value, refs in self.iter_entries(wanted):
            parent_map[key] = refs[0] or (NULL_REVISION,)
        return parent_map

    def insert_index(self, pos, index):
        """Insert a new index in the list of indices to query.

        :param pos: The position to insert the index.
        :param index: The index to insert.
        """
        self._indices.insert(pos, index)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        :return: An iterable of the nodes produced by the child indices'
            iter_all_entries, with the key at position 1 of each node.
            There is no defined order for the result iteration - it will
            be in the most efficient order for the index.
        """
        reported = set()
        for child in self._indices:
            for node in child.iter_all_entries():
                if node[1] in reported:
                    continue
                yield node
                reported.add(node[1])

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once: a key that has been found is not
        asked of the later indices.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of the nodes produced by the child indices'
            iter_entries. There is no defined order for the result
            iteration - it will be in the most efficient order for the
            index.
        """
        outstanding = set(keys)
        for child in self._indices:
            if not outstanding:
                # Everything asked for has been found already.
                return
            for node in child.iter_entries(outstanding):
                outstanding.remove(node[1])
                yield node

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Duplicate keys across child indices are presumed to have the same
        value and are only reported once.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        prefixes = set(keys)
        if not prefixes:
            return
        reported = set()
        for child in self._indices:
            for node in child.iter_entries_prefix(prefixes):
                if node[1] not in reported:
                    reported.add(node[1])
                    yield node

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For CombinedGraphIndex this is approximated by the sum of the keys of
        the child indices. As child indices may have duplicate keys this can
        have a maximum error of the number of child indices * largest number of
        keys in any index.
        """
        total = 0
        for child in self._indices:
            total += child.key_count()
        return total

    def validate(self):
        """Validate that everything in the index can be accessed."""
        for child in self._indices:
            child.validate()

1139

1140

1141

class InMemoryGraphIndex(GraphIndexBuilder):
    """A GraphIndex which operates entirely out of memory and is mutable.

    This is designed to allow the accumulation of GraphIndex entries during a
    single write operation, where the accumulated entries need to be immediately
    available - for example via a CombinedGraphIndex.
    """

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add
            when this index has reference lists, and of (key, value)
            entries otherwise.
        """
        if self.reference_lists:
            for (key, value, node_refs) in nodes:
                self.add_node(key, value, node_refs)
        else:
            for (key, value) in nodes:
                self.add_node(key, value)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        Nodes flagged as absent are not reported.

        :return: An iterable of (index, key, value, reference_lists) when
            the index has reference lists, and of (index, key, value)
            otherwise. There is no defined order for the result iteration -
            it will be in the most efficient order for the index (in this
            case dictionary hash order).
        """
        if 'evil' in debug.debug_flags:
            trace.mutter_callsite(3,
                "iter_all_entries scales with size of history.")
        if self.reference_lists:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value, references
        else:
            for key, (absent, references, value) in self._nodes.iteritems():
                if not absent:
                    yield self, key, value

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        Keys that are not in the index, and nodes flagged as absent, are
        not reported.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists) when
            the index has reference lists, and of (index, key, value)
            otherwise. There is no defined order for the result iteration -
            it will be in the most efficient order for the index (keys
            iteration order in this case).
        """
        keys = set(keys)
        if self.reference_lists:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2], node[1]
        else:
            for key in keys.intersection(self._keys):
                node = self._nodes[key]
                if not node[0]:
                    yield self, key, node[2]

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned. A prefix that matches nothing yields nothing.
        :raises errors.BadIndexKey: If a prefix starts with None or does not
            have the key length of this index.
        """
        # XXX: Too much duplication with the GraphIndex class; consider finding
        # a good place to pull out the actual common logic.
        keys = set(keys)
        if not keys:
            return
        if self._key_length == 1:
            for key in keys:
                # sanity check
                if key[0] is None:
                    raise errors.BadIndexKey(key)
                if len(key) != self._key_length:
                    raise errors.BadIndexKey(key)
                try:
                    node = self._nodes[key]
                except KeyError:
                    # A non-existent lookup: skip it, as the multi-element
                    # path below does, rather than failing the whole query.
                    continue
                if node[0]:
                    # Absent nodes are never reported.
                    continue
                if self.reference_lists:
                    yield self, key, node[2], node[1]
                else:
                    yield self, key, node[2]
            return
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            # find what it refers to:
            key_dict = self._nodes_by_key
            elements = list(key)
            # find the subdict to return
            try:
                while len(elements) and elements[0] is not None:
                    key_dict = key_dict[elements[0]]
                    elements.pop(0)
            except KeyError:
                # a non-existent lookup.
                continue
            if len(elements):
                # Some trailing elements were None: walk everything below
                # the point the prefix reached.
                dicts = [key_dict]
                while dicts:
                    key_dict = dicts.pop(-1)
                    # can't be empty or would not exist
                    sample = key_dict.itervalues().next()
                    if isinstance(sample, dict):
                        # push the nested dicts
                        dicts.extend(key_dict.itervalues())
                    else:
                        # yield the nodes stored at this level
                        for found in key_dict.itervalues():
                            yield (self, ) + found
            else:
                # The whole key was given, so key_dict is the node itself.
                yield (self, ) + key_dict

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For InMemoryGraphIndex the estimate is exact.
        """
        return len(self._keys)

    def validate(self):
        """In memory index's have no known corruption at the moment."""

1279

1280

1281

class GraphIndexPrefixAdapter(object):
    """An adapter between GraphIndex with different key lengths.

    Queries made here are forwarded to the adapted index with the prefix
    added to every key; a query for all items is done with
    iter_entries_prefix. The nodes that come back have the prefix removed
    from their keys and node references. An add_nodes_callback can also be
    supplied - when nodes are added, the nodes and references passed to it
    have the prefix prepended.
    """

    def __init__(self, adapted, prefix, missing_key_length,
        add_nodes_callback=None):
        """Construct an adapter against adapted with prefix.

        :param adapted: The index that queries are forwarded to.
        :param prefix: The tuple of key elements to add and strip.
        :param missing_key_length: How many None elements follow prefix in
            the prefix key used to query for all entries.
        :param add_nodes_callback: Called by add_nodes with the list of
            prefixed nodes.
        """
        self.adapted = adapted
        self.prefix = prefix
        self.prefix_len = len(prefix)
        self.prefix_key = prefix + (None,) * missing_key_length
        self.add_nodes_callback = add_nodes_callback

    def add_nodes(self, nodes):
        """Add nodes to the index.

        :param nodes: An iterable of (key, value, node_refs) entries to add,
            or of (key, value) entries when there are no reference lists.
        """
        # Keep the nodes around, as they may come from an iterator.
        pending = tuple(nodes)
        prefix = self.prefix
        translated = []
        try:
            # node_refs is a tuple of tuples of keys; each of those keys gets
            # the prefix too.
            for key, value, node_refs in pending:
                prefixed_refs = tuple([
                    tuple([prefix + ref_node for ref_node in ref_list])
                    for ref_list in node_refs])
                translated.append((prefix + key, value, prefixed_refs))
        except ValueError:
            # XXX: TODO add an explicit interface for getting the reference list
            # status, to handle this bit of user-friendliness in the API more
            # explicitly.
            for key, value in pending:
                translated.append((prefix + key, value))
        self.add_nodes_callback(translated)

    def add_node(self, key, value, references=()):
        """Add a node to the index.

        :param key: The key. keys are non-empty tuples containing
            as many whitespace-free utf8 bytestrings as the key length
            defined for this index.
        :param references: An iterable of iterables of keys. Each is a
            reference to another key.
        :param value: The value to associate with the key. It may be any
            bytes as long as it does not contain NUL or newline.
        """
        single_node = (key, value, references)
        self.add_nodes((single_node, ))

    def _strip_prefix(self, an_iter):
        """Strip prefix data from nodes and return it.

        :param an_iter: An iterable of (index, key, value, reference_lists)
            nodes from the adapted index.
        :return: A generator of the same nodes with the prefix removed from
            the key and from every referenced key.
        :raises errors.BadIndexData: If a key or a referenced key does not
            start with the prefix.
        """
        for node in an_iter:
            cut = self.prefix_len
            # cross checks
            if node[1][:cut] != self.prefix:
                raise errors.BadIndexData(self)
            stripped_lists = []
            for ref_list in node[3]:
                stripped = []
                for ref_node in ref_list:
                    if ref_node[:cut] != self.prefix:
                        raise errors.BadIndexData(self)
                    stripped.append(ref_node[cut:])
                stripped_lists.append(tuple(stripped))
            yield node[0], node[1][cut:], node[2], tuple(stripped_lists)

    def iter_all_entries(self):
        """Iterate over all keys within the index

        iter_all_entries is implemented against the adapted index using
        iter_entries_prefix.

        :return: An iterable of (index, key, value, reference_lists). There
            is no defined order for the result iteration - it is whatever
            order the adapted index produces.
        """
        matches = self.adapted.iter_entries_prefix([self.prefix_key])
        return self._strip_prefix(matches)

    def iter_entries(self, keys):
        """Iterate over keys within the index.

        :param keys: An iterable providing the keys to be retrieved.
        :return: An iterable of (index, key, value, reference_lists). There
            is no defined order for the result iteration - it is whatever
            order the adapted index produces.
        """
        prefixed_keys = (self.prefix + key for key in keys)
        return self._strip_prefix(self.adapted.iter_entries(prefixed_keys))

    def iter_entries_prefix(self, keys):
        """Iterate over keys within the index using prefix matching.

        Prefix matching is applied within the tuple of a key, not to within
        the bytestring of each key element. e.g. if you have the keys ('foo',
        'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
        only the former key is returned.

        :param keys: An iterable providing the key prefixes to be retrieved.
            Each key prefix takes the form of a tuple the length of a key, but
            with the last N elements 'None' rather than a regular bytestring.
            The first element cannot be 'None'.
        :return: An iterable as per iter_all_entries, but restricted to the
            keys with a matching prefix to those supplied. No additional keys
            will be returned, and every match that is in the index will be
            returned.
        """
        prefixed_keys = (self.prefix + key for key in keys)
        return self._strip_prefix(
            self.adapted.iter_entries_prefix(prefixed_keys))

    def key_count(self):
        """Return an estimate of the number of keys in this index.

        For GraphIndexPrefixAdapter this is relatively expensive - key
        iteration with the prefix is done.
        """
        count = 0
        for _node in self.iter_all_entries():
            count += 1
        return count

    def validate(self):
        """Call the adapted's validate."""
        self.adapted.validate()

Older »