~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/index.py

Committer: Robert Collins
Date: 2009-07-14 00:20:03 UTC
mto: This revision was merged to the branch mainline in revision 4553.
Revision ID: robertc@robertcollins.net-20090714002003-ingqr8vlkz5577v1

Require that added ids in inventory deltas be new.

files added:
BRANCH.TODO

COPYING.txt

INSTALL

bzr.ico

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/email_message.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/store/revision

bzrlib/store/versioned

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave_commands.py

bzrlib/win32utils.py

bzrlib/workingtree_4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

doc/bazaar-vcs.org.kid

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/developer-guide

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/Makefile

doc/es/quick-reference/quick-start-summary.pdf

doc/es/quick-reference/quick-start-summary.png

doc/es/quick-reference/quick-start-summary.svg

doc/es/release-notes

doc/es/user-guide

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/es/user-reference

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/news-template.txt

doc/ru

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/Makefile

doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/quick-reference/quick-start-summary.png

doc/ru/quick-reference/quick-start-summary.svg

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/check-newsbugs.py

tools/generate_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/trace-revisions

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/build_release.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
NEWS.developers

build-api

bzrlib/clone.py

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/revfile.py

bzrlib/store/compressed_text.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

files renamed:
bzrlib/changeset.py => bzrlib/bundle/__init__.py

bzrlib/graph.py => bzrlib/deprecated_graph.py

bzr-man.py => bzrlib/doc_generate/autodoc_man.py

bzrlib/store/weave.py => bzrlib/store/versioned/__init__.py

bzrlib/selftest/ => bzrlib/tests/

bzrlib/selftest/test_revision_info.py => bzrlib/tests/blackbox/test_revision_info.py

bzrlib/selftest/teststatus.py => bzrlib/tests/blackbox/test_status.py

bzrlib/selftest/blackbox.py => bzrlib/tests/blackbox/test_too_much.py

bzrlib/selftest/versioning.py => bzrlib/tests/blackbox/test_versioning.py

bzrlib/selftest/HTTPTestUtil.py => bzrlib/tests/http_utils.py

bzrlib/selftest/testbranch.py => bzrlib/tests/per_branch/test_branch.py

bzrlib/selftest/test_parent.py => bzrlib/tests/per_branch/test_parent.py

bzrlib/selftest/testgraph.py => bzrlib/tests/test_deprecated_graph.py

bzrlib/selftest/testdiff.py => bzrlib/tests/test_diff.py

bzrlib/selftest/testfetch.py => bzrlib/tests/test_fetch.py

bzrlib/selftest/testhashcache.py => bzrlib/tests/test_hashcache.py

bzrlib/selftest/testinv.py => bzrlib/tests/test_inv.py

bzrlib/selftest/testlog.py => bzrlib/tests/test_log.py

bzrlib/selftest/testmerge.py => bzrlib/tests/test_merge.py

bzrlib/selftest/testmerge3.py => bzrlib/tests/test_merge3.py

bzrlib/selftest/plugins.py => bzrlib/tests/test_plugins.py

bzrlib/selftest/testrevision.py => bzrlib/tests/test_revision.py

bzrlib/selftest/testrevisionnamespaces.py => bzrlib/tests/test_revisionspec.py

bzrlib/selftest/teststore.py => bzrlib/tests/test_store.py

bzrlib/selftest/testtransport.py => bzrlib/tests/test_transport.py

bzrlib/selftest/whitebox.py => bzrlib/tests/test_whitebox.py

bzrlib/selftest/testworkingtree.py => bzrlib/tests/test_workingtree.py

bzrlib/transport/http.py => bzrlib/transport/http/__init__.py

bzrlib/ui.py => bzrlib/ui/__init__.py

bzrlib/xml5.py => bzrlib/xml8.py

bzrlib/xml.py => bzrlib/xml_serializer.py

HACKING => doc/en/developer-guide/HACKING.txt

tutorial.txt => doc/en/tutorials/tutorial.txt

files modified:
.bzrignore

.rsyncexclude

Makefile

NEWS

README

TODO

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

contrib/bash/bzr.simple

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/zsh/_bzr

setup.py *

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Indexing facilities."""

__all__ = [

'CombinedGraphIndex',

'GraphIndex',

'GraphIndexBuilder',

'GraphIndexPrefixAdapter',

'InMemoryGraphIndex',

]

from bisect import bisect_right

from cStringIO import StringIO

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import trace

from bzrlib.bisect_multi import bisect_multi_bytes

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

""")

from bzrlib import (

debug,

errors,

)

_HEADER_READV = (0, 200)

_OPTION_KEY_ELEMENTS = "key_elements="

_OPTION_LEN = "len="

_OPTION_NODE_REFS = "node_ref_lists="

_SIGNATURE = "Bazaar Graph Index 1\n"

_whitespace_re = re.compile('[\t\n\x0b\x0c\r\x00 ]')

_newline_null_re = re.compile('[\n\0]')

def _has_key_from_parent_map(self, key):

"""Check if this index has one key.

If it's possible to check for multiple keys at once through

calling get_parent_map that should be faster.

"""

return (key in self.get_parent_map([key]))

def _missing_keys_from_parent_map(self, keys):

return set(keys) - set(self.get_parent_map(keys))

class GraphIndexBuilder(object):

"""A builder that can build a GraphIndex.

The resulting graph has the structure:

_SIGNATURE OPTIONS NODES NEWLINE

_SIGNATURE := 'Bazaar Graph Index 1' NEWLINE

OPTIONS := 'node_ref_lists=' DIGITS NEWLINE

NODES := NODE*

NODE := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

KEY := Not-whitespace-utf8

ABSENT := 'a'

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

REFERENCE := DIGITS ; digits is the byte offset in the index of the

; referenced key.

VALUE := no-newline-no-null-bytes

"""

def __init__(self, reference_lists=0, key_elements=1):

"""Create a GraphIndex builder.

:param reference_lists: The number of node references lists for each

entry.

:param key_elements: The number of bytestrings in each key.

"""

self.reference_lists = reference_lists

self._keys = set()

# A dict of {key: (absent, ref_lists, value)}

self._nodes = {}

self._nodes_by_key = None

self._key_length = key_elements

100

self._optimize_for_size = False

101

self._combine_backing_indices = True

102

103

def _check_key(self, key):

104

"""Raise BadIndexKey if key is not a valid key for this index."""

105

if type(key) != tuple:

106

raise errors.BadIndexKey(key)

107

if self._key_length != len(key):

108

raise errors.BadIndexKey(key)

109

for element in key:

110

if not element or _whitespace_re.search(element) is not None:

111

raise errors.BadIndexKey(element)

112

113

def _external_references(self):

114

"""Return references that are not present in this index.

115

"""

116

keys = set()

117

refs = set()

118

# TODO: JAM 2008-11-21 This makes an assumption about how the reference

119

# lists are used. It is currently correct for pack-0.92 through

120

# 1.9, which use the node references (3rd column) second

121

# reference list as the compression parent. Perhaps this should

122

# be moved into something higher up the stack, since it

123

# makes assumptions about how the index is used.

124

if self.reference_lists > 1:

125

for node in self.iter_all_entries():

126

keys.add(node[1])

127

refs.update(node[3][1])

128

return refs - keys

129

else:

130

# If reference_lists == 0 there can be no external references, and

131

# if reference_lists == 1, then there isn't a place to store the

132

# compression parent

133

return set()

134

135

def _get_nodes_by_key(self):

136

if self._nodes_by_key is None:

137

nodes_by_key = {}

138

if self.reference_lists:

139

for key, (absent, references, value) in self._nodes.iteritems():

140

if absent:

141

continue

142

key_dict = nodes_by_key

143

for subkey in key[:-1]:

144

key_dict = key_dict.setdefault(subkey, {})

145

key_dict[key[-1]] = key, value, references

146

else:

147

for key, (absent, references, value) in self._nodes.iteritems():

148

if absent:

149

continue

150

key_dict = nodes_by_key

151

for subkey in key[:-1]:

152

key_dict = key_dict.setdefault(subkey, {})

153

key_dict[key[-1]] = key, value

154

self._nodes_by_key = nodes_by_key

155

return self._nodes_by_key

156

157

def _update_nodes_by_key(self, key, value, node_refs):

158

"""Update the _nodes_by_key dict with a new key.

159

160

For a key of (foo, bar, baz) create

161

_nodes_by_key[foo][bar][baz] = key_value

162

"""

163

if self._nodes_by_key is None:

164

return

165

key_dict = self._nodes_by_key

166

if self.reference_lists:

167

key_value = key, value, node_refs

168

else:

169

key_value = key, value

170

for subkey in key[:-1]:

171

key_dict = key_dict.setdefault(subkey, {})

172

key_dict[key[-1]] = key_value

173

174

def _check_key_ref_value(self, key, references, value):

175

"""Check that 'key' and 'references' are all valid.

176

177

:param key: A key tuple. Must conform to the key interface (be a tuple,

178

be of the right length, not have any whitespace or nulls in any key

179

element.)

180

:param references: An iterable of reference lists. Something like

181

[[(ref, key)], [(ref, key), (other, key)]]

182

:param value: The value associate with this key. Must not contain

183

newlines or null characters.

184

:return: (node_refs, absent_references)

185

node_refs basically a packed form of 'references' where all

186

iterables are tuples

187

absent_references reference keys that are not in self._nodes.

188

This may contain duplicates if the same key is

189

referenced in multiple lists.

190

"""

191

self._check_key(key)

192

if _newline_null_re.search(value) is not None:

193

raise errors.BadIndexValue(value)

194

if len(references) != self.reference_lists:

195

raise errors.BadIndexValue(references)

196

node_refs = []

197

absent_references = []

198

for reference_list in references:

199

for reference in reference_list:

200

# If reference *is* in self._nodes, then we know it has already

201

# been checked.

202

if reference not in self._nodes:

203

self._check_key(reference)

204

absent_references.append(reference)

205

node_refs.append(tuple(reference_list))

206

return tuple(node_refs), absent_references

207

208

def add_node(self, key, value, references=()):

209

"""Add a node to the index.

210

211

:param key: The key. keys are non-empty tuples containing

212

as many whitespace-free utf8 bytestrings as the key length

213

defined for this index.

214

:param references: An iterable of iterables of keys. Each is a

215

reference to another key.

216

:param value: The value to associate with the key. It may be any

217

bytes as long as it does not contain \0 or \n.

218

"""

219

(node_refs,

220

absent_references) = self._check_key_ref_value(key, references, value)

221

if key in self._nodes and self._nodes[key][0] != 'a':

222

raise errors.BadIndexDuplicateKey(key, self)

223

for reference in absent_references:

224

# There may be duplicates, but I don't think it is worth worrying

225

# about

226

self._nodes[reference] = ('a', (), '')

227

self._nodes[key] = ('', node_refs, value)

228

self._keys.add(key)

229

if self._nodes_by_key is not None and self._key_length > 1:

230

self._update_nodes_by_key(key, value, node_refs)

231

232

def finish(self):

233

lines = [_SIGNATURE]

234

lines.append(_OPTION_NODE_REFS + str(self.reference_lists) + '\n')

235

lines.append(_OPTION_KEY_ELEMENTS + str(self._key_length) + '\n')

236

lines.append(_OPTION_LEN + str(len(self._keys)) + '\n')

237

prefix_length = sum(len(x) for x in lines)

238

# references are byte offsets. To avoid having to do nasty

239

# polynomial work to resolve offsets (references to later in the

240

# file cannot be determined until all the inbetween references have

241

# been calculated too) we pad the offsets with 0's to make them be

242

# of consistent length. Using binary offsets would break the trivial

243

# file parsing.

244

# to calculate the width of zero's needed we do three passes:

245

# one to gather all the non-reference data and the number of references.

246

# one to pad all the data with reference-length and determine entry

247

# addresses.

248

# One to serialise.

249

250

# forward sorted by key. In future we may consider topological sorting,

251

# at the cost of table scans for direct lookup, or a second index for

252

# direct lookup

253

nodes = sorted(self._nodes.items())

254

# if we do not prepass, we don't know how long it will be up front.

255

expected_bytes = None

256

# we only need to pre-pass if we have reference lists at all.

257

if self.reference_lists:

258

key_offset_info = []

259

non_ref_bytes = prefix_length

260

total_references = 0

261

# TODO use simple multiplication for the constants in this loop.

262

for key, (absent, references, value) in nodes:

263

# record the offset known *so far* for this key:

264

# the non reference bytes to date, and the total references to

265

# date - saves reaccumulating on the second pass

266

key_offset_info.append((key, non_ref_bytes, total_references))

267

# key is literal, value is literal, there are 3 null's, 1 NL

268

# key is variable length tuple, \x00 between elements

269

non_ref_bytes += sum(len(element) for element in key)

270

if self._key_length > 1:

271

non_ref_bytes += self._key_length - 1

272

# value is literal bytes, there are 3 null's, 1 NL.

273

non_ref_bytes += len(value) + 3 + 1

274

# one byte for absent if set.

275

if absent:

276

non_ref_bytes += 1

277

elif self.reference_lists:

278

# (ref_lists -1) tabs

279

non_ref_bytes += self.reference_lists - 1

280

# (ref-1 cr's per ref_list)

281

for ref_list in references:

282

# how many references across the whole file?

283

total_references += len(ref_list)

284

# accrue reference separators

285

if ref_list:

286

non_ref_bytes += len(ref_list) - 1

287

# how many digits are needed to represent the total byte count?

288

digits = 1

289

possible_total_bytes = non_ref_bytes + total_references*digits

290

while 10 ** digits < possible_total_bytes:

291

digits += 1

292

possible_total_bytes = non_ref_bytes + total_references*digits

293

expected_bytes = possible_total_bytes + 1 # terminating newline

294

# resolve key addresses.

295

key_addresses = {}

296

for key, non_ref_bytes, total_references in key_offset_info:

297

key_addresses[key] = non_ref_bytes + total_references*digits

298

# serialise

299

format_string = '%%0%sd' % digits

300

for key, (absent, references, value) in nodes:

301

flattened_references = []

302

for ref_list in references:

303

ref_addresses = []

304

for reference in ref_list:

305

ref_addresses.append(format_string % key_addresses[reference])

306

flattened_references.append('\r'.join(ref_addresses))

307

string_key = '\x00'.join(key)

308

lines.append("%s\x00%s\x00%s\x00%s\n" % (string_key, absent,

309

'\t'.join(flattened_references), value))

310

lines.append('\n')

311

result = StringIO(''.join(lines))

312

if expected_bytes and len(result.getvalue()) != expected_bytes:

313

raise errors.BzrError('Failed index creation. Internal error:'

314

' mismatched output length and expected length: %d %d' %

315

(len(result.getvalue()), expected_bytes))

316

return result

317

318

def set_optimize(self, for_size=None, combine_backing_indices=None):

319

"""Change how the builder tries to optimize the result.

320

321

:param for_size: Tell the builder to try and make the index as small as

322

possible.

323

:param combine_backing_indices: If the builder spills to disk to save

324

memory, should the on-disk indices be combined. Set to True if you

325

are going to be probing the index, but to False if you are not. (If

326

you are not querying, then the time spent combining is wasted.)

327

:return: None

328

"""

329

# GraphIndexBuilder itself doesn't pay attention to the flag yet, but

330

# other builders do.

331

if for_size is not None:

332

self._optimize_for_size = for_size

333

if combine_backing_indices is not None:

334

self._combine_backing_indices = combine_backing_indices

335

336

337

class GraphIndex(object):

338

"""An index for data with embedded graphs.

339

340

The index maps keys to a list of key reference lists, and a value.

341

Each node has the same number of key reference lists. Each key reference

342

list can be empty or an arbitrary length. The value is an opaque NULL

343

terminated string without any newlines. The storage of the index is

344

hidden in the interface: keys and key references are always tuples of

345

bytestrings, never the internal representation (e.g. dictionary offsets).

346

347

It is presumed that the index will not be mutated - it is static data.

348

349

Successive iter_all_entries calls will read the entire index each time.

350

Additionally, iter_entries calls will read the index linearly until the

351

desired keys are found. XXX: This must be fixed before the index is

352

suitable for production use. :XXX

353

"""

354

355

def __init__(self, transport, name, size):

356

"""Open an index called name on transport.

357

358

:param transport: A bzrlib.transport.Transport.

359

:param name: A path to provide to transport API calls.

360

:param size: The size of the index in bytes. This is used for bisection

361

logic to perform partial index reads. While the size could be

362

obtained by statting the file this introduced an additional round

363

trip as well as requiring stat'able transports, both of which are

364

avoided by having it supplied. If size is None, then bisection

365

support will be disabled and accessing the index will just stream

366

all the data.

367

"""

368

self._transport = transport

369

self._name = name

370

# Becomes a dict of key:(value, reference-list-byte-locations) used by

371

# the bisection interface to store parsed but not resolved keys.

372

self._bisect_nodes = None

373

# Becomes a dict of key:(value, reference-list-keys) which are ready to

374

# be returned directly to callers.

375

self._nodes = None

376

# a sorted list of slice-addresses for the parsed bytes of the file.

377

# e.g. (0,1) would mean that byte 0 is parsed.

378

self._parsed_byte_map = []

379

# a sorted list of keys matching each slice address for parsed bytes

380

# e.g. (None, 'foo@bar') would mean that the first byte contained no

381

# key, and the end byte of the slice is the of the data for 'foo@bar'

382

self._parsed_key_map = []

383

self._key_count = None

384

self._keys_by_offset = None

385

self._nodes_by_key = None

386

self._size = size

387

# The number of bytes we've read so far in trying to process this file

388

self._bytes_read = 0

389

390

def __eq__(self, other):

391

"""Equal when self and other were created with the same parameters."""

392

return (

393

type(self) == type(other) and

394

self._transport == other._transport and

395

self._name == other._name and

396

self._size == other._size)

397

398

def __ne__(self, other):

399

return not self.__eq__(other)

400

401

def __repr__(self):

402

return "%s(%r)" % (self.__class__.__name__,

403

self._transport.abspath(self._name))

404

405

def _buffer_all(self, stream=None):

406

"""Buffer all the index data.

407

408

Mutates self._nodes and self.keys_by_offset.

409

"""

410

if self._nodes is not None:

411

# We already did this

412

return

413

if 'index' in debug.debug_flags:

414

mutter('Reading entire index %s', self._transport.abspath(self._name))

415

if stream is None:

416

stream = self._transport.get(self._name)

417

self._read_prefix(stream)

418

self._expected_elements = 3 + self._key_length

419

line_count = 0

420

# raw data keyed by offset

421

self._keys_by_offset = {}

422

# ready-to-return key:value or key:value, node_ref_lists

423

self._nodes = {}

424

self._nodes_by_key = None

425

trailers = 0

426

pos = stream.tell()

427

lines = stream.read().split('\n')

428

del lines[-1]

429

_, _, _, trailers = self._parse_lines(lines, pos)

430

for key, absent, references, value in self._keys_by_offset.itervalues():

431

if absent:

432

continue

433

# resolve references:

434

if self.node_ref_lists:

435

node_value = (value, self._resolve_references(references))

436

else:

437

node_value = value

438

self._nodes[key] = node_value

439

# cache the keys for quick set intersections

440

self._keys = set(self._nodes)

441

if trailers != 1:

442

# there must be one line - the empty trailer line.

443

raise errors.BadIndexData(self)

444

445

def external_references(self, ref_list_num):

446

"""Return references that are not present in this index.

447

"""

448

self._buffer_all()

449

if ref_list_num + 1 > self.node_ref_lists:

450

raise ValueError('No ref list %d, index has %d ref lists'

451

% (ref_list_num, self.node_ref_lists))

452

refs = set()

453

for key, (value, ref_lists) in self._nodes.iteritems():

454

ref_list = ref_lists[ref_list_num]

455

refs.update(ref_list)

456

return refs - self._keys

457

458

def _get_nodes_by_key(self):

459

if self._nodes_by_key is None:

460

nodes_by_key = {}

461

if self.node_ref_lists:

462

for key, (value, references) in self._nodes.iteritems():

463

key_dict = nodes_by_key

464

for subkey in key[:-1]:

465

key_dict = key_dict.setdefault(subkey, {})

466

key_dict[key[-1]] = key, value, references

467

else:

468

for key, value in self._nodes.iteritems():

469

key_dict = nodes_by_key

470

for subkey in key[:-1]:

471

key_dict = key_dict.setdefault(subkey, {})

472

key_dict[key[-1]] = key, value

473

self._nodes_by_key = nodes_by_key

474

return self._nodes_by_key

475

476

def iter_all_entries(self):

477

"""Iterate over all keys within the index.

478

479

:return: An iterable of (index, key, value) or (index, key, value, reference_lists).

480

The former tuple is used when there are no reference lists in the

481

index, making the API compatible with simple key:value index types.

482

There is no defined order for the result iteration - it will be in

483

the most efficient order for the index.

484

"""

485

if 'evil' in debug.debug_flags:

486

trace.mutter_callsite(3,

487

"iter_all_entries scales with size of history.")

488

if self._nodes is None:

489

self._buffer_all()

490

if self.node_ref_lists:

491

for key, (value, node_ref_lists) in self._nodes.iteritems():

492

yield self, key, value, node_ref_lists

493

else:

494

for key, value in self._nodes.iteritems():

495

yield self, key, value

496

497

def _read_prefix(self, stream):

498

signature = stream.read(len(self._signature()))

499

if not signature == self._signature():

500

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

501

options_line = stream.readline()

502

if not options_line.startswith(_OPTION_NODE_REFS):

503

raise errors.BadIndexOptions(self)

504

try:

505

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):-1])

506

except ValueError:

507

raise errors.BadIndexOptions(self)

508

options_line = stream.readline()

509

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

510

raise errors.BadIndexOptions(self)

511

try:

512

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):-1])

513

except ValueError:

514

raise errors.BadIndexOptions(self)

515

options_line = stream.readline()

516

if not options_line.startswith(_OPTION_LEN):

517

raise errors.BadIndexOptions(self)

518

try:

519

self._key_count = int(options_line[len(_OPTION_LEN):-1])

520

except ValueError:

521

raise errors.BadIndexOptions(self)

522

523

def _resolve_references(self, references):

524

"""Return the resolved key references for references.

525

526

References are resolved by looking up the location of the key in the

527

_keys_by_offset map and substituting the key name, preserving ordering.

528

529

:param references: An iterable of iterables of key locations. e.g.

530

[[123, 456], [123]]

531

:return: A tuple of tuples of keys.

532

"""

533

node_refs = []

534

for ref_list in references:

535

node_refs.append(tuple([self._keys_by_offset[ref][0] for ref in ref_list]))

536

return tuple(node_refs)

537

538

def _find_index(self, range_map, key):

539

"""Helper for the _parsed_*_index calls.

540

541

Given a range map - [(start, end), ...], finds the index of the range

542

in the map for key if it is in the map, and if it is not there, the

543

immediately preceeding range in the map.

544

"""

545

result = bisect_right(range_map, key) - 1

546

if result + 1 < len(range_map):

547

# check the border condition, it may be in result + 1

548

if range_map[result + 1][0] == key[0]:

549

return result + 1

550

return result

551

552

def _parsed_byte_index(self, offset):

553

"""Return the index of the entry immediately before offset.

554

555

e.g. if the parsed map has regions 0,10 and 11,12 parsed, meaning that

556

there is one unparsed byte (the 11th, addressed as[10]). then:

557

asking for 0 will return 0

558

asking for 10 will return 0

559

asking for 11 will return 1

560

asking for 12 will return 1

561

"""

562

key = (offset, 0)

563

return self._find_index(self._parsed_byte_map, key)

564

565

def _parsed_key_index(self, key):

566

"""Return the index of the entry immediately before key.

567

568

e.g. if the parsed map has regions (None, 'a') and ('b','c') parsed,

569

meaning that keys from None to 'a' inclusive, and 'b' to 'c' inclusive

570

have been parsed, then:

571

asking for '' will return 0

572

asking for 'a' will return 0

573

asking for 'b' will return 1

574

asking for 'e' will return 1

575

"""

576

search_key = (key, None)

577

return self._find_index(self._parsed_key_map, search_key)

578

579

def _is_parsed(self, offset):

580

"""Returns True if offset has been parsed."""

581

index = self._parsed_byte_index(offset)

582

if index == len(self._parsed_byte_map):

583

return offset < self._parsed_byte_map[index - 1][1]

584

start, end = self._parsed_byte_map[index]

585

return offset >= start and offset < end

586

587

def _iter_entries_from_total_buffer(self, keys):

588

"""Iterate over keys when the entire index is parsed."""

589

keys = keys.intersection(self._keys)

590

if self.node_ref_lists:

591

for key in keys:

592

value, node_refs = self._nodes[key]

593

yield self, key, value, node_refs

594

else:

595

for key in keys:

596

yield self, key, self._nodes[key]

597

598

def iter_entries(self, keys):

599

"""Iterate over keys within the index.

600

601

:param keys: An iterable providing the keys to be retrieved.

602

:return: An iterable as per iter_all_entries, but restricted to the

603

keys supplied. No additional keys will be returned, and every

604

key supplied that is in the index will be returned.

605

"""

606

keys = set(keys)

607

if not keys:

608

return []

609

if self._size is None and self._nodes is None:

610

self._buffer_all()

611

612

# We fit about 20 keys per minimum-read (4K), so if we are looking for

613

# more than 1/20th of the index its likely (assuming homogenous key

614

# spread) that we'll read the entire index. If we're going to do that,

615

# buffer the whole thing. A better analysis might take key spread into

616

# account - but B+Tree indices are better anyway.

617

# We could look at all data read, and use a threshold there, which will

618

# trigger on ancestry walks, but that is not yet fully mapped out.

619

if self._nodes is None and len(keys) * 20 > self.key_count():

620

self._buffer_all()

621

if self._nodes is not None:

622

return self._iter_entries_from_total_buffer(keys)

623

else:

624

return (result[1] for result in bisect_multi_bytes(

625

self._lookup_keys_via_location, self._size, keys))

626

627

def iter_entries_prefix(self, keys):

628

"""Iterate over keys within the index using prefix matching.

629

630

Prefix matching is applied within the tuple of a key, not to within

631

the bytestring of each key element. e.g. if you have the keys ('foo',

632

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

633

only the former key is returned.

634

635

WARNING: Note that this method currently causes a full index parse

636

unconditionally (which is reasonably appropriate as it is a means for

637

thunking many small indices into one larger one and still supplies

638

iter_all_entries at the thunk layer).

639

640

:param keys: An iterable providing the key prefixes to be retrieved.

641

Each key prefix takes the form of a tuple the length of a key, but

642

with the last N elements 'None' rather than a regular bytestring.

643

The first element cannot be 'None'.

644

:return: An iterable as per iter_all_entries, but restricted to the

645

keys with a matching prefix to those supplied. No additional keys

646

will be returned, and every match that is in the index will be

647

returned.

648

"""

649

keys = set(keys)

650

if not keys:

651

return

652

# load data - also finds key lengths

653

if self._nodes is None:

654

self._buffer_all()

655

if self._key_length == 1:

656

for key in keys:

657

# sanity check

658

if key[0] is None:

659

raise errors.BadIndexKey(key)

660

if len(key) != self._key_length:

661

raise errors.BadIndexKey(key)

662

if self.node_ref_lists:

663

value, node_refs = self._nodes[key]

664

yield self, key, value, node_refs

665

else:

666

yield self, key, self._nodes[key]

667

return

668

nodes_by_key = self._get_nodes_by_key()

669

for key in keys:

670

# sanity check

671

if key[0] is None:

672

raise errors.BadIndexKey(key)

673

if len(key) != self._key_length:

674

raise errors.BadIndexKey(key)

675

# find what it refers to:

676

key_dict = nodes_by_key

677

elements = list(key)

678

# find the subdict whose contents should be returned.

679

try:

680

while len(elements) and elements[0] is not None:

681

key_dict = key_dict[elements[0]]

682

elements.pop(0)

683

except KeyError:

684

# a non-existant lookup.

685

continue

686

if len(elements):

687

dicts = [key_dict]

688

while dicts:

689

key_dict = dicts.pop(-1)

690

# can't be empty or would not exist

691

item, value = key_dict.iteritems().next()

692

if type(value) == dict:

693

# push keys

694

dicts.extend(key_dict.itervalues())

695

else:

696

# yield keys

697

for value in key_dict.itervalues():

698

# each value is the key:value:node refs tuple

699

# ready to yield.

700

yield (self, ) + value

701

else:

702

# the last thing looked up was a terminal element

703

yield (self, ) + key_dict

704

705

def key_count(self):

706

"""Return an estimate of the number of keys in this index.

707

708

For GraphIndex the estimate is exact.

709

"""

710

if self._key_count is None:

711

self._read_and_parse([_HEADER_READV])

712

return self._key_count

713

714

def _lookup_keys_via_location(self, location_keys):

715

"""Public interface for implementing bisection.

716

717

If _buffer_all has been called, then all the data for the index is in

718

memory, and this method should not be called, as it uses a separate

719

cache because it cannot pre-resolve all indices, which buffer_all does

720

for performance.

721

722

:param location_keys: A list of location(byte offset), key tuples.

723

:return: A list of (location_key, result) tuples as expected by

724

bzrlib.bisect_multi.bisect_multi_bytes.

725

"""

726

# Possible improvements:

727

# - only bisect lookup each key once

728

# - sort the keys first, and use that to reduce the bisection window

729

# -----

730

# this progresses in three parts:

731

# read data

732

# parse it

733

# attempt to answer the question from the now in memory data.

734

# build the readv request

735

# for each location, ask for 800 bytes - much more than rows we've seen

736

# anywhere.

737

readv_ranges = []

738

for location, key in location_keys:

739

# can we answer from cache?

740

if self._bisect_nodes and key in self._bisect_nodes:

741

# We have the key parsed.

742

continue

743

index = self._parsed_key_index(key)

744

if (len(self._parsed_key_map) and

745

self._parsed_key_map[index][0] <= key and

746

(self._parsed_key_map[index][1] >= key or

747

# end of the file has been parsed

748

self._parsed_byte_map[index][1] == self._size)):

749

# the key has been parsed, so no lookup is needed even if its

750

# not present.

751

continue

752

# - if we have examined this part of the file already - yes

753

index = self._parsed_byte_index(location)

754

if (len(self._parsed_byte_map) and

755

self._parsed_byte_map[index][0] <= location and

756

self._parsed_byte_map[index][1] > location):

757

# the byte region has been parsed, so no read is needed.

758

continue

759

length = 800

760

if location + length > self._size:

761

length = self._size - location

762

# todo, trim out parsed locations.

763

if length > 0:

764

readv_ranges.append((location, length))

765

# read the header if needed

766

if self._bisect_nodes is None:

767

readv_ranges.append(_HEADER_READV)

768

self._read_and_parse(readv_ranges)

769

result = []

770

if self._nodes is not None:

771

# _read_and_parse triggered a _buffer_all because we requested the

772

# whole data range

773

for location, key in location_keys:

774

if key not in self._nodes: # not present

775

result.append(((location, key), False))

776

elif self.node_ref_lists:

777

value, refs = self._nodes[key]

778

result.append(((location, key),

779

(self, key, value, refs)))

780

else:

781

result.append(((location, key),

782

(self, key, self._nodes[key])))

783

return result

784

# generate results:

785

# - figure out <, >, missing, present

786

# - result present references so we can return them.

787

# keys that we cannot answer until we resolve references

788

pending_references = []

789

pending_locations = set()

790

for location, key in location_keys:

791

# can we answer from cache?

792

if key in self._bisect_nodes:

793

# the key has been parsed, so no lookup is needed

794

if self.node_ref_lists:

795

# the references may not have been all parsed.

796

value, refs = self._bisect_nodes[key]

797

wanted_locations = []

798

for ref_list in refs:

799

for ref in ref_list:

800

if ref not in self._keys_by_offset:

801

wanted_locations.append(ref)

802

if wanted_locations:

803

pending_locations.update(wanted_locations)

804

pending_references.append((location, key))

805

continue

806

result.append(((location, key), (self, key,

807

value, self._resolve_references(refs))))

808

else:

809

result.append(((location, key),

810

(self, key, self._bisect_nodes[key])))

811

continue

812

else:

813

# has the region the key should be in, been parsed?

814

index = self._parsed_key_index(key)

815

if (self._parsed_key_map[index][0] <= key and

816

(self._parsed_key_map[index][1] >= key or

817

# end of the file has been parsed

818

self._parsed_byte_map[index][1] == self._size)):

819

result.append(((location, key), False))

820

continue

821

# no, is the key above or below the probed location:

822

# get the range of the probed & parsed location

823

index = self._parsed_byte_index(location)

824

# if the key is below the start of the range, its below

825

if key < self._parsed_key_map[index][0]:

826

direction = -1

827

else:

828

direction = +1

829

result.append(((location, key), direction))

830

readv_ranges = []

831

# lookup data to resolve references

832

for location in pending_locations:

833

length = 800

834

if location + length > self._size:

835

length = self._size - location

836

# TODO: trim out parsed locations (e.g. if the 800 is into the

837

# parsed region trim it, and dont use the adjust_for_latency

838

# facility)

839

if length > 0:

840

readv_ranges.append((location, length))

841

self._read_and_parse(readv_ranges)

842

if self._nodes is not None:

843

# The _read_and_parse triggered a _buffer_all, grab the data and

844

# return it

845

for location, key in pending_references:

846

value, refs = self._nodes[key]

847

result.append(((location, key), (self, key, value, refs)))

848

return result

849

for location, key in pending_references:

850

# answer key references we had to look-up-late.

851

value, refs = self._bisect_nodes[key]

852

result.append(((location, key), (self, key,

853

value, self._resolve_references(refs))))

854

return result

855

856

def _parse_header_from_bytes(self, bytes):

857

"""Parse the header from a region of bytes.

858

859

:param bytes: The data to parse.

860

:return: An offset, data tuple such as readv yields, for the unparsed

861

data. (which may length 0).

862

"""

863

signature = bytes[0:len(self._signature())]

864

if not signature == self._signature():

865

raise errors.BadIndexFormatSignature(self._name, GraphIndex)

866

lines = bytes[len(self._signature()):].splitlines()

867

options_line = lines[0]

868

if not options_line.startswith(_OPTION_NODE_REFS):

869

raise errors.BadIndexOptions(self)

870

try:

871

self.node_ref_lists = int(options_line[len(_OPTION_NODE_REFS):])

872

except ValueError:

873

raise errors.BadIndexOptions(self)

874

options_line = lines[1]

875

if not options_line.startswith(_OPTION_KEY_ELEMENTS):

876

raise errors.BadIndexOptions(self)

877

try:

878

self._key_length = int(options_line[len(_OPTION_KEY_ELEMENTS):])

879

except ValueError:

880

raise errors.BadIndexOptions(self)

881

options_line = lines[2]

882

if not options_line.startswith(_OPTION_LEN):

883

raise errors.BadIndexOptions(self)

884

try:

885

self._key_count = int(options_line[len(_OPTION_LEN):])

886

except ValueError:

887

raise errors.BadIndexOptions(self)

888

# calculate the bytes we have processed

889

header_end = (len(signature) + len(lines[0]) + len(lines[1]) +

890

len(lines[2]) + 3)

891

self._parsed_bytes(0, None, header_end, None)

892

# setup parsing state

893

self._expected_elements = 3 + self._key_length

894

# raw data keyed by offset

895

self._keys_by_offset = {}

896

# keys with the value and node references

897

self._bisect_nodes = {}

898

return header_end, bytes[header_end:]

899

900

def _parse_region(self, offset, data):

901

"""Parse node data returned from a readv operation.

902

903

:param offset: The byte offset the data starts at.

904

:param data: The data to parse.

905

"""

906

# trim the data.

907

# end first:

908

end = offset + len(data)

909

high_parsed = offset

910

while True:

911

# Trivial test - if the current index's end is within the

912

# low-matching parsed range, we're done.

913

index = self._parsed_byte_index(high_parsed)

914

if end < self._parsed_byte_map[index][1]:

915

return

916

# print "[%d:%d]" % (offset, end), \

917

# self._parsed_byte_map[index:index + 2]

918

high_parsed, last_segment = self._parse_segment(

919

offset, data, end, index)

920

if last_segment:

921

return

922

923

def _parse_segment(self, offset, data, end, index):

924

"""Parse one segment of data.

925

926

:param offset: Where 'data' begins in the file.

927

:param data: Some data to parse a segment of.

928

:param end: Where data ends

929

:param index: The current index into the parsed bytes map.

930

:return: True if the parsed segment is the last possible one in the

931

range of data.

932

:return: high_parsed_byte, last_segment.

933

high_parsed_byte is the location of the highest parsed byte in this

934

segment, last_segment is True if the parsed segment is the last

935

possible one in the data block.

936

"""

937

# default is to use all data

938

trim_end = None

939

# accomodate overlap with data before this.

940

if offset < self._parsed_byte_map[index][1]:

941

# overlaps the lower parsed region

942

# skip the parsed data

943

trim_start = self._parsed_byte_map[index][1] - offset

944

# don't trim the start for \n

945

start_adjacent = True

946

elif offset == self._parsed_byte_map[index][1]:

947

# abuts the lower parsed region

948

# use all data

949

trim_start = None

950

# do not trim anything

951

start_adjacent = True

952

else:

953

# does not overlap the lower parsed region

954

# use all data

955

trim_start = None

956

# but trim the leading \n

957

start_adjacent = False

958

if end == self._size:

959

# lines up to the end of all data:

960

# use it all

961

trim_end = None

962

# do not strip to the last \n

963

end_adjacent = True

964

last_segment = True

965

elif index + 1 == len(self._parsed_byte_map):

966

# at the end of the parsed data

967

# use it all

968

trim_end = None

969

# but strip to the last \n

970

end_adjacent = False

971

last_segment = True

972

elif end == self._parsed_byte_map[index + 1][0]:

973

# buts up against the next parsed region

974

# use it all

975

trim_end = None

976

# do not strip to the last \n

977

end_adjacent = True

978

last_segment = True

979

elif end > self._parsed_byte_map[index + 1][0]:

980

# overlaps into the next parsed region

981

# only consider the unparsed data

982

trim_end = self._parsed_byte_map[index + 1][0] - offset

983

# do not strip to the last \n as we know its an entire record

984

end_adjacent = True

985

last_segment = end < self._parsed_byte_map[index + 1][1]

986

else:

987

# does not overlap into the next region

988

# use it all

989

trim_end = None

990

# but strip to the last \n

991

end_adjacent = False

992

last_segment = True

993

# now find bytes to discard if needed

994

if not start_adjacent:

995

# work around python bug in rfind

996

if trim_start is None:

997

trim_start = data.find('\n') + 1

998

else:

999

trim_start = data.find('\n', trim_start) + 1

1000

if not (trim_start != 0):

1001

raise AssertionError('no \n was present')

1002

# print 'removing start', offset, trim_start, repr(data[:trim_start])

1003

if not end_adjacent:

1004

# work around python bug in rfind

1005

if trim_end is None:

1006

trim_end = data.rfind('\n') + 1

1007

else:

1008

trim_end = data.rfind('\n', None, trim_end) + 1

1009

if not (trim_end != 0):

1010

raise AssertionError('no \n was present')

1011

# print 'removing end', offset, trim_end, repr(data[trim_end:])

1012

# adjust offset and data to the parseable data.

1013

trimmed_data = data[trim_start:trim_end]

1014

if not (trimmed_data):

1015

raise AssertionError('read unneeded data [%d:%d] from [%d:%d]'

1016

% (trim_start, trim_end, offset, offset + len(data)))

1017

if trim_start:

1018

offset += trim_start

1019

# print "parsing", repr(trimmed_data)

1020

# splitlines mangles the \r delimiters.. don't use it.

1021

lines = trimmed_data.split('\n')

1022

del lines[-1]

1023

pos = offset

1024

first_key, last_key, nodes, _ = self._parse_lines(lines, pos)

1025

for key, value in nodes:

1026

self._bisect_nodes[key] = value

1027

self._parsed_bytes(offset, first_key,

1028

offset + len(trimmed_data), last_key)

1029

return offset + len(trimmed_data), last_segment

1030

1031

def _parse_lines(self, lines, pos):

1032

key = None

1033

first_key = None

1034

trailers = 0

1035

nodes = []

1036

for line in lines:

1037

if line == '':

1038

# must be at the end

1039

if self._size:

1040

if not (self._size == pos + 1):

1041

raise AssertionError("%s %s" % (self._size, pos))

1042

trailers += 1

1043

continue

1044

elements = line.split('\0')

1045

if len(elements) != self._expected_elements:

1046

raise errors.BadIndexData(self)

1047

# keys are tuples. Each element is a string that may occur many

1048

# times, so we intern them to save space. AB, RC, 200807

1049

key = tuple([intern(element) for element in elements[:self._key_length]])

1050

if first_key is None:

1051

first_key = key

1052

absent, references, value = elements[-3:]

1053

ref_lists = []

1054

for ref_string in references.split('\t'):

1055

ref_lists.append(tuple([

1056

int(ref) for ref in ref_string.split('\r') if ref

1057

]))

1058

ref_lists = tuple(ref_lists)

1059

self._keys_by_offset[pos] = (key, absent, ref_lists, value)

1060

pos += len(line) + 1 # +1 for the \n

1061

if absent:

1062

continue

1063

if self.node_ref_lists:

1064

node_value = (value, ref_lists)

1065

else:

1066

node_value = value

1067

nodes.append((key, node_value))

1068

# print "parsed ", key

1069

return first_key, key, nodes, trailers

1070

1071

def _parsed_bytes(self, start, start_key, end, end_key):

1072

"""Mark the bytes from start to end as parsed.

1073

1074

Calling self._parsed_bytes(1,2) will mark one byte (the one at offset

1075

1) as parsed.

1076

1077

:param start: The start of the parsed region.

1078

:param end: The end of the parsed region.

1079

"""

1080

index = self._parsed_byte_index(start)

1081

new_value = (start, end)

1082

new_key = (start_key, end_key)

1083

if index == -1:

1084

# first range parsed is always the beginning.

1085

self._parsed_byte_map.insert(index, new_value)

1086

self._parsed_key_map.insert(index, new_key)

1087

return

1088

# four cases:

1089

# new region

1090

# extend lower region

1091

# extend higher region

1092

# combine two regions

1093

if (index + 1 < len(self._parsed_byte_map) and

1094

self._parsed_byte_map[index][1] == start and

1095

self._parsed_byte_map[index + 1][0] == end):

1096

# combine two regions

1097

self._parsed_byte_map[index] = (self._parsed_byte_map[index][0],

1098

self._parsed_byte_map[index + 1][1])

1099

self._parsed_key_map[index] = (self._parsed_key_map[index][0],

1100

self._parsed_key_map[index + 1][1])

1101

del self._parsed_byte_map[index + 1]

1102

del self._parsed_key_map[index + 1]

1103

elif self._parsed_byte_map[index][1] == start:

1104

# extend the lower entry

1105

self._parsed_byte_map[index] = (

1106

self._parsed_byte_map[index][0], end)

1107

self._parsed_key_map[index] = (

1108

self._parsed_key_map[index][0], end_key)

1109

elif (index + 1 < len(self._parsed_byte_map) and

1110

self._parsed_byte_map[index + 1][0] == end):

1111

# extend the higher entry

1112

self._parsed_byte_map[index + 1] = (

1113

start, self._parsed_byte_map[index + 1][1])

1114

self._parsed_key_map[index + 1] = (

1115

start_key, self._parsed_key_map[index + 1][1])

1116

else:

1117

# new entry

1118

self._parsed_byte_map.insert(index + 1, new_value)

1119

self._parsed_key_map.insert(index + 1, new_key)

1120

1121

def _read_and_parse(self, readv_ranges):

1122

"""Read the the ranges and parse the resulting data.

1123

1124

:param readv_ranges: A prepared readv range list.

1125

"""

1126

if not readv_ranges:

1127

return

1128

if self._nodes is None and self._bytes_read * 2 >= self._size:

1129

# We've already read more than 50% of the file and we are about to

1130

# request more data, just _buffer_all() and be done

1131

self._buffer_all()

1132

return

1133

1134

readv_data = self._transport.readv(self._name, readv_ranges, True,

1135

self._size)

1136

# parse

1137

for offset, data in readv_data:

1138

self._bytes_read += len(data)

1139

if offset == 0 and len(data) == self._size:

1140

# We read the whole range, most likely because the

1141

# Transport upcast our readv ranges into one long request

1142

# for enough total data to grab the whole index.

1143

self._buffer_all(StringIO(data))

1144

return

1145

if self._bisect_nodes is None:

1146

# this must be the start

1147

if not (offset == 0):

1148

raise AssertionError()

1149

offset, data = self._parse_header_from_bytes(data)

1150

# print readv_ranges, "[%d:%d]" % (offset, offset + len(data))

1151

self._parse_region(offset, data)

1152

1153

def _signature(self):

1154

"""The file signature for this index type."""

1155

return _SIGNATURE

1156

1157

def validate(self):

1158

"""Validate that everything in the index can be accessed."""

1159

# iter_all validates completely at the moment, so just do that.

1160

for node in self.iter_all_entries():

1161

pass

1162

1163

1164

class CombinedGraphIndex(object):

1165

"""A GraphIndex made up from smaller GraphIndices.

1166

1167

The backing indices must implement GraphIndex, and are presumed to be

1168

static data.

1169

1170

Queries against the combined index will be made against the first index,

1171

and then the second and so on. The order of index's can thus influence

1172

performance significantly. For example, if one index is on local disk and a

1173

second on a remote server, the local disk index should be before the other

1174

in the index list.

1175

"""

1176

1177

def __init__(self, indices, reload_func=None):

1178

"""Create a CombinedGraphIndex backed by indices.

1179

1180

:param indices: An ordered list of indices to query for data.

1181

:param reload_func: A function to call if we find we are missing an

1182

index. Should have the form reload_func() => True/False to indicate

1183

if reloading actually changed anything.

1184

"""

1185

self._indices = indices

1186

self._reload_func = reload_func

1187

1188

def __repr__(self):

1189

return "%s(%s)" % (

1190

self.__class__.__name__,

1191

', '.join(map(repr, self._indices)))

1192

1193

def get_parent_map(self, keys):

1194

"""See graph.StackedParentsProvider.get_parent_map"""

1195

search_keys = set(keys)

1196

if NULL_REVISION in search_keys:

1197

search_keys.discard(NULL_REVISION)

1198

found_parents = {NULL_REVISION:[]}

1199

else:

1200

found_parents = {}

1201

for index, key, value, refs in self.iter_entries(search_keys):

1202

parents = refs[0]

1203

if not parents:

1204

parents = (NULL_REVISION,)

1205

found_parents[key] = parents

1206

return found_parents

1207

1208

has_key = _has_key_from_parent_map

1209

1210

def insert_index(self, pos, index):

1211

"""Insert a new index in the list of indices to query.

1212

1213

:param pos: The position to insert the index.

1214

:param index: The index to insert.

1215

"""

1216

self._indices.insert(pos, index)

1217

1218

def iter_all_entries(self):

1219

"""Iterate over all keys within the index

1220

1221

Duplicate keys across child indices are presumed to have the same

1222

value and are only reported once.

1223

1224

:return: An iterable of (index, key, reference_lists, value).

1225

There is no defined order for the result iteration - it will be in

1226

the most efficient order for the index.

1227

"""

1228

seen_keys = set()

1229

while True:

1230

try:

1231

for index in self._indices:

1232

for node in index.iter_all_entries():

1233

if node[1] not in seen_keys:

1234

yield node

1235

seen_keys.add(node[1])

1236

return

1237

except errors.NoSuchFile:

1238

self._reload_or_raise()

1239

1240

def iter_entries(self, keys):

1241

"""Iterate over keys within the index.

1242

1243

Duplicate keys across child indices are presumed to have the same

1244

value and are only reported once.

1245

1246

:param keys: An iterable providing the keys to be retrieved.

1247

:return: An iterable of (index, key, reference_lists, value). There is no

1248

defined order for the result iteration - it will be in the most

1249

efficient order for the index.

1250

"""

1251

keys = set(keys)

1252

while True:

1253

try:

1254

for index in self._indices:

1255

if not keys:

1256

return

1257

for node in index.iter_entries(keys):

1258

keys.remove(node[1])

1259

yield node

1260

return

1261

except errors.NoSuchFile:

1262

self._reload_or_raise()

1263

1264

def iter_entries_prefix(self, keys):

1265

"""Iterate over keys within the index using prefix matching.

1266

1267

Duplicate keys across child indices are presumed to have the same

1268

value and are only reported once.

1269

1270

Prefix matching is applied within the tuple of a key, not to within

1271

the bytestring of each key element. e.g. if you have the keys ('foo',

1272

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1273

only the former key is returned.

1274

1275

:param keys: An iterable providing the key prefixes to be retrieved.

1276

Each key prefix takes the form of a tuple the length of a key, but

1277

with the last N elements 'None' rather than a regular bytestring.

1278

The first element cannot be 'None'.

1279

:return: An iterable as per iter_all_entries, but restricted to the

1280

keys with a matching prefix to those supplied. No additional keys

1281

will be returned, and every match that is in the index will be

1282

returned.

1283

"""

1284

keys = set(keys)

1285

if not keys:

1286

return

1287

seen_keys = set()

1288

while True:

1289

try:

1290

for index in self._indices:

1291

for node in index.iter_entries_prefix(keys):

1292

if node[1] in seen_keys:

1293

continue

1294

seen_keys.add(node[1])

1295

yield node

1296

return

1297

except errors.NoSuchFile:

1298

self._reload_or_raise()

1299

1300

def key_count(self):

1301

"""Return an estimate of the number of keys in this index.

1302

1303

For CombinedGraphIndex this is approximated by the sum of the keys of

1304

the child indices. As child indices may have duplicate keys this can

1305

have a maximum error of the number of child indices * largest number of

1306

keys in any index.

1307

"""

1308

while True:

1309

try:

1310

return sum((index.key_count() for index in self._indices), 0)

1311

except errors.NoSuchFile:

1312

self._reload_or_raise()

1313

1314

missing_keys = _missing_keys_from_parent_map

1315

1316

def _reload_or_raise(self):

1317

"""We just got a NoSuchFile exception.

1318

1319

Try to reload the indices, if it fails, just raise the current

1320

exception.

1321

"""

1322

if self._reload_func is None:

1323

raise

1324

exc_type, exc_value, exc_traceback = sys.exc_info()

1325

trace.mutter('Trying to reload after getting exception: %s',

1326

exc_value)

1327

if not self._reload_func():

1328

# We tried to reload, but nothing changed, so we fail anyway

1329

trace.mutter('_reload_func indicated nothing has changed.'

1330

' Raising original exception.')

1331

raise exc_type, exc_value, exc_traceback

1332

1333

def validate(self):

1334

"""Validate that everything in the index can be accessed."""

1335

while True:

1336

try:

1337

for index in self._indices:

1338

index.validate()

1339

return

1340

except errors.NoSuchFile:

1341

self._reload_or_raise()

1342

1343

1344

class InMemoryGraphIndex(GraphIndexBuilder):

1345

"""A GraphIndex which operates entirely out of memory and is mutable.

1346

1347

This is designed to allow the accumulation of GraphIndex entries during a

1348

single write operation, where the accumulated entries need to be immediately

1349

available - for example via a CombinedGraphIndex.

1350

"""

1351

1352

def add_nodes(self, nodes):

1353

"""Add nodes to the index.

1354

1355

:param nodes: An iterable of (key, node_refs, value) entries to add.

1356

"""

1357

if self.reference_lists:

1358

for (key, value, node_refs) in nodes:

1359

self.add_node(key, value, node_refs)

1360

else:

1361

for (key, value) in nodes:

1362

self.add_node(key, value)

1363

1364

def iter_all_entries(self):

1365

"""Iterate over all keys within the index

1366

1367

:return: An iterable of (index, key, reference_lists, value). There is no

1368

defined order for the result iteration - it will be in the most

1369

efficient order for the index (in this case dictionary hash order).

1370

"""

1371

if 'evil' in debug.debug_flags:

1372

trace.mutter_callsite(3,

1373

"iter_all_entries scales with size of history.")

1374

if self.reference_lists:

1375

for key, (absent, references, value) in self._nodes.iteritems():

1376

if not absent:

1377

yield self, key, value, references

1378

else:

1379

for key, (absent, references, value) in self._nodes.iteritems():

1380

if not absent:

1381

yield self, key, value

1382

1383

def iter_entries(self, keys):

1384

"""Iterate over keys within the index.

1385

1386

:param keys: An iterable providing the keys to be retrieved.

1387

:return: An iterable of (index, key, value, reference_lists). There is no

1388

defined order for the result iteration - it will be in the most

1389

efficient order for the index (keys iteration order in this case).

1390

"""

1391

keys = set(keys)

1392

if self.reference_lists:

1393

for key in keys.intersection(self._keys):

1394

node = self._nodes[key]

1395

if not node[0]:

1396

yield self, key, node[2], node[1]

1397

else:

1398

for key in keys.intersection(self._keys):

1399

node = self._nodes[key]

1400

if not node[0]:

1401

yield self, key, node[2]

1402

1403

def iter_entries_prefix(self, keys):

1404

"""Iterate over keys within the index using prefix matching.

1405

1406

Prefix matching is applied within the tuple of a key, not to within

1407

the bytestring of each key element. e.g. if you have the keys ('foo',

1408

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1409

only the former key is returned.

1410

1411

:param keys: An iterable providing the key prefixes to be retrieved.

1412

Each key prefix takes the form of a tuple the length of a key, but

1413

with the last N elements 'None' rather than a regular bytestring.

1414

The first element cannot be 'None'.

1415

:return: An iterable as per iter_all_entries, but restricted to the

1416

keys with a matching prefix to those supplied. No additional keys

1417

will be returned, and every match that is in the index will be

1418

returned.

1419

"""

1420

# XXX: To much duplication with the GraphIndex class; consider finding

1421

# a good place to pull out the actual common logic.

1422

keys = set(keys)

1423

if not keys:

1424

return

1425

if self._key_length == 1:

1426

for key in keys:

1427

# sanity check

1428

if key[0] is None:

1429

raise errors.BadIndexKey(key)

1430

if len(key) != self._key_length:

1431

raise errors.BadIndexKey(key)

1432

node = self._nodes[key]

1433

if node[0]:

1434

continue

1435

if self.reference_lists:

1436

yield self, key, node[2], node[1]

1437

else:

1438

yield self, key, node[2]

1439

return

1440

nodes_by_key = self._get_nodes_by_key()

1441

for key in keys:

1442

# sanity check

1443

if key[0] is None:

1444

raise errors.BadIndexKey(key)

1445

if len(key) != self._key_length:

1446

raise errors.BadIndexKey(key)

1447

# find what it refers to:

1448

key_dict = nodes_by_key

1449

elements = list(key)

1450

# find the subdict to return

1451

try:

1452

while len(elements) and elements[0] is not None:

1453

key_dict = key_dict[elements[0]]

1454

elements.pop(0)

1455

except KeyError:

1456

# a non-existant lookup.

1457

continue

1458

if len(elements):

1459

dicts = [key_dict]

1460

while dicts:

1461

key_dict = dicts.pop(-1)

1462

# can't be empty or would not exist

1463

item, value = key_dict.iteritems().next()

1464

if type(value) == dict:

1465

# push keys

1466

dicts.extend(key_dict.itervalues())

1467

else:

1468

# yield keys

1469

for value in key_dict.itervalues():

1470

yield (self, ) + value

1471

else:

1472

yield (self, ) + key_dict

1473

1474

def key_count(self):

1475

"""Return an estimate of the number of keys in this index.

1476

1477

For InMemoryGraphIndex the estimate is exact.

1478

"""

1479

return len(self._keys)

1480

1481

def validate(self):

1482

"""In memory index's have no known corruption at the moment."""

1483

1484

1485

class GraphIndexPrefixAdapter(object):

1486

"""An adapter between GraphIndex with different key lengths.

1487

1488

Queries against this will emit queries against the adapted Graph with the

1489

prefix added, queries for all items use iter_entries_prefix. The returned

1490

nodes will have their keys and node references adjusted to remove the

1491

prefix. Finally, an add_nodes_callback can be supplied - when called the

1492

nodes and references being added will have prefix prepended.

1493

"""

1494

1495

def __init__(self, adapted, prefix, missing_key_length,

1496

add_nodes_callback=None):

1497

"""Construct an adapter against adapted with prefix."""

1498

self.adapted = adapted

1499

self.prefix_key = prefix + (None,)*missing_key_length

1500

self.prefix = prefix

1501

self.prefix_len = len(prefix)

1502

self.add_nodes_callback = add_nodes_callback

1503

1504

def add_nodes(self, nodes):

1505

"""Add nodes to the index.

1506

1507

:param nodes: An iterable of (key, node_refs, value) entries to add.

1508

"""

1509

# save nodes in case its an iterator

1510

nodes = tuple(nodes)

1511

translated_nodes = []

1512

try:

1513

# Add prefix_key to each reference node_refs is a tuple of tuples,

1514

# so split it apart, and add prefix_key to the internal reference

1515

for (key, value, node_refs) in nodes:

1516

adjusted_references = (

1517

tuple(tuple(self.prefix + ref_node for ref_node in ref_list)

1518

for ref_list in node_refs))

1519

translated_nodes.append((self.prefix + key, value,

1520

adjusted_references))

1521

except ValueError:

1522

# XXX: TODO add an explicit interface for getting the reference list

1523

# status, to handle this bit of user-friendliness in the API more

1524

# explicitly.

1525

for (key, value) in nodes:

1526

translated_nodes.append((self.prefix + key, value))

1527

self.add_nodes_callback(translated_nodes)

1528

1529

def add_node(self, key, value, references=()):

1530

"""Add a node to the index.

1531

1532

:param key: The key. keys are non-empty tuples containing

1533

as many whitespace-free utf8 bytestrings as the key length

1534

defined for this index.

1535

:param references: An iterable of iterables of keys. Each is a

1536

reference to another key.

1537

:param value: The value to associate with the key. It may be any

1538

bytes as long as it does not contain \0 or \n.

1539

"""

1540

self.add_nodes(((key, value, references), ))

1541

1542

def _strip_prefix(self, an_iter):

1543

"""Strip prefix data from nodes and return it."""

1544

for node in an_iter:

1545

# cross checks

1546

if node[1][:self.prefix_len] != self.prefix:

1547

raise errors.BadIndexData(self)

1548

for ref_list in node[3]:

1549

for ref_node in ref_list:

1550

if ref_node[:self.prefix_len] != self.prefix:

1551

raise errors.BadIndexData(self)

1552

yield node[0], node[1][self.prefix_len:], node[2], (

1553

tuple(tuple(ref_node[self.prefix_len:] for ref_node in ref_list)

1554

for ref_list in node[3]))

1555

1556

def iter_all_entries(self):

1557

"""Iterate over all keys within the index

1558

1559

iter_all_entries is implemented against the adapted index using

1560

iter_entries_prefix.

1561

1562

:return: An iterable of (index, key, reference_lists, value). There is no

1563

defined order for the result iteration - it will be in the most

1564

efficient order for the index (in this case dictionary hash order).

1565

"""

1566

return self._strip_prefix(self.adapted.iter_entries_prefix([self.prefix_key]))

1567

1568

def iter_entries(self, keys):

1569

"""Iterate over keys within the index.

1570

1571

:param keys: An iterable providing the keys to be retrieved.

1572

:return: An iterable of (index, key, value, reference_lists). There is no

1573

defined order for the result iteration - it will be in the most

1574

efficient order for the index (keys iteration order in this case).

1575

"""

1576

return self._strip_prefix(self.adapted.iter_entries(

1577

self.prefix + key for key in keys))

1578

1579

def iter_entries_prefix(self, keys):

1580

"""Iterate over keys within the index using prefix matching.

1581

1582

Prefix matching is applied within the tuple of a key, not to within

1583

the bytestring of each key element. e.g. if you have the keys ('foo',

1584

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

1585

only the former key is returned.

1586

1587

:param keys: An iterable providing the key prefixes to be retrieved.

1588

Each key prefix takes the form of a tuple the length of a key, but

1589

with the last N elements 'None' rather than a regular bytestring.

1590

The first element cannot be 'None'.

1591

:return: An iterable as per iter_all_entries, but restricted to the

1592

keys with a matching prefix to those supplied. No additional keys

1593

will be returned, and every match that is in the index will be

1594

returned.

1595

"""

1596

return self._strip_prefix(self.adapted.iter_entries_prefix(

1597

self.prefix + key for key in keys))

1598

1599

def key_count(self):

1600

"""Return an estimate of the number of keys in this index.

1601

1602

For GraphIndexPrefixAdapter this is relatively expensive - key

1603

iteration with the prefix is done.

1604

"""

1605

return len(list(self.iter_all_entries()))

1606

1607

def validate(self):

1608

"""Call the adapted's validate."""

1609

self.adapted.validate()

Older »