~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/btree_index.py

Committer: John Arbash Meinel
Date: 2009-10-30 14:07:31 UTC
mto: (4634.93.1 2.0.2)
mto: This revision was merged to the branch mainline in revision 4782.
Revision ID: john@arbash-meinel.com-20091030140731-sjv0pr90ffvuqjst

Update the download location registered with pypi.

files added:
BRANCH.TODO

COPYING.txt

INSTALL

bzr.ico

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/annotate.py

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/doc_generate/sphinx_conf.py

bzrlib/email_message.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/binary.patch

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave_commands.py

bzrlib/win32utils.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

doc/Bazaar-Logo-For-Manuals.png

doc/default.css

doc/developers

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/conf.py

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/implementation-notes.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/miscellaneous-notes.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/process.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/Makefile

doc/en/_static

doc/en/_static/bzr icon 16.png

doc/en/_static/bzr.ico

doc/en/_static/en

doc/en/_static/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.pdf

doc/en/_static/en/bzr-en-quick-reference.png

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/conf.py

doc/en/index.txt

doc/en/make.bat

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_static/es/Makefile

doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/_static/es/bzr-es-quick-reference.png

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/index.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/index.txt

doc/es/user-guide

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/news-template.txt

doc/ru

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_static/ru/Makefile

doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/index.txt

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/index.txt

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/generate_docs.py

tools/generate_release_notes.py

tools/package_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/trace-revisions

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
build-api

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/selftest/testremotebranch.py

bzrlib/store/compressed_text.py

bzrlib/upgrade.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

testsweet.py

files renamed:
bzrlib/changeset.py => bzrlib/bundle/__init__.py

bzrlib/graph.py => bzrlib/deprecated_graph.py

bzr-man.py => bzrlib/doc_generate/autodoc_man.py

bzrlib/selftest/ => bzrlib/tests/

bzrlib/selftest/teststatus.py => bzrlib/tests/blackbox/test_status.py

bzrlib/selftest/blackbox.py => bzrlib/tests/blackbox/test_too_much.py

bzrlib/selftest/versioning.py => bzrlib/tests/blackbox/test_versioning.py

bzrlib/selftest/HTTPTestUtil.py => bzrlib/tests/http_utils.py

bzrlib/selftest/testbranch.py => bzrlib/tests/per_branch/test_branch.py

bzrlib/selftest/test_parent.py => bzrlib/tests/per_branch/test_parent.py

bzrlib/selftest/testgraph.py => bzrlib/tests/test_deprecated_graph.py

bzrlib/selftest/testdiff.py => bzrlib/tests/test_diff.py

bzrlib/selftest/testfetch.py => bzrlib/tests/test_fetch.py

bzrlib/selftest/testhashcache.py => bzrlib/tests/test_hashcache.py

bzrlib/selftest/testinv.py => bzrlib/tests/test_inv.py

bzrlib/selftest/testlog.py => bzrlib/tests/test_log.py

bzrlib/selftest/testmerge.py => bzrlib/tests/test_merge.py

bzrlib/selftest/testmerge3.py => bzrlib/tests/test_merge3.py

bzrlib/selftest/plugins.py => bzrlib/tests/test_plugins.py

bzrlib/selftest/testrevision.py => bzrlib/tests/test_revision.py

bzrlib/selftest/testrevisionnamespaces.py => bzrlib/tests/test_revisionspec.py

bzrlib/selftest/teststore.py => bzrlib/tests/test_store.py

bzrlib/selftest/testtransport.py => bzrlib/tests/test_transport.py

tools/testweave.py => bzrlib/tests/test_weave.py

bzrlib/selftest/whitebox.py => bzrlib/tests/test_whitebox.py

bzrlib/transport/http.py => bzrlib/transport/http/__init__.py

bzrlib/ui.py => bzrlib/ui/__init__.py

tools/history2weaves.py => bzrlib/upgrade.py

bzrlib/xml.py => bzrlib/xml_serializer.py

bzrlib/newinventory.py => contrib/newinventory.py

HACKING => doc/developers/HACKING.txt

tutorial.txt => doc/en/tutorials/tutorial.txt

files modified:
.bzrignore

.rsyncexclude

Makefile

NEWS

README

TODO

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_xml.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib/bash/bzr.simple

contrib/pwclient.full

contrib/pwk

contrib/zsh/_bzr

setup.py *

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/btree_index.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""B+Tree indices"""

from bisect import bisect_right

import math

import tempfile

import zlib

from bzrlib import (

chunk_writer,

debug,

errors,

fifo_cache,

index,

lru_cache,

osutils,

trace,

)

from bzrlib.index import _OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS, _OPTION_LEN

from bzrlib.transport import get_transport

# First line of every serialised B+Tree index file.
_BTSIGNATURE = "B+Tree Graph Index 2\n"

# Prefix of the header option line listing the node count of each row.
_OPTION_ROW_LENGTHS = "row_lengths="

# First line of a serialised leaf node / internal node respectively.
_LEAF_FLAG = "type=leaf\n"

_INTERNAL_FLAG = "type=internal\n"

# Prefix of the second line of an internal node; a node count follows it.
_INTERNAL_OFFSET = "offset="

# Bytes set aside in the first node of each row; the file header has to fit
# inside this space (see the check in BTreeBuilder._write_nodes).
_RESERVED_HEADER_BYTES = 120

# Size in bytes of one node (page) of the index.
_PAGE_SIZE = 4096

# 4K per page: 4MB - 1000 entries

_NODE_CACHE_SIZE = 1000

class _BuilderRow(object):

"""The stored state accumulated while writing out a row in the index.

:ivar spool: A temporary file used to accumulate nodes for this row

in the tree.

:ivar nodes: The count of nodes emitted so far.

"""

def __init__(self):

"""Create a _BuilderRow."""

self.nodes = 0

self.spool = tempfile.TemporaryFile()

self.writer = None

def finish_node(self, pad=True):

byte_lines, _, padding = self.writer.finish()

if self.nodes == 0:

# padded note:

self.spool.write("\x00" * _RESERVED_HEADER_BYTES)

skipped_bytes = 0

if not pad and padding:

del byte_lines[-1]

skipped_bytes = padding

self.spool.writelines(byte_lines)

remainder = (self.spool.tell() + skipped_bytes) % _PAGE_SIZE

if remainder != 0:

raise AssertionError("incorrect node length: %d, %d"

% (self.spool.tell(), remainder))

self.nodes += 1

self.writer = None

class _InternalBuilderRow(_BuilderRow):
    """Row state used while writing out the internal rows of the tree."""

    def finish_node(self, pad=True):
        """Close the open node; internal nodes must always be padded.

        :param pad: Must be true.
        :raises AssertionError: if pad is false.
        """
        if pad:
            _BuilderRow.finish_node(self)
            return
        raise AssertionError("Must pad internal nodes only.")

class _LeafBuilderRow(_BuilderRow):
    """The stored state accumulated while writing out the leaf row."""

class BTreeBuilder(index.GraphIndexBuilder):

"""A Builder for B+Tree based Graph indices.

100

The resulting graph has the structure:

101

102

_SIGNATURE OPTIONS NODES

103

_SIGNATURE := 'B+Tree Graph Index 2' NEWLINE

104

OPTIONS := REF_LISTS KEY_ELEMENTS LENGTH ROW_LENGTHS

105

REF_LISTS := 'node_ref_lists=' DIGITS NEWLINE

106

KEY_ELEMENTS := 'key_elements=' DIGITS NEWLINE

107

LENGTH := 'len=' DIGITS NEWLINE

108

ROW_LENGTHS := 'row_lengths=' DIGITS (COMMA DIGITS)* NEWLINE

109

NODES := NODE_COMPRESSED*

110

NODE_COMPRESSED:= COMPRESSED_BYTES{4096}

111

NODE_RAW := INTERNAL | LEAF

112

INTERNAL := INTERNAL_FLAG POINTERS

113

LEAF := LEAF_FLAG ROWS

114

KEY_ELEMENT := Not-whitespace-utf8

115

KEY := KEY_ELEMENT (NULL KEY_ELEMENT)*

116

ROWS := ROW*

117

ROW := KEY NULL ABSENT? NULL REFERENCES NULL VALUE NEWLINE

118

ABSENT := 'a'

119

REFERENCES := REFERENCE_LIST (TAB REFERENCE_LIST){node_ref_lists - 1}

120

REFERENCE_LIST := (REFERENCE (CR REFERENCE)*)?

121

REFERENCE := KEY

122

VALUE := no-newline-no-null-bytes

123

"""

124

125

def __init__(self, reference_lists=0, key_elements=1, spill_at=100000):
    """See GraphIndexBuilder.__init__.

    :param spill_at: Optional parameter controlling the maximum number
        of nodes that BTreeBuilder will hold in memory.
    """
    index.GraphIndexBuilder.__init__(
        self,
        reference_lists=reference_lists,
        key_elements=key_elements)
    # In-memory nodes, as a map of {key: (node_refs, value)}.
    self._nodes = {}
    # Built lazily by _get_nodes_by_key; None means "not built yet".
    self._nodes_by_key = None
    # Indices already spilled to disk; slots may hold None.
    self._backing_indices = []
    self._spill_at = spill_at
    self._optimize_for_size = False

140

141

def add_node(self, key, value, references=()):
    """Add a node to the index.

    Once the number of in-memory keys reaches the spill_at threshold the
    in-memory nodes are spilled to disk.

    :param key: The key. Keys are non-empty tuples containing as many
        whitespace-free utf8 bytestrings as the key length defined for
        this index.
    :param value: The value to associate with the key. It may be any
        bytes as long as it contains neither a NUL byte nor a newline.
    :param references: An iterable of iterables of keys. Each is a
        reference to another key.
    :raises errors.BadIndexDuplicateKey: if key is already held in memory.
    """
    # Absent references are of no interest here.
    node_refs, _absent = self._check_key_ref_value(key, references, value)
    nodes = self._nodes
    if key in nodes:
        raise errors.BadIndexDuplicateKey(key, self)
    nodes[key] = (node_refs, value)
    self._keys.add(key)
    if self._key_length > 1 and self._nodes_by_key is not None:
        # Keep the already-built prefix lookup structure up to date.
        self._update_nodes_by_key(key, value, node_refs)
    if len(self._keys) >= self._spill_at:
        self._spill_mem_keys_to_disk()

166

167

def _spill_mem_keys_to_disk(self):
    """Write the in memory keys down to disk to cap memory consumption.

    When combining is enabled, nodes already on disk are merged with the
    in-memory nodes so sorted order is preserved, using a powers-of-two
    scheme: the first spill writes a single index; the second merges the
    memory nodes with it into a 2x index and drops the first; the third
    writes a new single index next to the 2x one; the fourth merges memory
    with both into a 4x index; and so on.  When combining is disabled each
    spill is simply appended as a new backing index.
    """
    combining = self._combine_backing_indices
    if combining:
        spilled = self._spill_mem_keys_and_combine()
        new_backing_file, size, backing_pos = spilled
    else:
        new_backing_file, size = self._spill_mem_keys_without_combining()
    dir_path, base_name = osutils.split(new_backing_file.name)
    # The transport is not strictly needed: the index reads through the
    # _file object assigned just below.
    transport = get_transport(dir_path)
    new_backing = BTreeGraphIndex(transport, base_name, size)
    # GC will clean up the file
    new_backing._file = new_backing_file
    if combining:
        backing_indices = self._backing_indices
        if len(backing_indices) == backing_pos:
            backing_indices.append(None)
        backing_indices[backing_pos] = new_backing
        # Every slot before backing_pos was merged into the new index.
        for merged_pos in range(backing_pos):
            backing_indices[merged_pos] = None
    else:
        self._backing_indices.append(new_backing)
    # Start over with empty in-memory state.
    self._nodes_by_key = None
    self._nodes = {}
    self._keys = set()

203

204

def _spill_mem_keys_without_combining(self):
    """Write only the in-memory nodes to a new temporary index.

    :return: The (file, size) pair produced by _write_nodes.
    """
    mem_nodes = self._iter_mem_nodes()
    return self._write_nodes(mem_nodes, allow_optimize=False)

206

207

def _spill_mem_keys_and_combine(self):
    """Merge the in-memory nodes with the leading backing indices.

    Backing indices are taken from the front of the list up to, but not
    including, the first empty (None) slot.

    :return: (new_backing_file, size, backing_pos) where backing_pos is
        the index of the first empty slot, or the length of the backing
        list when no slot is empty.
    """
    streams = [self._iter_mem_nodes()]
    backing_pos = len(self._backing_indices)
    for slot, backing in enumerate(self._backing_indices):
        if backing is None:
            backing_pos = slot
            break
        streams.append(backing.iter_all_entries())
    merged = self._iter_smallest(streams)
    new_backing_file, size = self._write_nodes(merged, allow_optimize=False)
    return new_backing_file, size, backing_pos

220

221

def add_nodes(self, nodes):
    """Add nodes to the index.

    :param nodes: An iterable of entries to add: (key, value, node_refs)
        tuples when this index has reference lists, otherwise (key, value)
        tuples.
    """
    add = self.add_node
    if not self.reference_lists:
        for (key, value) in nodes:
            add(key, value)
        return
    for (key, value, node_refs) in nodes:
        add(key, value, node_refs)

232

233

def _iter_mem_nodes(self):

234

"""Iterate over the nodes held in memory."""

235

nodes = self._nodes

236

if self.reference_lists:

237

for key in sorted(nodes):

238

references, value = nodes[key]

239

yield self, key, value, references

240

else:

241

for key in sorted(nodes):

242

references, value = nodes[key]

243

yield self, key, value

244

245

def _iter_smallest(self, iterators_to_combine):

246

if len(iterators_to_combine) == 1:

247

for value in iterators_to_combine[0]:

248

yield value

249

return

250

current_values = []

251

for iterator in iterators_to_combine:

252

try:

253

current_values.append(iterator.next())

254

except StopIteration:

255

current_values.append(None)

256

last = None

257

while True:

258

# Decorate candidates with the value to allow 2.4's min to be used.

259

candidates = [(item[1][1], item) for item

260

in enumerate(current_values) if item[1] is not None]

261

if not len(candidates):

262

return

263

selected = min(candidates)

264

# undecorate back to (pos, node)

265

selected = selected[1]

266

if last == selected[1][1]:

267

raise errors.BadIndexDuplicateKey(last, self)

268

last = selected[1][1]

269

# Yield, with self as the index

270

yield (self,) + selected[1][1:]

271

pos = selected[0]

272

try:

273

current_values[pos] = iterators_to_combine[pos].next()

274

except StopIteration:

275

current_values[pos] = None

276

277

def _add_key(self, string_key, line, rows, allow_optimize=True):
    """Add a key to the current chunk.

    :param string_key: The key to add.
    :param line: The fully serialised key and value.
    :param rows: The list of builder rows; rows[-1] is the leaf row and
        the rows before it are internal rows.  A new row is inserted at
        position 0 when the tree has to grow in height.
    :param allow_optimize: If set to False, prevent setting the optimize
        flag when writing out. This is used by the _spill_mem_keys_to_disk
        functionality.
    :raises errors.BadIndexKey: if line does not fit even into an empty
        leaf node.
    """
    new_leaf = False
    if rows[-1].writer is None:
        # opening a new leaf chunk;
        new_leaf = True
        for pos, internal_row in enumerate(rows[:-1]):
            # flesh out any internal nodes that are needed to
            # preserve the height of the tree
            if internal_row.writer is None:
                length = _PAGE_SIZE
                if internal_row.nodes == 0:
                    length -= _RESERVED_HEADER_BYTES # padded
                if allow_optimize:
                    optimize_for_size = self._optimize_for_size
                else:
                    optimize_for_size = False
                internal_row.writer = chunk_writer.ChunkWriter(length, 0,
                    optimize_for_size=optimize_for_size)
                internal_row.writer.write(_INTERNAL_FLAG)
                internal_row.writer.write(_INTERNAL_OFFSET +
                    str(rows[pos + 1].nodes) + "\n")
        # add a new leaf
        length = _PAGE_SIZE
        if rows[-1].nodes == 0:
            length -= _RESERVED_HEADER_BYTES # padded
        # NOTE(review): allow_optimize is not consulted for the leaf writer
        # (nor for a new root row below) - confirm that this is intended.
        rows[-1].writer = chunk_writer.ChunkWriter(length,
            optimize_for_size=self._optimize_for_size)
        rows[-1].writer.write(_LEAF_FLAG)
    if rows[-1].writer.write(line):
        # this key did not fit in the node:
        if new_leaf:
            # The page was empty, so the line can never fit.  Retrying
            # would open another empty leaf and fail in the same way,
            # recursing without end; report the key instead.
            raise errors.BadIndexKey(string_key)
        rows[-1].finish_node()
        key_line = string_key + "\n"
        new_row = True
        for row in reversed(rows[:-1]):
            # Mark the start of the next node in the node above. If it
            # doesn't fit then propagate upwards until we find one that
            # it does fit into.
            if row.writer.write(key_line):
                row.finish_node()
            else:
                # We've found a node that can handle the pointer.
                new_row = False
                break
        # If we reached the current root without being able to mark the
        # division point, then we need a new root:
        if new_row:
            # We need a new row
            if 'index' in debug.debug_flags:
                trace.mutter('Inserting new global row.')
            new_row = _InternalBuilderRow()
            reserved_bytes = 0
            rows.insert(0, new_row)
            # As the first node of its row this will be prefixed with the
            # reserved header space, hence the reduced length.
            new_row.writer = chunk_writer.ChunkWriter(
                _PAGE_SIZE - _RESERVED_HEADER_BYTES,
                reserved_bytes,
                optimize_for_size=self._optimize_for_size)
            new_row.writer.write(_INTERNAL_FLAG)
            new_row.writer.write(_INTERNAL_OFFSET +
                str(rows[1].nodes - 1) + "\n")
            new_row.writer.write(key_line)
        self._add_key(string_key, line, rows, allow_optimize=allow_optimize)

345

346

def _write_nodes(self, node_iterator, allow_optimize=True):
    """Write node_iterator out as a B+Tree.

    :param node_iterator: An iterator of sorted nodes. Each node should
        match the output given by iter_all_entries.
    :param allow_optimize: If set to False, prevent setting the optimize
        flag when writing out. This is used by the _spill_mem_keys_to_disk
        functionality.
    :return: A (file, size) tuple: a handle, positioned at the start, for
        a named temporary file containing the B+Tree, and the number of
        bytes written to it.
    :raises AssertionError: if the header does not fit in the reserved
        space, or a non-leaf row copied an unexpected number of bytes.
    """
    # The index rows - rows[0] is the root, rows[1] is the layer under it
    # etc.
    rows = []
    key_count = 0
    self.row_lengths = []
    # Feed every node into the bottom row (rows[-1]); _add_key pushes the
    # key that did not fit a finished chunk up into the rows above.
    for node in node_iterator:
        if not rows:
            # First key triggers the first row
            rows.append(_LeafBuilderRow())
        key_count += 1
        string_key, line = _btree_serializer._flatten_node(
            node, self.reference_lists)
        self._add_key(string_key, line, rows, allow_optimize=allow_optimize)
    # Close the open node of each row, bottom-up; only leaf nodes may be
    # left unpadded.
    for row in reversed(rows):
        row.finish_node(pad=(type(row) != _LeafBuilderRow))
    result = tempfile.NamedTemporaryFile(prefix='bzr-index-')
    header = [
        _BTSIGNATURE,
        _OPTION_NODE_REFS + str(self.reference_lists) + '\n',
        _OPTION_KEY_ELEMENTS + str(self._key_length) + '\n',
        _OPTION_LEN + str(key_count) + '\n',
        ]
    row_lengths = [str(row.nodes) for row in rows]
    header.append(_OPTION_ROW_LENGTHS + ','.join(row_lengths) + '\n')
    result.writelines(header)
    position = sum([len(header_line) for header_line in header])
    if position > _RESERVED_HEADER_BYTES:
        raise AssertionError("Could not fit the header in the"
                             " reserved space: %d > %d"
                             % (position, _RESERVED_HEADER_BYTES))
    # write the rows out:
    for row in rows:
        spool = row.spool
        spool.flush()
        spool.seek(0)
        # The first node of a row is special: its spooled form starts with
        # the reserved blank space, which is skipped when copying.
        first_node = spool.read(_PAGE_SIZE)
        result.write(first_node[_RESERVED_HEADER_BYTES:])
        result.write("\x00" * (_RESERVED_HEADER_BYTES - position))
        position = 0 # Only the root row actually has an offset
        expected_len = (row.nodes - 1) * _PAGE_SIZE
        copied_len = osutils.pumpfile(spool, result)
        if copied_len != expected_len and type(row) != _LeafBuilderRow:
            raise AssertionError("Incorrect amount of data copied"
                                 " expected: %d, got: %d"
                                 % (expected_len, copied_len))
    result.flush()
    size = result.tell()
    result.seek(0)
    return result, size

418

419

def finish(self):
    """Finalise the index.

    :return: A file handle for a temporary file containing the nodes added
        to the index.
    """
    written = self._write_nodes(self.iter_all_entries())
    # _write_nodes also reports the size; only the file is returned here.
    return written[0]

426

427

def iter_all_entries(self):
    """Iterate over all keys within the index.

    :return: An iterable of (index, key, value, reference_lists) entries
        (the reference lists are left out when the index has none).  The
        in-memory nodes are produced in sorted key order; when backing
        indices exist their entries are merged in via _iter_smallest.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    # Doing serial rather than ordered would be faster; but this shouldn't
    # be getting called routinely anyway.
    streams = [self._iter_mem_nodes()]
    streams.extend([backing.iter_all_entries()
                    for backing in self._backing_indices
                    if backing is not None])
    if len(streams) != 1:
        return self._iter_smallest(streams)
    return streams[0]

446

447

def iter_entries(self, keys):

448

"""Iterate over keys within the index.

449

450

:param keys: An iterable providing the keys to be retrieved.

451

:return: An iterable of (index, key, value, reference_lists). There is no

452

defined order for the result iteration - it will be in the most

453

efficient order for the index (keys iteration order in this case).

454

"""

455

keys = set(keys)

456

local_keys = keys.intersection(self._keys)

457

if self.reference_lists:

458

for key in local_keys:

459

node = self._nodes[key]

460

yield self, key, node[1], node[0]

461

else:

462

for key in local_keys:

463

node = self._nodes[key]

464

yield self, key, node[1]

465

# Find things that are in backing indices that have not been handled

466

# yet.

467

if not self._backing_indices:

468

return # We won't find anything there either

469

# Remove all of the keys that we found locally

470

keys.difference_update(local_keys)

471

for backing in self._backing_indices:

472

if backing is None:

473

continue

474

if not keys:

475

return

476

for node in backing.iter_entries(keys):

477

keys.remove(node[1])

478

yield (self,) + node[1:]

479

480

def iter_entries_prefix(self, keys):

481

"""Iterate over keys within the index using prefix matching.

482

483

Prefix matching is applied within the tuple of a key, not to within

484

the bytestring of each key element. e.g. if you have the keys ('foo',

485

'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then

486

only the former key is returned.

487

488

:param keys: An iterable providing the key prefixes to be retrieved.

489

Each key prefix takes the form of a tuple the length of a key, but

490

with the last N elements 'None' rather than a regular bytestring.

491

The first element cannot be 'None'.

492

:return: An iterable as per iter_all_entries, but restricted to the

493

keys with a matching prefix to those supplied. No additional keys

494

will be returned, and every match that is in the index will be

495

returned.

496

"""

497

# XXX: To much duplication with the GraphIndex class; consider finding

498

# a good place to pull out the actual common logic.

499

keys = set(keys)

500

if not keys:

501

return

502

for backing in self._backing_indices:

503

if backing is None:

504

continue

505

for node in backing.iter_entries_prefix(keys):

506

yield (self,) + node[1:]

507

if self._key_length == 1:

508

for key in keys:

509

# sanity check

510

if key[0] is None:

511

raise errors.BadIndexKey(key)

512

if len(key) != self._key_length:

513

raise errors.BadIndexKey(key)

514

try:

515

node = self._nodes[key]

516

except KeyError:

517

continue

518

if self.reference_lists:

519

yield self, key, node[1], node[0]

520

else:

521

yield self, key, node[1]

522

return

523

for key in keys:

524

# sanity check

525

if key[0] is None:

526

raise errors.BadIndexKey(key)

527

if len(key) != self._key_length:

528

raise errors.BadIndexKey(key)

529

# find what it refers to:

530

key_dict = self._get_nodes_by_key()

531

elements = list(key)

532

# find the subdict to return

533

try:

534

while len(elements) and elements[0] is not None:

535

key_dict = key_dict[elements[0]]

536

elements.pop(0)

537

except KeyError:

538

# a non-existant lookup.

539

continue

540

if len(elements):

541

dicts = [key_dict]

542

while dicts:

543

key_dict = dicts.pop(-1)

544

# can't be empty or would not exist

545

item, value = key_dict.iteritems().next()

546

if type(value) == dict:

547

# push keys

548

dicts.extend(key_dict.itervalues())

549

else:

550

# yield keys

551

for value in key_dict.itervalues():

552

yield (self, ) + value

553

else:

554

yield (self, ) + key_dict

555

556

def _get_nodes_by_key(self):

557

if self._nodes_by_key is None:

558

nodes_by_key = {}

559

if self.reference_lists:

560

for key, (references, value) in self._nodes.iteritems():

561

key_dict = nodes_by_key

562

for subkey in key[:-1]:

563

key_dict = key_dict.setdefault(subkey, {})

564

key_dict[key[-1]] = key, value, references

565

else:

566

for key, (references, value) in self._nodes.iteritems():

567

key_dict = nodes_by_key

568

for subkey in key[:-1]:

569

key_dict = key_dict.setdefault(subkey, {})

570

key_dict[key[-1]] = key, value

571

self._nodes_by_key = nodes_by_key

572

return self._nodes_by_key

573

574

def key_count(self):

575

"""Return an estimate of the number of keys in this index.

576

577

For InMemoryGraphIndex the estimate is exact.

578

"""

579

return len(self._keys) + sum(backing.key_count() for backing in

580

self._backing_indices if backing is not None)

581

582

def validate(self):
    """Do nothing: in-memory indices have no known corruption modes."""
    return None

584

585

586

class _LeafNode(object):
    """A leaf node for a serialised B+Tree index.

    keys maps each key in the node to the rest of its parsed entry;
    min_key and max_key are the first and last keys of the parsed list
    (both None for an empty node).
    """

    __slots__ = ('keys', 'min_key', 'max_key')

    def __init__(self, bytes, key_length, ref_list_length):
        """Parse bytes to create a leaf node object."""
        # splitlines mangles the \r delimiters.. don't use it.
        key_list = _btree_serializer._parse_leaf_lines(
            bytes, key_length, ref_list_length)
        if not key_list:
            self.min_key = self.max_key = None
        else:
            self.min_key = key_list[0][0]
            self.max_key = key_list[-1][0]
        self.keys = dict(key_list)

602

603

604

class _InternalNode(object):

605

"""An internal node for a serialised B+Tree index."""

606

607

__slots__ = ('keys', 'offset')

608

609

def __init__(self, bytes):

610

"""Parse bytes to create an internal node object."""

611

# splitlines mangles the \r delimiters.. don't use it.

612

self.keys = self._parse_lines(bytes.split('\n'))

613

614

def _parse_lines(self, lines):

615

nodes = []

616

self.offset = int(lines[1][7:])

617

for line in lines[2:]:

618

if line == '':

619

break

620

nodes.append(tuple(map(intern, line.split('\0'))))

621

return nodes

622

623

624

class BTreeGraphIndex(object):

625

"""Access to nodes via the standard GraphIndex interface for B+Tree's.

626

627

Individual nodes are held in a LRU cache. This holds the root node in

628

memory except when very large walks are done.

629

"""

630

631

def __init__(self, transport, name, size, unlimited_cache=False):

632

"""Create a B+Tree index object on the index name.

633

634

:param transport: The transport to read data for the index from.

635

:param name: The file name of the index on transport.

636

:param size: Optional size of the index in bytes. This allows

637

compatibility with the GraphIndex API, as well as ensuring that

638

the initial read (to read the root node header) can be done

639

without over-reading even on empty indices, and on small indices

640

allows single-IO to read the entire index.

641

:param unlimited_cache: If set to True, then instead of using an

642

LRUCache with size _NODE_CACHE_SIZE, we will use a dict and always

643

cache all leaf nodes.

644

"""

645

self._transport = transport

646

self._name = name

647

self._size = size

648

self._file = None

649

self._recommended_pages = self._compute_recommended_pages()

650

self._root_node = None

651

# Default max size is 100,000 leave values

652

self._leaf_value_cache = None # lru_cache.LRUCache(100*1000)

653

if unlimited_cache:

654

self._leaf_node_cache = {}

655

self._internal_node_cache = {}

656

else:

657

self._leaf_node_cache = lru_cache.LRUCache(_NODE_CACHE_SIZE)

658

# We use a FIFO here just to prevent possible blowout. However, a

659

# 300k record btree has only 3k leaf nodes, and only 20 internal

660

# nodes. A value of 100 scales to ~100*100*100 = 1M records.

661

self._internal_node_cache = fifo_cache.FIFOCache(100)

662

self._key_count = None

663

self._row_lengths = None

664

self._row_offsets = None # Start of each row, [-1] is the end

665

666

def __eq__(self, other):

667

"""Equal when self and other were created with the same parameters."""

668

return (

669

type(self) == type(other) and

670

self._transport == other._transport and

671

self._name == other._name and

672

self._size == other._size)

673

674

def __ne__(self, other):

675

return not self.__eq__(other)

676

677

def _get_and_cache_nodes(self, nodes):

678

"""Read nodes and cache them in the lru.

679

680

The nodes list supplied is sorted and then read from disk, each node

681

being inserted it into the _node_cache.

682

683

Note: Asking for more nodes than the _node_cache can contain will

684

result in some of the results being immediately discarded, to prevent

685

this an assertion is raised if more nodes are asked for than are

686

cachable.

687

688

:return: A dict of {node_pos: node}

689

"""

690

found = {}

691

start_of_leaves = None

692

for node_pos, node in self._read_nodes(sorted(nodes)):

693

if node_pos == 0: # Special case

694

self._root_node = node

695

else:

696

if start_of_leaves is None:

697

start_of_leaves = self._row_offsets[-2]

698

if node_pos < start_of_leaves:

699

self._internal_node_cache[node_pos] = node

700

else:

701

self._leaf_node_cache[node_pos] = node

702

found[node_pos] = node

703

return found

704

705

def _compute_recommended_pages(self):
    """Express the transport's recommended read size in btree pages.

    The transport reports recommended_page_size() in bytes; the result is
    the number of _PAGE_SIZE pages needed to cover that many bytes,
    rounded up.

    :return: The page count as an int.
    """
    read_bytes = self._transport.recommended_page_size()
    page_bytes = float(_PAGE_SIZE)
    return int(math.ceil(read_bytes / page_bytes))

715

716

def _compute_total_pages_in_index(self):

717

"""How many pages are in the index.

718

719

If we have read the header we will use the value stored there.

720

Otherwise it will be computed based on the length of the index.

721

"""

722

if self._size is None:

723

raise AssertionError('_compute_total_pages_in_index should not be'

724

' called when self._size is None')

725

if self._root_node is not None:

726

# This is the number of pages as defined by the header

727

return self._row_offsets[-1]

728

# This is the number of pages as defined by the size of the index. They

729

# should be indentical.

730

total_pages = int(math.ceil(self._size / float(_PAGE_SIZE)))

731

return total_pages

732

733

def _expand_offsets(self, offsets):
    """Decide which extra pages to fetch along with the requested ones.

    The idea is that we always want to make big-enough requests (like 64kB
    for http), so that we don't waste round trips. Given the pages already
    cached and the pages about to be read, work out which other pages are
    worth reading in the same request.

    See also doc/developers/btree_index_prefetch.txt for more details.

    :param offsets: The offsets to be read
    :return: A list of offsets to download. When no expansion is done the
        offsets argument itself is returned.
    """
    def note(fmt, *args):
        # Trace only when the 'index' debug flag is set.
        if 'index' in debug.debug_flags:
            trace.mutter(fmt, *args)

    note('expanding: %s\toffsets: %s', self._name, offsets)

    if len(offsets) >= self._recommended_pages:
        # Already asking for more than enough; don't add more.
        note(' not expanding large request (%s >= %s)',
             len(offsets), self._recommended_pages)
        return offsets
    if self._size is None:
        # Without the size we don't know where the file ends.
        note(' not expanding without knowing index size')
        return offsets

    total_pages = self._compute_total_pages_in_index()
    cached_offsets = self._get_offsets_to_cached_pages()
    if total_pages - len(cached_offsets) <= self._recommended_pages:
        # A recommended-size read would cover the rest of the index, so
        # read whatever is left.
        if cached_offsets:
            expanded = [x for x in xrange(total_pages)
                        if x not in cached_offsets]
        else:
            expanded = range(total_pages)
        note(' reading all unread pages: %s', expanded)
        return expanded

    if self._root_node is None:
        # On the first read of the root node of a large index no other
        # pages are pre-read, because the likelihood of reading
        # interesting pages is very low. See
        # doc/developers/btree_index_prefetch.txt for a discussion, and a
        # possible implementation when we are guessing that the second
        # layer index is small.
        final_offsets = offsets
    elif len(cached_offsets) < len(self._row_lengths) and len(offsets) == 1:
        # Fewer pages are cached than the tree is deep and only one page
        # is wanted: reading just the root and one leaf does not justify
        # expansion. Once at least 2 nodes have been read we are probably
        # doing a search, and start expanding.
        note(' not expanding on first reads')
        return offsets
    else:
        final_offsets = self._expand_to_neighbors(offsets, cached_offsets,
                                                  total_pages)

    final_offsets = sorted(final_offsets)
    note('expanded: %s', final_offsets)
    return final_offsets

801

802

def _expand_to_neighbors(self, offsets, cached_offsets, total_pages):

803

"""Expand requests to neighbors until we have enough pages.

804

805

This is called from _expand_offsets after policy has determined that we

806

want to expand.

807

We only want to expand requests within a given layer. We cheat a little

808

bit and assume all requests will be in the same layer. This is true

809

given the current design, but if it changes this algorithm may perform

810

oddly.

811

812

:param offsets: requested offsets

813

:param cached_offsets: offsets for pages we currently have cached

814

:return: A set() of offsets after expansion

815

"""

816

final_offsets = set(offsets)

817

first = end = None

818

new_tips = set(final_offsets)

819

while len(final_offsets) < self._recommended_pages and new_tips:

820

next_tips = set()

821

for pos in new_tips:

822

if first is None:

823

first, end = self._find_layer_first_and_end(pos)

824

previous = pos - 1

825

if (previous > 0

826

and previous not in cached_offsets

827

and previous not in final_offsets

828

and previous >= first):

829

next_tips.add(previous)

830

after = pos + 1

831

if (after < total_pages

832

and after not in cached_offsets

833

and after not in final_offsets

834

and after < end):

835

next_tips.add(after)

836

# This would keep us from going bigger than

837

# recommended_pages by only expanding the first offsets.

838

# However, if we are making a 'wide' request, it is

839

# reasonable to expand all points equally.

840

# if len(final_offsets) > recommended_pages:

841

# break

842

final_offsets.update(next_tips)

843

new_tips = next_tips

844

return final_offsets

845

846

def external_references(self, ref_list_num):
    """Return the referenced keys that are not themselves in the index.

    Every entry of the index is visited; the references found in the
    requested reference list are collected and the keys that are present
    in the index are removed from them.

    :param ref_list_num: Which reference list of each entry to examine.
    :return: A set of keys.
    :raises ValueError: when the index has no such reference list.
    """
    if self._root_node is None:
        # The header has to be read before node_ref_lists is known.
        self._get_root_node()
    ref_list_total = self.node_ref_lists
    if ref_list_num + 1 > ref_list_total:
        raise ValueError('No ref list %d, index has %d ref lists'
                         % (ref_list_num, ref_list_total))
    present = set()
    referenced = set()
    for entry in self.iter_all_entries():
        present.add(entry[1])
        referenced.update(entry[3][ref_list_num])
    return referenced.difference(present)

858

859

def _find_layer_first_and_end(self, offset):

860

"""Find the start/stop nodes for the layer corresponding to offset.

861

862

:return: (first, end)

863

first is the first node in this layer

864

end is the first node of the next layer

865

"""

866

first = end = 0

867

for roffset in self._row_offsets:

868

first = end

869

end = roffset

870

if offset < roffset:

871

break

872

return first, end

873

874

def _get_offsets_to_cached_pages(self):

875

"""Determine what nodes we already have cached."""

876

cached_offsets = set(self._internal_node_cache.keys())

877

cached_offsets.update(self._leaf_node_cache.keys())

878

if self._root_node is not None:

879

cached_offsets.add(0)

880

return cached_offsets

881

882

def _get_root_node(self):

883

if self._root_node is None:

884

# We may not have a root node yet

885

self._get_internal_nodes([0])

886

return self._root_node

887

888

def _get_nodes(self, cache, node_indexes):

889

found = {}

890

needed = []

891

for idx in node_indexes:

892

if idx == 0 and self._root_node is not None:

893

found[0] = self._root_node

894

continue

895

try:

896

found[idx] = cache[idx]

897

except KeyError:

898

needed.append(idx)

899

if not needed:

900

return found

901

needed = self._expand_offsets(needed)

902

found.update(self._get_and_cache_nodes(needed))

903

return found

904

905

def _get_internal_nodes(self, node_indexes):

906

"""Get a node, from cache or disk.

907

908

After getting it, the node will be cached.

909

"""

910

return self._get_nodes(self._internal_node_cache, node_indexes)

911

912

def _cache_leaf_values(self, nodes):

913

"""Cache directly from key => value, skipping the btree."""

914

if self._leaf_value_cache is not None:

915

for node in nodes.itervalues():

916

for key, value in node.keys.iteritems():

917

if key in self._leaf_value_cache:

918

# Don't add the rest of the keys, we've seen this node

919

# before.

920

break

921

self._leaf_value_cache[key] = value

922

923

def _get_leaf_nodes(self, node_indexes):

924

"""Get a bunch of nodes, from cache or disk."""

925

found = self._get_nodes(self._leaf_node_cache, node_indexes)

926

self._cache_leaf_values(found)

927

return found

928

929

def iter_all_entries(self):
    """Iterate over all keys within the index.

    Entries are produced page by page, and in sorted key order within
    each page, so that this can be used for spilling index builds to
    disk.

    :return: An iterable of (index, key, value) or
        (index, key, value, reference_lists).
        The former tuple is used when there are no reference lists in the
        index, making the API compatible with simple key:value index
        types.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(3,
            "iter_all_entries scales with size of history.")
    if not self.key_count():
        return
    row_offsets = self._row_offsets
    if row_offsets[-1] == 1:
        # There is only the root node, and key_count() has read it.
        pages = [(0, self._root_node)]
    else:
        # The last row of the tree holds the leaves.
        leaf_pages = range(row_offsets[-2], row_offsets[-1])
        if leaf_pages == [0]:
            # Special case when we only have a root node, as we have
            # already read everything.
            pages = [(0, self._root_node)]
        else:
            pages = self._read_nodes(leaf_pages)
    with_refs = self.node_ref_lists
    for _, node in pages:
        for key, (value, refs) in sorted(node.keys.items()):
            if with_refs:
                yield (self, key, value, refs)
            else:
                yield (self, key, value)

971

972

@staticmethod
def _multi_bisect_right(in_keys, fixed_keys):
    """Find the positions where each 'in_key' would fit in fixed_keys.

    This is equivalent to doing "bisect_right" on each in_key into
    fixed_keys, and grouping the in_keys that land on the same position.
    Positions that receive no key do not appear in the result.

    :param in_keys: A sorted list of keys to match with fixed_keys
    :param fixed_keys: A sorted list of keys to match against
    :return: A list of (integer position, [key list]) tuples. For an
        empty fixed_keys, or a single in_key, the key list is the in_keys
        object that was passed in rather than a copy.
    """
    if not in_keys:
        return []
    if not fixed_keys:
        # no pointers in the fixed_keys list, which means everything must
        # fall to the left.
        return [(0, in_keys)]

    # TODO: Iterating both lists will generally take M + N steps
    #       Bisecting each key will generally take M * log2 N steps.
    #       If we had an efficient way to compare, we could pick the method
    #       based on which has the fewer number of steps.
    #       There is also the argument that bisect_right is a compiled
    #       function, so there is even more to be gained.
    # iter_steps = len(in_keys) + len(fixed_keys)
    # bisect_steps = len(in_keys) * math.log(len(fixed_keys), 2)
    if len(in_keys) == 1: # Bisect will always be faster for M = 1
        return [(bisect_right(fixed_keys, in_keys[0]), in_keys)]
    # elif bisect_steps < iter_steps:
    #     offsets = {}
    #     for key in in_keys:
    #         offsets.setdefault(bisect_right(fixed_keys, key),
    #                            []).append(key)
    #     return [(o, offsets[o]) for o in sorted(offsets)]

    # From here on both lists are walked in step, like a merge. Both are
    # known to be non-empty, so the two initial next() calls cannot fail.
    in_keys_iter = iter(in_keys)
    fixed_keys_iter = enumerate(fixed_keys)
    cur_in_key = in_keys_iter.next()
    cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()

    # Private exceptions used to leave the nested loops below, recording
    # which of the two sequences ran out first.
    class InputDone(Exception): pass
    class FixedDone(Exception): pass

    output = []
    cur_out = []

    # TODO: Another possibility is that rather than iterating on each side,
    #       we could use a combination of bisecting and iterating. For
    #       example, while cur_in_key < fixed_key, bisect to find its
    #       point, then iterate all matching keys, then bisect (restricted
    #       to only the remainder) for the next one, etc.
    try:
        while True:
            if cur_in_key < cur_fixed_key:
                # Start a group at the current fixed position. The tuple is
                # appended right away and cur_keys is filled in afterwards,
                # so the group is already in output if the input runs out.
                cur_keys = []
                cur_out = (cur_fixed_offset, cur_keys)
                output.append(cur_out)
                while cur_in_key < cur_fixed_key:
                    cur_keys.append(cur_in_key)
                    try:
                        cur_in_key = in_keys_iter.next()
                    except StopIteration:
                        raise InputDone
                # At this point cur_in_key must be >= cur_fixed_key
            # step the cur_fixed_key until we pass the cur key, or walk off
            # the end
            while cur_in_key >= cur_fixed_key:
                try:
                    cur_fixed_offset, cur_fixed_key = fixed_keys_iter.next()
                except StopIteration:
                    raise FixedDone
    except InputDone:
        # We consumed all of the input, nothing more to do
        pass
    except FixedDone:
        # There was some input left, but we consumed all of fixed, so we
        # have to add one more for the tail. cur_in_key has been taken off
        # the iterator but not yet placed, so it leads the tail group.
        cur_keys = [cur_in_key]
        cur_keys.extend(in_keys_iter)
        cur_out = (len(fixed_keys), cur_keys)
        output.append(cur_out)
    return output

1053

1054

def _walk_through_internal_nodes(self, keys):

1055

"""Take the given set of keys, and find the corresponding LeafNodes.

1056

1057

:param keys: An unsorted iterable of keys to search for

1058

:return: (nodes, index_and_keys)

1059

nodes is a dict mapping {index: LeafNode}

1060

keys_at_index is a list of tuples of [(index, [keys for Leaf])]

1061

"""

1062

# 6 seconds spent in miss_torture using the sorted() line.

1063

# Even with out of order disk IO it seems faster not to sort it when

1064

# large queries are being made.

1065

keys_at_index = [(0, sorted(keys))]

1066

1067

for row_pos, next_row_start in enumerate(self._row_offsets[1:-1]):

1068

node_indexes = [idx for idx, s_keys in keys_at_index]

1069

nodes = self._get_internal_nodes(node_indexes)

1070

1071

next_nodes_and_keys = []

1072

for node_index, sub_keys in keys_at_index:

1073

node = nodes[node_index]

1074

positions = self._multi_bisect_right(sub_keys, node.keys)

1075

node_offset = next_row_start + node.offset

1076

next_nodes_and_keys.extend([(node_offset + pos, s_keys)

1077

for pos, s_keys in positions])

1078

keys_at_index = next_nodes_and_keys

1079

# We should now be at the _LeafNodes

1080

node_indexes = [idx for idx, s_keys in keys_at_index]

1081

1082

# TODO: We may *not* want to always read all the nodes in one

1083

# big go. Consider setting a max size on this.

1084

nodes = self._get_leaf_nodes(node_indexes)

1085

return nodes, keys_at_index

1086

1087

def iter_entries(self, keys):
    """Iterate over keys within the index.

    :param keys: An iterable providing the keys to be retrieved.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys supplied. No additional keys will be returned, and every
        key supplied that is in the index will be returned exactly once.
    """
    # The multi-way bisecting done while walking the tree needs the keys
    # in sorted order; _walk_through_internal_nodes sorts them, so only
    # de-duplication is done here.
    keys = frozenset(keys)
    if not keys:
        return

    if not self.key_count():
        return

    if self._leaf_value_cache is None:
        needed_keys = keys
    else:
        # Answer what we can straight from the key => value cache and only
        # walk the tree for the keys that are not cached. (Previously the
        # list of misses was overwritten with the full key set, so cached
        # keys were looked up again and yielded twice.)
        needed_keys = []
        for key in keys:
            value = self._leaf_value_cache.get(key, None)
            if value is not None:
                # Cache hit: yield it without touching the btree.
                value, refs = value
                if self.node_ref_lists:
                    yield (self, key, value, refs)
                else:
                    yield (self, key, value)
            else:
                needed_keys.append(key)

    if not needed_keys:
        return
    nodes, nodes_and_keys = self._walk_through_internal_nodes(needed_keys)
    for node_index, sub_keys in nodes_and_keys:
        if not sub_keys:
            continue
        node = nodes[node_index]
        for next_sub_key in sub_keys:
            # Keys that are not on the leaf they were routed to are not in
            # the index at all and are silently skipped.
            if next_sub_key in node.keys:
                value, refs = node.keys[next_sub_key]
                if self.node_ref_lists:
                    yield (self, next_sub_key, value, refs)
                else:
                    yield (self, next_sub_key, value)

1142

1143

def _find_ancestors(self, keys, ref_list_num, parent_map, missing_keys):

1144

"""Find the parent_map information for the set of keys.

1145

1146

This populates the parent_map dict and missing_keys set based on the

1147

queried keys. It also can fill out an arbitrary number of parents that

1148

it finds while searching for the supplied keys.

1149

1150

It is unlikely that you want to call this directly. See

1151

"CombinedGraphIndex.find_ancestry()" for a more appropriate API.

1152

1153

:param keys: A keys whose ancestry we want to return

1154

Every key will either end up in 'parent_map' or 'missing_keys'.

1155

:param ref_list_num: This index in the ref_lists is the parents we

1156

care about.

1157

:param parent_map: {key: parent_keys} for keys that are present in this

1158

index. This may contain more entries than were in 'keys', that are

1159

reachable ancestors of the keys requested.

1160

:param missing_keys: keys which are known to be missing in this index.

1161

This may include parents that were not directly requested, but we

1162

were able to determine that they are not present in this index.

1163

:return: search_keys parents that were found but not queried to know

1164

if they are missing or present. Callers can re-query this index for

1165

those keys, and they will be placed into parent_map or missing_keys

1166

"""

1167

if not self.key_count():

1168

# We use key_count() to trigger reading the root node and

1169

# determining info about this BTreeGraphIndex

1170

# If we don't have any keys, then everything is missing

1171

missing_keys.update(keys)

1172

return set()

1173

if ref_list_num >= self.node_ref_lists:

1174

raise ValueError('No ref list %d, index has %d ref lists'

1175

% (ref_list_num, self.node_ref_lists))

1176

1177

# The main trick we are trying to accomplish is that when we find a

1178

# key listing its parents, we expect that the parent key is also likely

1179

# to sit on the same page. Allowing us to expand parents quickly

1180

# without suffering the full stack of bisecting, etc.

1181

nodes, nodes_and_keys = self._walk_through_internal_nodes(keys)

1182

1183

# These are parent keys which could not be immediately resolved on the

1184

# page where the child was present. Note that we may already be

1185

# searching for that key, and it may actually be present [or known

1186

# missing] on one of the other pages we are reading.

1187

# TODO:

1188

# We could try searching for them in the immediate previous or next

1189

# page. If they occur "later" we could put them in a pending lookup

1190

# set, and then for each node we read thereafter we could check to

1191

# see if they are present.

1192

# However, we don't know the impact of keeping this list of things

1193

# that I'm going to search for every node I come across from here on

1194

# out.

1195

# It doesn't handle the case when the parent key is missing on a

1196

# page that we *don't* read. So we already have to handle being

1197

# re-entrant for that.

1198

# Since most keys contain a date string, they are more likely to be

1199

# found earlier in the file than later, but we would know that right

1200

# away (key < min_key), and wouldn't keep searching it on every other

1201

# page that we read.

1202

# Mostly, it is an idea, one which should be benchmarked.

1203

parents_not_on_page = set()

1204

1205

for node_index, sub_keys in nodes_and_keys:

1206

if not sub_keys:

1207

continue

1208

# sub_keys is all of the keys we are looking for that should exist

1209

# on this page, if they aren't here, then they won't be found

1210

node = nodes[node_index]

1211

node_keys = node.keys

1212

parents_to_check = set()

1213

for next_sub_key in sub_keys:

1214

if next_sub_key not in node_keys:

1215

# This one is just not present in the index at all

1216

missing_keys.add(next_sub_key)

1217

else:

1218

value, refs = node_keys[next_sub_key]

1219

parent_keys = refs[ref_list_num]

1220

parent_map[next_sub_key] = parent_keys

1221

parents_to_check.update(parent_keys)

1222

# Don't look for things we've already found

1223

parents_to_check = parents_to_check.difference(parent_map)

1224

# this can be used to test the benefit of having the check loop

1225

# inlined.

1226

# parents_not_on_page.update(parents_to_check)

1227

# continue

1228

while parents_to_check:

1229

next_parents_to_check = set()

1230

for key in parents_to_check:

1231

if key in node_keys:

1232

value, refs = node_keys[key]

1233

parent_keys = refs[ref_list_num]

1234

parent_map[key] = parent_keys

1235

next_parents_to_check.update(parent_keys)

1236

else:

1237

# This parent either is genuinely missing, or should be

1238

# found on another page. Perf test whether it is better

1239

# to check if this node should fit on this page or not.

1240

# in the 'everything-in-one-pack' scenario, this *not*

1241

# doing the check is 237ms vs 243ms.

1242

# So slightly better, but I assume the standard 'lots

1243

# of packs' is going to show a reasonable improvement

1244

# from the check, because it avoids 'going around

1245

# again' for everything that is in another index

1246

# parents_not_on_page.add(key)

1247

# Missing for some reason

1248

if key < node.min_key:

1249

# in the case of bzr.dev, 3.4k/5.3k misses are

1250

# 'earlier' misses (65%)

1251

parents_not_on_page.add(key)

1252

elif key > node.max_key:

1253

# This parent key would be present on a different

1254

# LeafNode

1255

parents_not_on_page.add(key)

1256

else:

1257

# assert key != node.min_key and key != node.max_key

1258

# If it was going to be present, it would be on

1259

# *this* page, so mark it missing.

1260

missing_keys.add(key)

1261

parents_to_check = next_parents_to_check.difference(parent_map)

1262

# Might want to do another .difference() from missing_keys

1263

# parents_not_on_page could have been found on a different page, or be

1264

# known to be missing. So cull out everything that has already been

1265

# found.

1266

search_keys = parents_not_on_page.difference(

1267

parent_map).difference(missing_keys)

1268

return search_keys

1269

1270

def iter_entries_prefix(self, keys):
    """Iterate over keys within the index using prefix matching.

    Prefix matching is applied within the tuple of a key, not to within
    the bytestring of each key element. e.g. if you have the keys ('foo',
    'bar'), ('foobar', 'gam') and do a prefix search for ('foo', None) then
    only the former key is returned.

    WARNING: Note that this method currently causes a full index parse
    unconditionally (which is reasonably appropriate as it is a means for
    thunking many small indices into one larger one and still supplies
    iter_all_entries at the thunk layer).

    :param keys: An iterable providing the key prefixes to be retrieved.
        Each key prefix takes the form of a tuple the length of a key, but
        with the last N elements 'None' rather than a regular bytestring.
        The first element cannot be 'None'.
    :return: An iterable as per iter_all_entries, but restricted to the
        keys with a matching prefix to those supplied. No additional keys
        will be returned, and every match that is in the index will be
        returned.
    :raises errors.BadIndexKey: when a prefix starts with None or does
        not have the index's key length. The prefixes are only checked
        one at a time while results are being produced, after the whole
        index has been loaded.
    """
    # De-duplicate the prefixes and process them in sorted order.
    keys = sorted(set(keys))
    if not keys:
        return
    # Load if needed to check key lengths
    if self._key_count is None:
        self._get_root_node()
    # TODO: only access nodes that can satisfy the prefixes we are looking
    # for. For now, to meet API usage (as this function is not used by
    # current bzrlib) just suck the entire index and iterate in memory.
    #
    # Two in-memory layouts are built, depending on the key length:
    #   nodes        - flat dict used for single-element keys
    #   nodes_by_key - nested dicts, one level per key element, used for
    #                  longer keys (only bound in that case)
    nodes = {}
    if self.node_ref_lists:
        if self._key_length == 1:
            for _1, key, value, refs in self.iter_all_entries():
                nodes[key] = value, refs
        else:
            nodes_by_key = {}
            for _1, key, value, refs in self.iter_all_entries():
                key_value = key, value, refs
                # For a key of (foo, bar, baz) create
                # _nodes_by_key[foo][bar][baz] = key_value
                key_dict = nodes_by_key
                for subkey in key[:-1]:
                    key_dict = key_dict.setdefault(subkey, {})
                key_dict[key[-1]] = key_value
    else:
        # Same as above, for an index whose entries carry no reference
        # lists.
        if self._key_length == 1:
            for _1, key, value in self.iter_all_entries():
                nodes[key] = value
        else:
            nodes_by_key = {}
            for _1, key, value in self.iter_all_entries():
                key_value = key, value
                # For a key of (foo, bar, baz) create
                # _nodes_by_key[foo][bar][baz] = key_value
                key_dict = nodes_by_key
                for subkey in key[:-1]:
                    key_dict = key_dict.setdefault(subkey, {})
                key_dict[key[-1]] = key_value
    if self._key_length == 1:
        # With single-element keys a valid prefix is a complete key, so
        # this is a plain lookup.
        for key in keys:
            # sanity check
            if key[0] is None:
                raise errors.BadIndexKey(key)
            if len(key) != self._key_length:
                raise errors.BadIndexKey(key)
            try:
                if self.node_ref_lists:
                    value, node_refs = nodes[key]
                    yield self, key, value, node_refs
                else:
                    yield self, key, nodes[key]
            except KeyError:
                # The key is not in the index; nothing to yield for it.
                pass
        return
    for key in keys:
        # sanity check
        if key[0] is None:
            raise errors.BadIndexKey(key)
        if len(key) != self._key_length:
            raise errors.BadIndexKey(key)
        # find what it refers to:
        key_dict = nodes_by_key
        elements = list(key)
        # find the subdict whose contents should be returned.
        try:
            # Descend one level per leading non-None element; whatever is
            # left in 'elements' afterwards is the wildcard tail.
            while len(elements) and elements[0] is not None:
                key_dict = key_dict[elements[0]]
                elements.pop(0)
        except KeyError:
            # a non-existant lookup.
            continue
        if len(elements):
            # Wildcard tail: yield every entry found beneath key_dict,
            # using 'dicts' as a stack of subtrees still to visit.
            dicts = [key_dict]
            while dicts:
                key_dict = dicts.pop(-1)
                # can't be empty or would not exist
                # Peek at one value to tell whether this level holds
                # further dicts or the stored entry tuples.
                item, value = key_dict.iteritems().next()
                if type(value) == dict:
                    # push keys
                    dicts.extend(key_dict.itervalues())
                else:
                    # yield keys
                    for value in key_dict.itervalues():
                        # each value is the key:value:node refs tuple
                        # ready to yield.
                        yield (self, ) + value
        else:
            # the last thing looked up was a terminal element
            yield (self, ) + key_dict

1381

1382

def key_count(self):
    """Return the number of keys in this index.

    For BTreeGraphIndex the figure is exact, as it is contained in the
    header. The root node is read first when the count is not yet known.
    """
    if self._key_count is not None:
        return self._key_count
    # Reading the root node is what fills in self._key_count.
    self._get_root_node()
    return self._key_count

1391

1392

def _compute_row_offsets(self):

1393

"""Fill out the _row_offsets attribute based on _row_lengths."""

1394

offsets = []

1395

row_offset = 0

1396

for row in self._row_lengths:

1397

offsets.append(row_offset)

1398

row_offset += row

1399

offsets.append(row_offset)

1400

self._row_offsets = offsets

1401

1402

def _parse_header_from_bytes(self, bytes):
    """Parse the index header found at the start of a region of bytes.

    The header is the format signature followed by four option lines,
    checked in this order against _OPTION_NODE_REFS, _OPTION_KEY_ELEMENTS,
    _OPTION_LEN and _OPTION_ROW_LENGTHS. The parsed values are stored on
    self as node_ref_lists, _key_length, _key_count and _row_lengths, and
    _row_offsets is recomputed from the row lengths.

    :param bytes: The data to parse, beginning with the signature.
    :return: An offset, data tuple such as readv yields, for the unparsed
        data (which may be of length 0).
    :raises BadIndexFormatSignature: if the data does not begin with the
        signature of this index type.
    :raises BadIndexOptions: if an option line does not start with its
        expected prefix, or its value cannot be parsed as an integer.
    """
    expected = self._signature()
    signature = bytes[0:len(expected)]
    if signature != expected:
        raise errors.BadIndexFormatSignature(self._name, BTreeGraphIndex)
    lines = bytes[len(expected):].splitlines()

    def option_text(position, prefix):
        # Return what follows 'prefix' on the given header line.
        line = lines[position]
        if not line.startswith(prefix):
            raise errors.BadIndexOptions(self)
        return line[len(prefix):]

    def int_option(position, prefix):
        # As option_text, but the remainder must be a single integer.
        text = option_text(position, prefix)
        try:
            return int(text)
        except ValueError:
            raise errors.BadIndexOptions(self)

    self.node_ref_lists = int_option(0, _OPTION_NODE_REFS)
    self._key_length = int_option(1, _OPTION_KEY_ELEMENTS)
    self._key_count = int_option(2, _OPTION_LEN)
    row_text = option_text(3, _OPTION_ROW_LENGTHS)
    try:
        # Empty fields (e.g. from a trailing comma) are ignored.
        self._row_lengths = [int(part) for part in row_text.split(',')
                             if part]
    except ValueError:
        raise errors.BadIndexOptions(self)
    self._compute_row_offsets()

    # Bytes consumed so far: the signature, the four option lines, and 4
    # more (one per option line, which splitlines() stripped).
    header_end = len(signature) + 4
    for line in lines[:4]:
        header_end += len(line)
    return header_end, bytes[header_end:]

1448

1449

def _read_nodes(self, nodes):
    """Read some nodes from disk, parse them and yield them to the caller.

    This is a generator, so nothing is read until it is iterated. The
    nodes are requested in the supplied order. If possible doing sort() on
    the list before requesting a read may improve performance.

    When node 0 is requested and the size of the index is not yet known
    (self._size is false), the whole file is fetched in one go, self._size
    is set from it, and every page of the file is parsed and yielded, not
    only the pages that were asked for.

    :param nodes: The nodes to read. 0 - first node, 1 - second node etc.
    :return: An iterator of (node_index, node) tuples, where node is a
        _LeafNode or an _InternalNode.
    :raises AssertionError: if a requested node starts beyond the end of
        the file, or a page does not start with a known node flag.
    """
    # may be the byte string of the whole file
    whole_file = None
    # list of (offset, length) regions of the file that should, eventually
    # be read in to data_ranges, either from 'whole_file' or from the
    # transport
    ranges = []
    for index in nodes:
        offset = index * _PAGE_SIZE
        size = _PAGE_SIZE
        if index == 0:
            # Root node - special case
            if self._size:
                size = min(_PAGE_SIZE, self._size)
            else:
                # The only case where we don't know the size, is for very
                # small indexes. So we read the whole thing
                whole_file = self._transport.get_bytes(self._name)
                self._size = len(whole_file)
                # the whole thing should be parsed out of 'whole_file'
                ranges.append((0, len(whole_file)))
                break
        else:
            if offset > self._size:
                raise AssertionError('tried to read past the end'
                                     ' of the file %s > %s'
                                     % (offset, self._size))
            size = min(size, self._size - offset)
        ranges.append((offset, size))
    if not ranges:
        return
    elif whole_file is not None:
        # already have the whole file, cut it into pages
        data_ranges = [(start, whole_file[start:start + _PAGE_SIZE])
                       for start in xrange(0, len(whole_file), _PAGE_SIZE)]
    elif self._file is None:
        data_ranges = self._transport.readv(self._name, ranges)
    else:
        # An open file object is available: read from it directly.
        data_ranges = []
        for offset, size in ranges:
            self._file.seek(offset)
            data_ranges.append((offset, self._file.read(size)))
    for offset, data in data_ranges:
        if offset == 0:
            # extract the header; 'offset' becomes the end of the header,
            # which still falls inside page 0.
            offset, data = self._parse_header_from_bytes(data)
            if len(data) == 0:
                continue
        node_bytes = zlib.decompress(data)
        if node_bytes.startswith(_LEAF_FLAG):
            node = _LeafNode(node_bytes, self._key_length,
                             self.node_ref_lists)
        elif node_bytes.startswith(_INTERNAL_FLAG):
            node = _InternalNode(node_bytes)
        else:
            raise AssertionError("Unknown node type for %r" % node_bytes)
        # Floor division keeps the page index an integer even under true
        # division.
        yield offset // _PAGE_SIZE, node

1514

1515

def _signature(self):
    """Return the signature that files of this index type start with.

    :return: The module level _BTSIGNATURE value.
    """
    return _BTSIGNATURE

1518

1519

def validate(self):
    """Check that the index can be accessed by reading and parsing nodes.

    The root node is fetched first. The node range passed to _read_nodes
    then runs from the start of the second row (self._row_offsets[1]) up to
    the last entry of self._row_offsets. Each node is discarded once
    parsed; any error raised while reading or parsing propagates to the
    caller.
    """
    self._get_root_node()
    # With a single row the range below is expected to be empty, so
    # nothing further should be read.
    first_node = 1
    if len(self._row_lengths) > 1:
        first_node = self._row_offsets[1]
    end_node = self._row_offsets[-1]
    # Just drain the generator: parsing each node is the validation.
    for _unused in self._read_nodes(range(first_node, end_node)):
        pass

1531

1532

1533

try:

1534

from bzrlib import _btree_serializer_pyx as _btree_serializer

1535

except ImportError:

1536

from bzrlib import _btree_serializer_py as _btree_serializer

Older »