~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/groupcompress.py

Committer: Canonical.com Patch Queue Manager
Date: 2009-08-28 13:16:40 UTC
mfrom: (4661.1.1 integration)
Revision ID: pqm@pqm.ubuntu.com-20090828131640-u1s6d7cvjj5qsuwk

(vila) Don't restrict the command name used to run the test suite

files added:
BRANCH.TODO

COPYING.txt

INSTALL

bzr.ico

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/annotate.py

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/deprecated_graph.py

bzrlib/diff-delta.c

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/email_message.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help_topics

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_interrepository

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/_bencode_py.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/simplemapi.py

bzrlib/util/tests

bzrlib/util/tests/__init__.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave_commands.py

bzrlib/win32utils.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

doc/BUILD-NOTES

doc/Makefile

doc/_static

doc/_static/bzr icon 16.png

doc/_static/bzr.ico

doc/_static/en

doc/_static/en/quick-reference

doc/_static/en/quick-reference/Makefile

doc/_static/en/quick-reference/bzr-quick-reference.pdf

doc/_static/en/quick-reference/bzr-quick-reference.png

doc/_static/en/quick-reference/bzr-quick-reference.svg

doc/_templates

doc/_templates/index.html

doc/_templates/layout.html

doc/bazaar-vcs.org.kid

doc/conf.py

doc/contents.txt

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/bundle-creation.txt

doc/developers/bundle-format4.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/gc.txt

doc/developers/groupcompress-design.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/indices.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/lca_tree_merging.txt

doc/developers/merge-scaling.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/uncommit.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/migration

doc/en/migration/index.txt

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/index.txt

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/index-for-2x.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/part2_intro.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/es

doc/es/developer-guide

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/quick-reference

doc/es/quick-reference/Makefile

doc/es/quick-reference/quick-start-summary.pdf

doc/es/quick-reference/quick-start-summary.png

doc/es/quick-reference/quick-start-summary.svg

doc/es/release-notes

doc/es/user-guide

doc/es/user-guide/index.txt

doc/es/user-guide/resolving_conflicts.txt

doc/es/user-guide/version_info.txt

doc/es/user-reference

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/make.bat

doc/news-template.txt

doc/ru

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/Makefile

doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/quick-reference/quick-start-summary.png

doc/ru/quick-reference/quick-start-summary.svg

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

man1

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/capture_tree.py

tools/check-newsbugs.py

tools/generate_docs.py

tools/package_mf.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/riodemo.py

tools/rst2html.py

tools/rst2pdf.py

tools/rst2prettyhtml.py

tools/time_graph.py

tools/trace-revisions

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/run_script.py

tools/win32/start_bzr.bat

files removed:
build-api

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/upgrade.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

testsweet.py

files renamed:
bzrlib/changeset.py => bzrlib/bundle/__init__.py

bzr-man.py => bzrlib/doc_generate/autodoc_man.py

bzrlib/store.py => bzrlib/store/__init__.py

bzrlib/weavestore.py => bzrlib/store/versioned/__init__.py

bzrlib/selftest/ => bzrlib/tests/

bzrlib/selftest/teststatus.py => bzrlib/tests/blackbox/test_status.py

bzrlib/selftest/blackbox.py => bzrlib/tests/blackbox/test_too_much.py

bzrlib/selftest/versioning.py => bzrlib/tests/blackbox/test_versioning.py

bzrlib/selftest/testbranch.py => bzrlib/tests/per_branch/test_branch.py

bzrlib/selftest/test_parent.py => bzrlib/tests/per_branch/test_parent.py

bzrlib/selftest/testdiff.py => bzrlib/tests/test_diff.py

bzrlib/selftest/testfetch.py => bzrlib/tests/test_fetch.py

bzrlib/selftest/testhashcache.py => bzrlib/tests/test_hashcache.py

bzrlib/selftest/testinv.py => bzrlib/tests/test_inv.py

bzrlib/selftest/testlog.py => bzrlib/tests/test_log.py

bzrlib/selftest/testmerge3.py => bzrlib/tests/test_merge3.py

bzrlib/selftest/plugins.py => bzrlib/tests/test_plugins.py

bzrlib/selftest/testrevision.py => bzrlib/tests/test_revision.py

bzrlib/selftest/testrevisionnamespaces.py => bzrlib/tests/test_revisionspec.py

bzrlib/selftest/teststore.py => bzrlib/tests/test_store.py

tools/testweave.py => bzrlib/tests/test_weave.py

bzrlib/selftest/whitebox.py => bzrlib/tests/test_whitebox.py

bzrlib/ui.py => bzrlib/ui/__init__.py

tools/history2weaves.py => bzrlib/upgrade.py

bzrlib/xml5.py => bzrlib/xml8.py

bzrlib/xml.py => bzrlib/xml_serializer.py

HACKING => doc/en/developer-guide/HACKING.txt

tutorial.txt => doc/en/tutorials/tutorial.txt

files modified:
.bzrignore

.rsyncexclude

Makefile

NEWS

README

TODO

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_xml.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib/bash/bzr.simple

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/zsh/_bzr

setup.py *

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/groupcompress.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Core compression logic for compressing streams of related files."""

import time

import zlib

try:

import pylzma

except ImportError:

pylzma = None

from bzrlib import (

annotate,

debug,

errors,

graph as _mod_graph,

knit,

osutils,

pack,

trace,

)

from bzrlib.btree_index import BTreeBuilder

from bzrlib.lru_cache import LRUSizeCache

from bzrlib.tsort import topo_sort

from bzrlib.versionedfile import (

adapter_registry,

AbsentContentFactory,

ChunkedContentFactory,

FulltextContentFactory,

VersionedFiles,

)

# Minimum number of uncompressed bytes to try to fetch at once when
# retrieving groupcompress blocks (2**16 == 64kB).
BATCH_SIZE = 2**16

# Whether new blocks are compressed with lzma instead of zlib.  The leading
# 'False' short-circuits the expression, so lzma output is disabled even when
# pylzma was imported successfully.
_USE_LZMA = False and (pylzma is not None)

# The sha1 of the empty string, i.e. osutils.sha_string('')
_null_sha1 = 'da39a3ee5e6b4b0d3255bfef95601890afd80709'

def sort_gc_optimal(parent_map):
    """Sort and group the keys in parent_map into groupcompress order.

    groupcompress is defined (currently) as reverse-topological order, grouped
    by the key prefix.

    :param parent_map: A dict mapping each key to its parents value. Keys are
        either plain strings or tuples; only tuple keys longer than one
        element contribute a prefix (their first element).
    :return: A sorted-list of keys
    """
    # groupcompress ordering is approximately reverse topological,
    # properly grouped by file-id.
    per_prefix_map = {}
    for key, value in parent_map.iteritems():
        if isinstance(key, str) or len(key) == 1:
            # Un-prefixed keys all share the empty prefix
            prefix = ''
        else:
            prefix = key[0]
        per_prefix_map.setdefault(prefix, {})[key] = value

    present_keys = []
    for prefix in sorted(per_prefix_map):
        # topo_sort() output is reversed so that, within a prefix, the result
        # is in reverse-topological order.
        present_keys.extend(reversed(topo_sort(per_prefix_map[prefix])))
    return present_keys

# The max zlib window size is 32kB, so if we set the 'max_size' output of the
# decompressor to the requested bytes + 32kB, then we should be guaranteed to
# get at least num_bytes coming out.
# GroupCompressBlock._ensure_content() adds this to every partial
# decompression request.
_ZLIB_DECOMP_WINDOW = 32*1024

class GroupCompressBlock(object):
    """An object which maintains the internal structure of the compressed data.

    This tracks the meta info (start of text, length, type, etc.)

    The payload can be held in up to three forms, each of which may be None:
    ``_content`` (a single uncompressed string), ``_content_chunks`` (a list
    of uncompressed strings) and ``_z_content`` (the compressed string).
    """

    # Group Compress Block v1 Zlib
    GCB_HEADER = 'gcb1z\n'
    # Group Compress Block v1 Lzma
    GCB_LZ_HEADER = 'gcb1l\n'
    GCB_KNOWN_HEADERS = (GCB_HEADER, GCB_LZ_HEADER)

    def __init__(self):
        # map by key? or just order in file?
        # 'zlib' or 'lzma' once the compressed form is known, else None
        self._compressor_name = None
        self._z_content = None
        # A zlib decompressobj while a partial decompression is in progress
        self._z_content_decompressor = None
        self._z_content_length = None
        self._content_length = None
        self._content = None
        self._content_chunks = None

    def __len__(self):
        """Return the uncompressed length plus the compressed length."""
        # This is the maximum number of bytes this object will reference if
        # everything is decompressed. However, if we decompress less than
        # everything... (this would cause some problems for LRUSizeCache)
        return self._content_length + self._z_content_length

    def _ensure_content(self, num_bytes=None):
        """Make sure that content has been expanded enough.

        :param num_bytes: Ensure that we have extracted at least num_bytes of
            content. If None, consume everything
        :raises AssertionError: if more than the known content length is
            requested, if there is nothing to decompress, if the compressor
            name is unknown, or if fewer bytes than requested are available.
        """
        # TODO: If we re-use the same content block at different times during
        #       get_record_stream(), it is possible that the first pass will
        #       get inserted, triggering an extract/_ensure_content() which
        #       will get rid of _z_content. And then the next use of the block
        #       will try to access _z_content (to send it over the wire), and
        #       fail because it is already extracted. Consider never releasing
        #       _z_content because of this.
        if num_bytes is None:
            # May still be None if the content length is not known yet
            num_bytes = self._content_length
        elif (self._content_length is not None
              and num_bytes > self._content_length):
            raise AssertionError(
                'requested num_bytes (%d) > content length (%d)'
                % (num_bytes, self._content_length))
        # Expand the content if required
        if self._content is None:
            if self._content_chunks is not None:
                self._content = ''.join(self._content_chunks)
                self._content_chunks = None
        if self._content is None:
            if self._z_content is None:
                raise AssertionError('No content to decompress')
            if self._z_content == '':
                self._content = ''
            elif self._compressor_name == 'lzma':
                # We don't do partial lzma decomp yet
                self._content = pylzma.decompress(self._z_content)
            elif self._compressor_name == 'zlib':
                # Start a zlib decompressor
                if num_bytes is None:
                    self._content = zlib.decompress(self._z_content)
                else:
                    self._z_content_decompressor = zlib.decompressobj()
                    # Seed the decompressor with the compressed bytes, so
                    # that the rest of the code is simplified
                    self._content = self._z_content_decompressor.decompress(
                        self._z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
            else:
                raise AssertionError('Unknown compressor: %r'
                                     % self._compressor_name)
        # Any bytes remaining to be decompressed will be in the decompressors
        # 'unconsumed_tail'

        # Do we have enough bytes already?
        if num_bytes is not None and len(self._content) >= num_bytes:
            return
        if num_bytes is None and self._z_content_decompressor is None:
            # We must have already decompressed everything
            return
        # If we got this far, and don't have a decompressor, something is wrong
        if self._z_content_decompressor is None:
            raise AssertionError(
                'No decompressor to decompress %d bytes' % num_bytes)
        remaining_decomp = self._z_content_decompressor.unconsumed_tail
        if num_bytes is None:
            if remaining_decomp:
                # We don't know how much is left, but we'll decompress it all
                self._content += self._z_content_decompressor.decompress(
                    remaining_decomp)
                # Note: There's what I consider a bug in zlib.decompressobj
                #       If you pass back in the entire unconsumed_tail, only
                #       this time you don't pass a max-size, it doesn't
                #       change the unconsumed_tail back to None/''.
                #       However, we know we are done with the whole stream
                self._z_content_decompressor = None
            # XXX: Why is this the only place in this routine we set this?
            self._content_length = len(self._content)
        else:
            if not remaining_decomp:
                raise AssertionError('Nothing left to decompress')
            needed_bytes = num_bytes - len(self._content)
            # We always set max_size to 32kB over the minimum needed, so that
            # zlib will give us as much as we really want.
            # TODO: If this isn't good enough, we could make a loop here,
            #       that keeps expanding the request until we get enough
            self._content += self._z_content_decompressor.decompress(
                remaining_decomp, needed_bytes + _ZLIB_DECOMP_WINDOW)
            if len(self._content) < num_bytes:
                raise AssertionError('%d bytes wanted, only %d available'
                                     % (num_bytes, len(self._content)))
            if not self._z_content_decompressor.unconsumed_tail:
                # The stream is finished
                self._z_content_decompressor = None

    def _parse_bytes(self, bytes, pos):
        """Read the various lengths from the header.

        This also populates the various 'compressed' buffers.

        :param bytes: The serialised block, including the 6-byte header.
        :param pos: Offset in bytes at which the two length lines start.
        :return: The position in bytes just after the last newline
        :raises AssertionError: if the compressed length recorded in the
            header does not match the number of bytes that follow it.
        """
        # At present, we have 2 integers for the compressed and uncompressed
        # content. In base10 (ascii) 14 bytes can represent > 1TB, so to avoid
        # checking too far, cap the search to 14 bytes.
        pos2 = bytes.index('\n', pos, pos + 14)
        self._z_content_length = int(bytes[pos:pos2])
        pos = pos2 + 1
        pos2 = bytes.index('\n', pos, pos + 14)
        self._content_length = int(bytes[pos:pos2])
        pos = pos2 + 1
        if len(bytes) != (pos + self._z_content_length):
            # XXX: Define some GCCorrupt error ?
            raise AssertionError('Invalid bytes: (%d) != %d + %d' %
                                 (len(bytes), pos, self._z_content_length))
        self._z_content = bytes[pos:]
        # Honour the documented contract; the value is the start of the
        # compressed payload.
        return pos

    @classmethod
    def from_bytes(cls, bytes):
        """Build a block from its serialised form (see to_bytes).

        :param bytes: A string starting with one of GCB_KNOWN_HEADERS.
        :return: A new block with the compressed content and both lengths
            populated; nothing is decompressed here.
        :raises ValueError: if bytes does not start with a known header.
        """
        out = cls()
        if bytes[:6] not in cls.GCB_KNOWN_HEADERS:
            raise ValueError('bytes did not start with any of %r'
                             % (cls.GCB_KNOWN_HEADERS,))
        # XXX: why not testing the whole header ?
        # The 5th header character names the compressor
        if bytes[4] == 'z':
            out._compressor_name = 'zlib'
        elif bytes[4] == 'l':
            out._compressor_name = 'lzma'
        else:
            raise ValueError('unknown compressor: %r' % (bytes,))
        out._parse_bytes(bytes, 6)
        return out

    def extract(self, key, start, end, sha1=None):
        """Extract the text for a specific key.

        :param key: The label used for this content (not used by this method)
        :param start: Offset of the record's first byte in the content
        :param end: Offset just past the record's last byte
        :param sha1: TODO (should we validate only when sha1 is supplied?)
        :return: The bytes for the content
        :raises ValueError: if the record does not start with 'f' or 'd', or
            if the length stored in the record disagrees with end.
        """
        if start == end == 0:
            return ''
        self._ensure_content(end)
        # The bytes are 'f' or 'd' for the type, then a variable-length
        # base128 integer for the content size, then the actual content
        # We know that the variable-length integer won't be longer than 5
        # bytes (it takes 5 bytes to encode 2^32)
        c = self._content[start]
        if c not in ('f', 'd'):
            raise ValueError('Unknown content control code: %s'
                             % (c,))
        content_len, len_len = decode_base128_int(
            self._content[start + 1:start + 6])
        content_start = start + 1 + len_len
        if end != content_start + content_len:
            raise ValueError('end != len according to field header'
                             ' %s != %s' % (end, content_start + content_len))
        if c == 'f':
            # Fulltext: the payload is the text itself
            bytes = self._content[content_start:end]
        else:
            # Delta: expand it against the block content
            bytes = apply_delta_to_source(self._content, content_start, end)
        return bytes

    def set_chunked_content(self, content_chunks, length):
        """Set the content of this block to the given chunks.

        :param content_chunks: A list of strings making up the content.
        :param length: The total length, stored as given (not recomputed).
        """
        # If we have lots of short lines, it may be more efficient to join
        # the content ahead of time. If the content is <10MiB, we don't really
        # care about the extra memory consumption, so we can just pack it and
        # be done. However, timing showed 18s => 17.9s for repacking 1k revs of
        # mysql, which is below the noise margin
        self._content_length = length
        self._content_chunks = content_chunks
        self._content = None
        self._z_content = None

    def set_content(self, content):
        """Set the content of this block.

        :param content: The complete uncompressed content as one string.
        """
        self._content_length = len(content)
        self._content = content
        # Drop any chunks from an earlier set_chunked_content(); otherwise
        # _create_z_content() would compress those instead of 'content'.
        self._content_chunks = None
        self._z_content = None

    def _create_z_content_using_lzma(self):
        """Compress the content with pylzma into _z_content."""
        if self._content_chunks is not None:
            self._content = ''.join(self._content_chunks)
            self._content_chunks = None
        if self._content is None:
            raise AssertionError('Nothing to compress')
        self._z_content = pylzma.compress(self._content)
        self._z_content_length = len(self._z_content)
        self._compressor_name = 'lzma'

    def _create_z_content_from_chunks(self):
        """Compress _content_chunks with zlib without joining them first."""
        compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
        compressed_chunks = [compressor.compress(chunk)
                             for chunk in self._content_chunks]
        compressed_chunks.append(compressor.flush())
        self._z_content = ''.join(compressed_chunks)
        self._z_content_length = len(self._z_content)
        self._compressor_name = 'zlib'

    def _create_z_content(self):
        """Populate _z_content and _z_content_length if not already set.

        :raises AssertionError: if there is no content to compress.
        """
        if self._z_content is not None:
            return
        if _USE_LZMA:
            self._create_z_content_using_lzma()
            return
        if self._content_chunks is not None:
            self._create_z_content_from_chunks()
            return
        if self._content is None:
            # Same failure mode as the lzma path, rather than a TypeError
            # from zlib.compress(None)
            raise AssertionError('Nothing to compress')
        self._z_content = zlib.compress(self._content)
        self._z_content_length = len(self._z_content)
        self._compressor_name = 'zlib'

    def to_bytes(self):
        """Encode the information into a byte stream.

        The layout is: header line, compressed length line, uncompressed
        length line, then the compressed content.
        """
        self._create_z_content()
        # The header must describe how _z_content was actually compressed,
        # which may differ from _USE_LZMA when the block came from
        # from_bytes().
        if self._compressor_name == 'lzma':
            header = self.GCB_LZ_HEADER
        elif self._compressor_name == 'zlib':
            header = self.GCB_HEADER
        elif _USE_LZMA:
            # Compressor unknown (e.g. _z_content assigned directly): fall
            # back to the module-wide setting.
            header = self.GCB_LZ_HEADER
        else:
            header = self.GCB_HEADER
        chunks = [header,
                  '%d\n%d\n' % (self._z_content_length, self._content_length),
                  self._z_content,
                  ]
        return ''.join(chunks)

    def _dump(self, include_text=False):
        """Take this block, and spit out a human-readable structure.

        :param include_text: Inserts also include text bits, chose whether you
            want this displayed in the dump or not.
        :return: A dump of the given block. The layout is something like:
            [('f', length), ('d', delta_length, text_length, [delta_info])]
            delta_info := [('i', num_bytes, text), ('c', offset, num_bytes),
            ...]
        :raises ValueError: on an unknown record kind, a record running past
            the end of the content, or a delta whose consumed or produced
            byte counts do not match its headers.
        """
        self._ensure_content()
        result = []
        pos = 0
        while pos < self._content_length:
            kind = self._content[pos]
            pos += 1
            if kind not in ('f', 'd'):
                raise ValueError('invalid kind character: %r' % (kind,))
            content_len, len_len = decode_base128_int(
                self._content[pos:pos + 5])
            pos += len_len
            if content_len + pos > self._content_length:
                raise ValueError('invalid content_len %d for record @ pos %d'
                                 % (content_len, pos - len_len - 1))
            if kind == 'f': # Fulltext
                if include_text:
                    text = self._content[pos:pos+content_len]
                    result.append(('f', content_len, text))
                else:
                    result.append(('f', content_len))
            elif kind == 'd': # Delta
                delta_content = self._content[pos:pos+content_len]
                delta_info = []
                # The first entry in a delta is the decompressed length
                decomp_len, delta_pos = decode_base128_int(delta_content)
                result.append(('d', content_len, decomp_len, delta_info))
                measured_len = 0
                while delta_pos < content_len:
                    c = ord(delta_content[delta_pos])
                    delta_pos += 1
                    if c & 0x80: # Copy
                        (offset, length,
                         delta_pos) = decode_copy_instruction(delta_content, c,
                                                              delta_pos)
                        if include_text:
                            text = self._content[offset:offset+length]
                            delta_info.append(('c', offset, length, text))
                        else:
                            delta_info.append(('c', offset, length))
                        measured_len += length
                    else: # Insert
                        if include_text:
                            txt = delta_content[delta_pos:delta_pos+c]
                        else:
                            txt = ''
                        delta_info.append(('i', c, txt))
                        measured_len += c
                        delta_pos += c
                if delta_pos != content_len:
                    raise ValueError('Delta consumed a bad number of bytes:'
                                     ' %d != %d' % (delta_pos, content_len))
                if measured_len != decomp_len:
                    raise ValueError('Delta claimed fulltext was %d bytes, but'
                                     ' extraction resulted in %d bytes'
                                     % (decomp_len, measured_len))
            pos += content_len
        return result

404

405

406

class _LazyGroupCompressFactory(object):

407

"""Yield content from a GroupCompressBlock on demand."""

408

409

def __init__(self, key, parents, manager, start, end, first):

410

"""Create a _LazyGroupCompressFactory

411

412

:param key: The key of just this record

413

:param parents: The parents of this key (possibly None)

414

:param gc_block: A GroupCompressBlock object

415

:param start: Offset of the first byte for this record in the

416

uncompressd content

417

:param end: Offset of the byte just after the end of this record

418

(ie, bytes = content[start:end])

419

:param first: Is this the first Factory for the given block?

420

"""

421

self.key = key

422

self.parents = parents

423

self.sha1 = None

424

# Note: This attribute coupled with Manager._factories creates a

425

# reference cycle. Perhaps we would rather use a weakref(), or

426

# find an appropriate time to release the ref. After the first

427

# get_bytes_as call? After Manager.get_record_stream() returns

428

# the object?

429

self._manager = manager

430

self._bytes = None

431

self.storage_kind = 'groupcompress-block'

432

if not first:

433

self.storage_kind = 'groupcompress-block-ref'

434

self._first = first

435

self._start = start

436

self._end = end

437

438

def __repr__(self):

439

return '%s(%s, first=%s)' % (self.__class__.__name__,

440

self.key, self._first)

441

442

def get_bytes_as(self, storage_kind):

443

if storage_kind == self.storage_kind:

444

if self._first:

445

# wire bytes, something...

446

return self._manager._wire_bytes()

447

else:

448

return ''

449

if storage_kind in ('fulltext', 'chunked'):

450

if self._bytes is None:

451

# Grab and cache the raw bytes for this entry

452

# and break the ref-cycle with _manager since we don't need it

453

# anymore

454

self._manager._prepare_for_extract()

455

block = self._manager._block

456

self._bytes = block.extract(self.key, self._start, self._end)

457

# There are code paths that first extract as fulltext, and then

458

# extract as storage_kind (smart fetch). So we don't break the

459

# refcycle here, but instead in manager.get_record_stream()

460

# self._manager = None

461

if storage_kind == 'fulltext':

462

return self._bytes

463

else:

464

return [self._bytes]

465

raise errors.UnavailableRepresentation(self.key, storage_kind,

466

self.storage_kind)

467

468

469

class _LazyGroupContentManager(object):

470

"""This manages a group of _LazyGroupCompressFactory objects."""

471

472

def __init__(self, block):

473

self._block = block

474

# We need to preserve the ordering

475

self._factories = []

476

self._last_byte = 0

477

478

def add_factory(self, key, parents, start, end):

479

if not self._factories:

480

first = True

481

else:

482

first = False

483

# Note that this creates a reference cycle....

484

factory = _LazyGroupCompressFactory(key, parents, self,

485

start, end, first=first)

486

# max() works here, but as a function call, doing a compare seems to be

487

# significantly faster, timeit says 250ms for max() and 100ms for the

488

# comparison

489

if end > self._last_byte:

490

self._last_byte = end

491

self._factories.append(factory)

492

493

def get_record_stream(self):

494

"""Get a record for all keys added so far."""

495

for factory in self._factories:

496

yield factory

497

# Break the ref-cycle

498

factory._bytes = None

499

factory._manager = None

500

# TODO: Consider setting self._factories = None after the above loop,

501

# as it will break the reference cycle

502

503

def _trim_block(self, last_byte):

504

"""Create a new GroupCompressBlock, with just some of the content."""

505

# None of the factories need to be adjusted, because the content is

506

# located in an identical place. Just that some of the unreferenced

507

# trailing bytes are stripped

508

trace.mutter('stripping trailing bytes from groupcompress block'

509

' %d => %d', self._block._content_length, last_byte)

510

new_block = GroupCompressBlock()

511

self._block._ensure_content(last_byte)

512

new_block.set_content(self._block._content[:last_byte])

513

self._block = new_block

514

515

def _rebuild_block(self):

516

"""Create a new GroupCompressBlock with only the referenced texts."""

517

compressor = GroupCompressor()

518

tstart = time.time()

519

old_length = self._block._content_length

520

end_point = 0

521

for factory in self._factories:

522

bytes = factory.get_bytes_as('fulltext')

523

(found_sha1, start_point, end_point,

524

type) = compressor.compress(factory.key, bytes, factory.sha1)

525

# Now update this factory with the new offsets, etc

526

factory.sha1 = found_sha1

527

factory._start = start_point

528

factory._end = end_point

529

self._last_byte = end_point

530

new_block = compressor.flush()

531

# TODO: Should we check that new_block really *is* smaller than the old

532

# block? It seems hard to come up with a method that it would

533

# expand, since we do full compression again. Perhaps based on a

534

# request that ends up poorly ordered?

535

delta = time.time() - tstart

536

self._block = new_block

537

trace.mutter('creating new compressed block on-the-fly in %.3fs'

538

' %d bytes => %d bytes', delta, old_length,

539

self._block._content_length)

540

541

def _prepare_for_extract(self):

542

"""A _LazyGroupCompressFactory is about to extract to fulltext."""

543

# We expect that if one child is going to fulltext, all will be. This

544

# helps prevent all of them from extracting a small amount at a time.

545

# Which in itself isn't terribly expensive, but resizing 2MB 32kB at a

546

# time (self._block._content) is a little expensive.

547

self._block._ensure_content(self._last_byte)

548

549

def _check_rebuild_block(self):

550

"""Check to see if our block should be repacked."""

551

total_bytes_used = 0

552

last_byte_used = 0

553

for factory in self._factories:

554

total_bytes_used += factory._end - factory._start

555

last_byte_used = max(last_byte_used, factory._end)

556

# If we are using most of the bytes from the block, we have nothing

557

# else to check (currently more that 1/2)

558

if total_bytes_used * 2 >= self._block._content_length:

559

return

560

# Can we just strip off the trailing bytes? If we are going to be

561

# transmitting more than 50% of the front of the content, go ahead

562

if total_bytes_used * 2 > last_byte_used:

563

self._trim_block(last_byte_used)

564

return

565

566

# We are using a small amount of the data, and it isn't just packed

567

# nicely at the front, so rebuild the content.

568

# Note: This would be *nicer* as a strip-data-from-group, rather than

569

# building it up again from scratch

570

# It might be reasonable to consider the fulltext sizes for

571

# different bits when deciding this, too. As you may have a small

572

# fulltext, and a trivial delta, and you are just trading around

573

# for another fulltext. If we do a simple 'prune' you may end up

574

# expanding many deltas into fulltexts, as well.

575

# If we build a cheap enough 'strip', then we could try a strip,

576

# if that expands the content, we then rebuild.

577

self._rebuild_block()

578

579

def _wire_bytes(self):

580

"""Return a byte stream suitable for transmitting over the wire."""

581

self._check_rebuild_block()

582

# The outer block starts with:

583

# 'groupcompress-block\n'

584

# <length of compressed key info>\n

585

# <length of uncompressed info>\n

586

# <length of gc block>\n

587

# <header bytes>

588

# <gc-block>

589

lines = ['groupcompress-block\n']

590

# The minimal info we need is the key, the start offset, and the

591

# parents. The length and type are encoded in the record itself.

592

# However, passing in the other bits makes it easier. The list of

593

# keys, and the start offset, the length

594

# 1 line key

595

# 1 line with parents, '' for ()

596

# 1 line for start offset

597

# 1 line for end byte

598

header_lines = []

599

for factory in self._factories:

600

key_bytes = '\x00'.join(factory.key)

601

parents = factory.parents

602

if parents is None:

603

parent_bytes = 'None:'

604

else:

605

parent_bytes = '\t'.join('\x00'.join(key) for key in parents)

606

record_header = '%s\n%s\n%d\n%d\n' % (

607

key_bytes, parent_bytes, factory._start, factory._end)

608

header_lines.append(record_header)

609

# TODO: Can we break the refcycle at this point and set

610

# factory._manager = None?

611

header_bytes = ''.join(header_lines)

612

del header_lines

613

header_bytes_len = len(header_bytes)

614

z_header_bytes = zlib.compress(header_bytes)

615

del header_bytes

616

z_header_bytes_len = len(z_header_bytes)

617

block_bytes = self._block.to_bytes()

618

lines.append('%d\n%d\n%d\n' % (z_header_bytes_len, header_bytes_len,

619

len(block_bytes)))

620

lines.append(z_header_bytes)

621

lines.append(block_bytes)

622

del z_header_bytes, block_bytes

623

return ''.join(lines)

624

625

@classmethod
def from_bytes(cls, bytes):
    """Rebuild a manager from a 'groupcompress-block' wire string.

    :param bytes: The storage kind line, three decimal length lines, the
        zlib-compressed record header and the serialised group block, in
        that order.
    :return: cls(block), with add_factory() called once for every group of
        four header lines (key, parents, start offset, end offset).
    :raises ValueError: If the storage kind is not 'groupcompress-block',
        if any of the recorded lengths disagree with the data, or if the
        record header is malformed.
    """
    # TODO: This does extra string copying, probably better to do it a
    #       different way
    fields = bytes.split('\n', 4)
    del bytes
    (storage_kind, z_header_len, header_len, block_len, rest) = fields
    del fields
    if storage_kind != 'groupcompress-block':
        raise ValueError('Unknown storage kind: %s' % (storage_kind,))
    z_header_len = int(z_header_len)
    if z_header_len > len(rest):
        raise ValueError('Compressed header len shorter than all bytes')
    header_len = int(header_len)
    header = zlib.decompress(rest[:z_header_len])
    if header_len != len(header):
        raise ValueError('invalid length for decompressed bytes')
    block_len = int(block_len)
    # Whatever follows the compressed header must be exactly the block
    if z_header_len + block_len != len(rest):
        raise ValueError('Invalid length for block')
    block_bytes = rest[z_header_len:]
    del rest
    # So now we have a valid GCB, we just need to parse the factories that
    # were sent to us
    header_lines = header.split('\n')
    del header
    # A well formed header ends with '\n', so the final split element is ''
    if header_lines.pop() != '':
        raise ValueError('header lines did not end with a trailing'
                         ' newline')
    if len(header_lines) % 4:
        raise ValueError('The header was not an even multiple of 4 lines')
    block = GroupCompressBlock.from_bytes(block_bytes)
    del block_bytes
    result = cls(block)
    for offset in xrange(0, len(header_lines), 4):
        # intern()?
        (key_line, parents_line, start_line,
         end_line) = header_lines[offset:offset + 4]
        key = tuple(key_line.split('\x00'))
        if parents_line == 'None:':
            parents = None
        else:
            # Empty segments are skipped, so an empty line gives ()
            parents = tuple([tuple(segment.split('\x00'))
                             for segment in parents_line.split('\t')
                             if segment])
        result.add_factory(key, parents, int(start_line), int(end_line))
    return result

675

676

677

def network_block_to_records(storage_kind, bytes, line_end):
    """Turn a serialised 'groupcompress-block' into a record stream.

    :param storage_kind: Must be 'groupcompress-block'.
    :param bytes: The serialised block, handed to
        _LazyGroupContentManager.from_bytes.
    :param line_end: Not used by this function.
    :return: The result of get_record_stream() on the rebuilt manager.
    :raises ValueError: For any other storage kind.
    """
    if storage_kind == 'groupcompress-block':
        return _LazyGroupContentManager.from_bytes(bytes).get_record_stream()
    raise ValueError('Unknown storage kind: %s' % (storage_kind,))

682

683

684

class _CommonGroupCompressor(object):

685

686

def __init__(self):

687

"""Create a GroupCompressor."""

688

self.chunks = []

689

self._last = None

690

self.endpoint = 0

691

self.input_bytes = 0

692

self.labels_deltas = {}

693

self._delta_index = None # Set by the children

694

self._block = GroupCompressBlock()

695

696

def compress(self, key, bytes, expected_sha, nostore_sha=None, soft=False):

697

"""Compress lines with label key.

698

699

:param key: A key tuple. It is stored in the output

700

for identification of the text during decompression. If the last

701

element is 'None' it is replaced with the sha1 of the text -

702

e.g. sha1:xxxxxxx.

703

:param bytes: The bytes to be compressed

704

:param expected_sha: If non-None, the sha the lines are believed to

705

have. During compression the sha is calculated; a mismatch will

706

cause an error.

707

:param nostore_sha: If the computed sha1 sum matches, we will raise

708

ExistingContent rather than adding the text.

709

:param soft: Do a 'soft' compression. This means that we require larger

710

ranges to match to be considered for a copy command.

711

712

:return: The sha1 of lines, the start and end offsets in the delta, and

713

the type ('fulltext' or 'delta').

714

715

:seealso VersionedFiles.add_lines:

716

"""

717

if not bytes: # empty, like a dir entry, etc

718

if nostore_sha == _null_sha1:

719

raise errors.ExistingContent()

720

return _null_sha1, 0, 0, 'fulltext'

721

# we assume someone knew what they were doing when they passed it in

722

if expected_sha is not None:

723

sha1 = expected_sha

724

else:

725

sha1 = osutils.sha_string(bytes)

726

if nostore_sha is not None:

727

if sha1 == nostore_sha:

728

raise errors.ExistingContent()

729

if key[-1] is None:

730

key = key[:-1] + ('sha1:' + sha1,)

731

732

start, end, type = self._compress(key, bytes, len(bytes) / 2, soft)

733

return sha1, start, end, type

734

735

def _compress(self, key, bytes, max_delta_size, soft=False):

736

"""Compress lines with label key.

737

738

:param key: A key tuple. It is stored in the output for identification

739

of the text during decompression.

740

741

:param bytes: The bytes to be compressed

742

743

:param max_delta_size: The size above which we issue a fulltext instead

744

of a delta.

745

746

:param soft: Do a 'soft' compression. This means that we require larger

747

ranges to match to be considered for a copy command.

748

749

:return: The sha1 of lines, the start and end offsets in the delta, and

750

the type ('fulltext' or 'delta').

751

"""

752

raise NotImplementedError(self._compress)

753

754

def extract(self, key):

755

"""Extract a key previously added to the compressor.

756

757

:param key: The key to extract.

758

:return: An iterable over bytes and the sha1.

759

"""

760

(start_byte, start_chunk, end_byte, end_chunk) = self.labels_deltas[key]

761

delta_chunks = self.chunks[start_chunk:end_chunk]

762

stored_bytes = ''.join(delta_chunks)

763

if stored_bytes[0] == 'f':

764

fulltext_len, offset = decode_base128_int(stored_bytes[1:10])

765

data_len = fulltext_len + 1 + offset

766

if data_len != len(stored_bytes):

767

raise ValueError('Index claimed fulltext len, but stored bytes'

768

' claim %s != %s'

769

% (len(stored_bytes), data_len))

770

bytes = stored_bytes[offset + 1:]

771

else:

772

# XXX: This is inefficient at best

773

source = ''.join(self.chunks[:start_chunk])

774

if stored_bytes[0] != 'd':

775

raise ValueError('Unknown content kind, bytes claim %s'

776

% (stored_bytes[0],))

777

delta_len, offset = decode_base128_int(stored_bytes[1:10])

778

data_len = delta_len + 1 + offset

779

if data_len != len(stored_bytes):

780

raise ValueError('Index claimed delta len, but stored bytes'

781

' claim %s != %s'

782

% (len(stored_bytes), data_len))

783

bytes = apply_delta(source, stored_bytes[offset + 1:])

784

bytes_sha1 = osutils.sha_string(bytes)

785

return bytes, bytes_sha1

786

787

def flush(self):

788

"""Finish this group, creating a formatted stream.

789

790

After calling this, the compressor should no longer be used

791

"""

792

# TODO: this causes us to 'bloat' to 2x the size of content in the

793

# group. This has an impact for 'commit' of large objects.

794

# One possibility is to use self._content_chunks, and be lazy and

795

# only fill out self._content as a full string when we actually

796

# need it. That would at least drop the peak memory consumption

797

# for 'commit' down to ~1x the size of the largest file, at a

798

# cost of increased complexity within this code. 2x is still <<

799

# 3x the size of the largest file, so we are doing ok.

800

self._block.set_chunked_content(self.chunks, self.endpoint)

801

self.chunks = None

802

self._delta_index = None

803

return self._block

804

805

def pop_last(self):

806

"""Call this if you want to 'revoke' the last compression.

807

808

After this, the data structures will be rolled back, but you cannot do

809

more compression.

810

"""

811

self._delta_index = None

812

del self.chunks[self._last[0]:]

813

self.endpoint = self._last[1]

814

self._last = None

815

816

def ratio(self):

817

"""Return the overall compression ratio."""

818

return float(self.input_bytes) / float(self.endpoint)

819

820

821

class PythonGroupCompressor(_CommonGroupCompressor):
    """Group compressor built on the line based LinesDeltaIndex."""

    def __init__(self):
        """Create a GroupCompressor.

        Used only if the pyrex version is not available.
        """
        super(PythonGroupCompressor, self).__init__()
        index = LinesDeltaIndex([])
        self._delta_index = index
        # The actual content is managed by LinesDeltaIndex, so the chunk list
        # is shared with it rather than kept separately.
        self.chunks = index.lines

    def _compress(self, key, bytes, max_delta_size, soft=False):
        """see _CommonGroupCompressor._compress"""
        input_len = len(bytes)
        new_lines = osutils.split_lines(bytes)
        out_lines, index_lines = self._delta_index.make_delta(
            new_lines, bytes_length=input_len, soft=soft)
        delta_length = sum([len(line) for line in out_lines])
        if delta_length <= max_delta_size:
            # this is a worthy delta, output it. The first two entries of
            # out_lines are replaced by the kind marker and encoded length.
            type = 'delta'
            out_lines[0] = 'd'
            out_lines[1] = encode_base128_int(delta_length)
        else:
            # The delta is larger than we are willing to accept, insert a
            # fulltext instead
            type = 'fulltext'
            out_lines = ['f', encode_base128_int(input_len)]
            out_lines += new_lines
            # The two header entries are flagged False, every content line
            # True.
            index_lines = [False, False] + [True] * len(new_lines)
        # Remember where we were before insertion
        start = self.endpoint
        chunk_start = len(self.chunks)
        self._last = (chunk_start, start)
        self._delta_index.extend_lines(out_lines, index_lines)
        self.endpoint = self._delta_index.endpoint
        self.input_bytes += input_len
        self.labels_deltas[key] = (start, chunk_start,
                                   self.endpoint, len(self.chunks))
        return start, self.endpoint, type

864

865

866

class PyrexGroupCompressor(_CommonGroupCompressor):
    """Produce a serialised group of compressed texts.

    It contains code very similar to SequenceMatcher because of having a similar
    task. However some key differences apply:
     - there is no junk, we want a minimal edit not a human readable diff.
     - we don't filter very common lines (because we don't know where a good
       range will start, and after the first text we want to be emitting
       minimal edits only).
     - we chain the left side, not the right side
     - we incrementally update the adjacency matrix as new lines are provided.
     - we look for matches in all of the left side, so the routine which does
       the analogous task of find_longest_match does not need to filter on the
       left side.
    """

    def __init__(self):
        super(PyrexGroupCompressor, self).__init__()
        self._delta_index = DeltaIndex()

    def _compress(self, key, bytes, max_delta_size, soft=False):
        """see _CommonGroupCompressor._compress

        The soft parameter is accepted for interface compatibility but is not
        used by this implementation.

        :raises AssertionError: If the delta index offset and self.endpoint
            disagree before or after the new record is output.
        """
        input_len = len(bytes)
        # By having action/label/sha1/len, we can parse the group if the index
        # was ever destroyed, we have the key in 'label', we know the final
        # bytes are valid from sha1, and we know where to find the end of this
        # record because of 'len'. (the delta record itself will store the
        # total length for the expanded record)
        # 'len: %d\n' costs approximately 1% increase in total data
        # Having the labels at all costs us 9-10% increase, 38% increase for
        # inventory pages, and 5.8% increase for text pages
        # new_chunks = ['label:%s\nsha1:%s\n' % (label, sha1)]
        if self._delta_index._source_offset != self.endpoint:
            raise AssertionError('_source_offset != endpoint'
                ' somehow the DeltaIndex got out of sync with'
                ' the output lines')
        delta = self._delta_index.make_delta(bytes, max_delta_size)
        if delta is None:
            # No acceptable delta, store the text itself
            type = 'fulltext'
            enc_length = encode_base128_int(len(bytes))
            # 1 byte for the kind marker plus the encoded length
            len_mini_header = 1 + len(enc_length)
            self._delta_index.add_source(bytes, len_mini_header)
            new_chunks = ['f', enc_length, bytes]
        else:
            type = 'delta'
            enc_length = encode_base128_int(len(delta))
            len_mini_header = 1 + len(enc_length)
            new_chunks = ['d', enc_length, delta]
            self._delta_index.add_delta_source(delta, len_mini_header)
        # Before insertion
        start = self.endpoint
        chunk_start = len(self.chunks)
        # Now output these bytes
        self._output_chunks(new_chunks)
        self.input_bytes += input_len
        chunk_end = len(self.chunks)
        self.labels_deltas[key] = (start, chunk_start,
                                   self.endpoint, chunk_end)
        if self._delta_index._source_offset != self.endpoint:
            # The pieces of this message are joined by the parser, so the
            # separating space has to be part of one of them.
            raise AssertionError('the delta index is out of sync'
                ' with the output lines %s != %s'
                % (self._delta_index._source_offset, self.endpoint))
        return start, self.endpoint, type

    def _output_chunks(self, new_chunks):
        """Output some chunks.

        The state before the insertion is saved in self._last, so that
        pop_last() can roll it back.

        :param new_chunks: The chunks to output.
        """
        self._last = (len(self.chunks), self.endpoint)
        endpoint = self.endpoint
        self.chunks.extend(new_chunks)
        endpoint += sum(map(len, new_chunks))
        self.endpoint = endpoint

940

941

942

def make_pack_factory(graph, delta, keylength, inconsistency_fatal=True):
    """Create a factory for creating a pack based groupcompress.

    This is only functional enough to run interface tests, it doesn't try to
    provide a full pack environment.

    :param graph: Store a graph.
    :param delta: Delta compress contents.
    :param keylength: How long should keys be.
    :param inconsistency_fatal: Passed through to _GCGraphIndex.
    :return: A callable taking a transport. It returns a
        GroupCompressVersionedFiles writing to 'newpack' on that transport,
        with the open stream and container writer attached as .stream and
        .writer.
    """
    def factory(transport):
        # One reference list when a graph is stored, none otherwise
        if graph:
            ref_length = 1
        else:
            ref_length = 0
        graph_index = BTreeBuilder(reference_lists=ref_length,
                                   key_elements=keylength)
        stream = transport.open_write_stream('newpack')
        writer = pack.ContainerWriter(stream.write)
        writer.begin()
        index = _GCGraphIndex(graph_index, lambda:True, parents=graph,
                              add_callback=graph_index.add_nodes,
                              inconsistency_fatal=inconsistency_fatal)
        access = knit._DirectPackAccess({})
        access.set_writer(writer, graph_index, (transport, 'newpack'))
        result = GroupCompressVersionedFiles(index, access, delta)
        # Kept on the result so that the caller can finish the container and
        # close the stream later.
        result.stream = stream
        result.writer = writer
        return result
    return factory

972

973

974

def cleanup_pack_group(versioned_files):
    """Finish the container and close the stream of a versioned files object.

    :param versioned_files: An object with the .writer and .stream attributes
        that make_pack_factory's factory attaches to its result.
    """
    try:
        versioned_files.writer.end()
    finally:
        # Close the stream even if ending the container failed, so that it
        # is not leaked.
        versioned_files.stream.close()

977

978

979

class _BatchingBlockFetcher(object):

980

"""Fetch group compress blocks in batches.

981

982

:ivar total_bytes: int of expected number of bytes needed to fetch the

983

currently pending batch.

984

"""

985

986

def __init__(self, gcvf, locations):

987

self.gcvf = gcvf

988

self.locations = locations

989

self.keys = []

990

self.batch_memos = {}

991

self.memos_to_get = []

992

self.total_bytes = 0

993

self.last_read_memo = None

994

self.manager = None

995

996

def add_key(self, key):

997

"""Add another to key to fetch.

998

999

:return: The estimated number of bytes needed to fetch the batch so

1000

far.

1001

"""

1002

self.keys.append(key)

1003

index_memo, _, _, _ = self.locations[key]

1004

read_memo = index_memo[0:3]

1005

# Three possibilities for this read_memo:

1006

# - it's already part of this batch; or

1007

# - it's not yet part of this batch, but is already cached; or

1008

# - it's not yet part of this batch and will need to be fetched.

1009

if read_memo in self.batch_memos:

1010

# This read memo is already in this batch.

1011

return self.total_bytes

1012

try:

1013

cached_block = self.gcvf._group_cache[read_memo]

1014

except KeyError:

1015

# This read memo is new to this batch, and the data isn't cached

1016

# either.

1017

self.batch_memos[read_memo] = None

1018

self.memos_to_get.append(read_memo)

1019

byte_length = read_memo[2]

1020

self.total_bytes += byte_length

1021

else:

1022

# This read memo is new to this batch, but cached.

1023

# Keep a reference to the cached block in batch_memos because it's

1024

# certain that we'll use it when this batch is processed, but

1025

# there's a risk that it would fall out of _group_cache between now

1026

# and then.

1027

self.batch_memos[read_memo] = cached_block

1028

return self.total_bytes

1029

1030

def _flush_manager(self):

1031

if self.manager is not None:

1032

for factory in self.manager.get_record_stream():

1033

yield factory

1034

self.manager = None

1035

self.last_read_memo = None

1036

1037

def yield_factories(self, full_flush=False):

1038

"""Yield factories for keys added since the last yield. They will be

1039

returned in the order they were added via add_key.

1040

1041

:param full_flush: by default, some results may not be returned in case

1042

they can be part of the next batch. If full_flush is True, then

1043

all results are returned.

1044

"""

1045

if self.manager is None and not self.keys:

1046

return

1047

# Fetch all memos in this batch.

1048

blocks = self.gcvf._get_blocks(self.memos_to_get)

1049

# Turn blocks into factories and yield them.

1050

memos_to_get_stack = list(self.memos_to_get)

1051

memos_to_get_stack.reverse()

1052

for key in self.keys:

1053

index_memo, _, parents, _ = self.locations[key]

1054

read_memo = index_memo[:3]

1055

if self.last_read_memo != read_memo:

1056

# We are starting a new block. If we have a

1057

# manager, we have found everything that fits for

1058

# now, so yield records

1059

for factory in self._flush_manager():

1060

yield factory

1061

# Now start a new manager.

1062

if memos_to_get_stack and memos_to_get_stack[-1] == read_memo:

1063

# The next block from _get_blocks will be the block we

1064

# need.

1065

block_read_memo, block = blocks.next()

1066

if block_read_memo != read_memo:

1067

raise AssertionError(

1068

"block_read_memo out of sync with read_memo"

1069

"(%r != %r)" % (block_read_memo, read_memo))

1070

self.batch_memos[read_memo] = block

1071

memos_to_get_stack.pop()

1072

else:

1073

block = self.batch_memos[read_memo]

1074

self.manager = _LazyGroupContentManager(block)

1075

self.last_read_memo = read_memo

1076

start, end = index_memo[3:5]

1077

self.manager.add_factory(key, parents, start, end)

1078

if full_flush:

1079

for factory in self._flush_manager():

1080

yield factory

1081

del self.keys[:]

1082

self.batch_memos.clear()

1083

del self.memos_to_get[:]

1084

self.total_bytes = 0

1085

1086

1087

class GroupCompressVersionedFiles(VersionedFiles):

1088

"""A group-compress based VersionedFiles implementation."""

1089

1090

def __init__(self, index, access, delta=True):
    """Create a GroupCompressVersionedFiles object.

    :param index: The index object storing access and graph data.
    :param access: The access object storing raw data.
    :param delta: Whether to delta compress or just entropy compress.
    """
    # Collaborators supplied by the caller
    self._index, self._access, self._delta = index, access, delta
    self._unadded_refs = {}
    # Blocks that have been read are kept in a size limited cache (50MB)
    cache_limit = 50 * 1024 * 1024
    self._group_cache = LRUSizeCache(max_size=cache_limit)
    # Starts out empty; add_fallback_versioned_files() appends to it
    self._fallback_vfs = []

1103

1104

def add_lines(self, key, parents, lines, parent_texts=None,
              left_matching_blocks=None, nostore_sha=None, random_id=False,
              check_content=True):
    """Add a text to the store.

    :param key: The key tuple of the text to add.
    :param parents: The parents key tuples of the text to add. None is
        treated as ().
    :param lines: A list of lines. Each line must be a bytestring. All of
        them except the last must end with a newline and contain no other
        newline. The last line may either contain no newline at all or a
        single terminating one. If the list does not meet this constraint
        the add routine may error or may succeed - but you will be unable
        to read the data back accurately. (Checking that the lines have
        been split correctly is expensive and extremely unlikely to catch
        bugs, so it is not done at runtime unless check_content is True.)
    :param parent_texts: An optional dictionary containing the opaque
        representations of some or all of the parents of version_id to
        allow delta optimisations. VERY IMPORTANT: the texts must be those
        returned by add_lines or data corruption can be caused. Not used by
        this implementation.
    :param left_matching_blocks: a hint about which areas are common
        between the text and its left-hand-parent. The format is
        the SequenceMatcher.get_matching_blocks format. Not used by this
        implementation.
    :param nostore_sha: Raise ExistingContent and do not add the lines to
        the versioned file if the digest of the lines matches this.
    :param random_id: If True a random id has been selected rather than
        an id determined by some deterministic process such as a converter
        from a foreign VCS. When True the backend may choose not to check
        for uniqueness of the resulting key within the versioned file, so
        this should only be done when the result is expected to be unique
        anyway.
    :param check_content: If True, the lines supplied are verified to be
        bytestrings that are correctly formed lines.
    :return: The text sha1, the number of bytes in the text, and an opaque
        representation of the inserted version which can be provided
        back to future add_lines calls in the parent_texts dictionary
        (always None here).
    """
    self._index._check_write_ok()
    self._check_add(key, lines, random_id, check_content)
    if parents is None:
        # The caller might pass None if there is no graph data, but kndx
        # indexes can't directly store that, so we give them
        # an empty tuple instead.
        parents = ()
    # double handling for now. Make it work until then.
    text_length = sum([len(line) for line in lines])
    record = ChunkedContentFactory(key, parents, None, lines)
    # The text goes in as a one record stream, which gives back its sha1
    sha1s = list(self._insert_record_stream([record], random_id=random_id,
                                            nostore_sha=nostore_sha))
    return sha1s[0], text_length, None

1153

1154

def _add_text(self, key, parents, text, nostore_sha=None, random_id=False):
    """See VersionedFiles._add_text().

    :return: The text sha1, the length of text, and None.
    :raises errors.BzrBadParameterUnicode: If text is not exactly a str.
    """
    self._index._check_write_ok()
    self._check_add(key, None, random_id, check_content=False)
    if text.__class__ is not str:
        raise errors.BzrBadParameterUnicode("text")
    if parents is None:
        # The caller might pass None if there is no graph data, but kndx
        # indexes can't directly store that, so we give them
        # an empty tuple instead.
        parents = ()
    # double handling for now. Make it work until then.
    record = FulltextContentFactory(key, parents, None, text)
    # The text goes in as a one record stream, which gives back its sha1
    sha1s = list(self._insert_record_stream([record], random_id=random_id,
                                            nostore_sha=nostore_sha))
    return sha1s[0], len(text), None

1171

1172

def add_fallback_versioned_files(self, a_versioned_files):
    """Register another source to consult for texts not present here.

    Fallbacks are consulted in the order they were added.

    :param a_versioned_files: A VersionedFiles object.
    """
    fallbacks = self._fallback_vfs
    fallbacks.append(a_versioned_files)

1178

1179

def annotate(self, key):
    """See VersionedFiles.annotate.

    :return: The result of annotate_flat(key) on a new Annotator over self.
    """
    return annotate.Annotator(self).annotate_flat(key)

1183

1184

def get_annotator(self):
    """Return a new annotate.Annotator working on this object."""
    annotator = annotate.Annotator(self)
    return annotator

1186

1187

def check(self, progress_bar=None, keys=None):
    """See VersionedFiles.check().

    :param progress_bar: Not used by this implementation.
    :param keys: When given, nothing is checked here; the unordered record
        stream for those keys is returned for the caller to consume.
    :return: None when keys is None (every text has then been extracted as
        a fulltext), otherwise the record stream.
    """
    if keys is not None:
        return self.get_record_stream(keys, 'unordered', True)
    for record in self.get_record_stream(self.keys(), 'unordered', True):
        # Extracting the text is the check; the result is not needed
        record.get_bytes_as('fulltext')

1195

1196

def _check_add(self, key, lines, random_id, check_content):

1197

"""check that version_id and lines are safe to add."""

1198

version_id = key[-1]

1199

if version_id is not None:

1200

if osutils.contains_whitespace(version_id):

1201

raise errors.InvalidRevisionId(version_id, self)

1202

self.check_not_reserved_id(version_id)

1203

# TODO: If random_id==False and the key is already present, we should

1204

# probably check that the existing content is identical to what is

1205

# being inserted, and otherwise raise an exception. This would make

1206

# the bundle code simpler.

1207

if check_content:

1208

self._check_lines_not_unicode(lines)

1209

self._check_lines_are_lines(lines)

1210

1211

def get_known_graph_ancestry(self, keys):
    """Get a KnownGraph instance with the ancestry of keys.

    :param keys: The keys whose ancestry is wanted.
    :return: A KnownGraph built from the parent map that the graph index
        found. Keys the index reports as missing are ignored.
    """
    # NOTE(review): the second argument is taken to be the number of the
    # reference list to walk, 0 being the parents - confirm against
    # find_ancestry.
    parent_map, missing_keys = self._index._graph_index.find_ancestry(keys,
                                                                      0)
    kg = _mod_graph.KnownGraph(parent_map)
    return kg

1217

1218

def get_parent_map(self, keys):
    """Get a map of the graph parents of keys.

    :param keys: The keys to look up parents for.
    :return: A mapping from keys to parents. Absent keys are absent from
        the mapping.
    """
    # Only the combined mapping is wanted, not the per source results
    with_sources = self._get_parent_map_with_sources(keys)
    return with_sources[0]

1226

1227

def _get_parent_map_with_sources(self, keys):

1228

"""Get a map of the parents of keys.

1229

1230

:param keys: The keys to look up parents for.

1231

:return: A tuple. The first element is a mapping from keys to parents.

1232

Absent keys are absent from the mapping. The second element is a

1233

list with the locations each key was found in. The first element

1234

is the in-this-knit parents, the second the first fallback source,

1235

and so on.

1236

"""

1237

result = {}

1238

sources = [self._index] + self._fallback_vfs

1239

source_results = []

1240

missing = set(keys)

1241

for source in sources:

1242

if not missing:

1243

break

1244

new_result = source.get_parent_map(missing)

1245

source_results.append(new_result)

1246

result.update(new_result)

1247

missing.difference_update(set(new_result))

1248

return result, source_results

1249

1250

def _get_blocks(self, read_memos):

1251

"""Get GroupCompressBlocks for the given read_memos.

1252

1253

:returns: a series of (read_memo, block) pairs, in the order they were

1254

originally passed.

1255

"""

1256

cached = {}

1257

for read_memo in read_memos:

1258

try:

1259

block = self._group_cache[read_memo]

1260

except KeyError:

1261

pass

1262

else:

1263

cached[read_memo] = block

1264

not_cached = []

1265

not_cached_seen = set()

1266

for read_memo in read_memos:

1267

if read_memo in cached:

1268

# Don't fetch what we already have

1269

continue

1270

if read_memo in not_cached_seen:

1271

# Don't try to fetch the same data twice

1272

continue

1273

not_cached.append(read_memo)

1274

not_cached_seen.add(read_memo)

1275

raw_records = self._access.get_raw_records(not_cached)

1276

for read_memo in read_memos:

1277

try:

1278

yield read_memo, cached[read_memo]

1279

except KeyError:

1280

# Read the block, and cache it.

1281

zdata = raw_records.next()

1282

block = GroupCompressBlock.from_bytes(zdata)

1283

self._group_cache[read_memo] = block

1284

cached[read_memo] = block

1285

yield read_memo, block

1286

1287

def get_missing_compression_parent_keys(self):
    """Return the keys of missing compression parents.

    Missing compression parents occur when a record stream was missing
    basis texts, or a index was scanned that had missing basis texts.

    :return: Always an empty frozenset.
    """
    # GroupCompress cannot currently reference texts that are not in the
    # group, so this is valid for now
    nothing_missing = frozenset()
    return nothing_missing

1296

1297

def get_record_stream(self, keys, ordering, include_delta_closure):

1298

"""Get a stream of records for keys.

1299

1300

:param keys: The keys to include.

1301

:param ordering: Either 'unordered' or 'topological'. A topologically

1302

sorted stream has compression parents strictly before their

1303

children.

1304

:param include_delta_closure: If True then the closure across any

1305

compression parents will be included (in the opaque data).

1306

:return: An iterator of ContentFactory objects, each of which is only

1307

valid until the iterator is advanced.

1308

"""

1309

# keys might be a generator

1310

orig_keys = list(keys)

1311

keys = set(keys)

1312

if not keys:

1313

return

1314

if (not self._index.has_graph

1315

and ordering in ('topological', 'groupcompress')):

1316

# Cannot topological order when no graph has been stored.

1317

# but we allow 'as-requested' or 'unordered'

1318

ordering = 'unordered'

1319

1320

remaining_keys = keys

1321

while True:

1322

try:

1323

keys = set(remaining_keys)

1324

for content_factory in self._get_remaining_record_stream(keys,

1325

orig_keys, ordering, include_delta_closure):

1326

remaining_keys.discard(content_factory.key)

1327

yield content_factory

1328

return

1329

except errors.RetryWithNewPacks, e:

1330

self._access.reload_or_raise(e)

1331

1332

def _find_from_fallback(self, missing):

1333

"""Find whatever keys you can from the fallbacks.

1334

1335

:param missing: A set of missing keys. This set will be mutated as keys

1336

are found from a fallback_vfs

1337

:return: (parent_map, key_to_source_map, source_results)

1338

parent_map the overall key => parent_keys

1339

key_to_source_map a dict from {key: source}

1340

source_results a list of (source: keys)

1341

"""

1342

parent_map = {}

1343

key_to_source_map = {}

1344

source_results = []

1345

for source in self._fallback_vfs:

1346

if not missing:

1347

break

1348

source_parents = source.get_parent_map(missing)

1349

parent_map.update(source_parents)

1350

source_parents = list(source_parents)

1351

source_results.append((source, source_parents))

1352

key_to_source_map.update((key, source) for key in source_parents)

1353

missing.difference_update(source_parents)

1354

return parent_map, key_to_source_map, source_results

1355

1356

def _get_ordered_source_keys(self, ordering, parent_map, key_to_source_map):
    """Get the (source, [keys]) list.

    The returned objects should be in the order defined by 'ordering',
    which can weave between different sources.

    :param ordering: Must be one of 'topological' or 'groupcompress'
    :param parent_map: The key => parent_keys mapping to sort.
    :param key_to_source_map: A dict of key => source for keys that come
        from a fallback. Keys that are not in it belong to self.
    :return: List of [(source, [keys])] tuples, such that all keys are in
        the defined order, regardless of source.
    """
    if ordering != 'topological':
        # ordering == 'groupcompress'
        # XXX: This only optimizes for the target ordering. We may need
        #      to balance that with the time it takes to extract
        #      ordering, by somehow grouping based on
        #      locations[key][0:3]
        ordered_keys = sort_gc_optimal(parent_map)
    else:
        ordered_keys = topo_sort(parent_map)
    # Now group by source: a new (source, keys) entry is started every time
    # the source changes, so the same source can show up more than once.
    grouped = []
    previous = None
    for key in ordered_keys:
        owner = key_to_source_map.get(key, self)
        if owner is not previous:
            grouped.append((owner, []))
            previous = owner
        grouped[-1][1].append(key)
    return grouped

1384

1385

def _get_as_requested_source_keys(self, orig_keys, locations, unadded_keys,

1386

key_to_source_map):

1387

source_keys = []

1388

current_source = None

1389

for key in orig_keys:

1390

if key in locations or key in unadded_keys:

1391

source = self

1392

elif key in key_to_source_map:

1393

source = key_to_source_map[key]

1394

else: # absent

1395

continue

1396

if source is not current_source:

1397

source_keys.append((source, []))

1398

current_source = source

1399

source_keys[-1][1].append(key)

1400

return source_keys

1401

1402

def _get_io_ordered_source_keys(self, locations, unadded_keys,

1403

source_result):

1404

def get_group(key):

1405

# This is the group the bytes are stored in, followed by the

1406

# location in the group

1407

return locations[key][0]

1408

present_keys = sorted(locations.iterkeys(), key=get_group)

1409

# We don't have an ordering for keys in the in-memory object, but

1410

# lets process the in-memory ones first.

1411

present_keys = list(unadded_keys) + present_keys

1412

# Now grab all of the ones from other sources

1413

source_keys = [(self, present_keys)]

1414

source_keys.extend(source_result)

1415

return source_keys

1416

1417

def _get_remaining_record_stream(self, keys, orig_keys, ordering,
                                 include_delta_closure):
    """Get a stream of records for keys.

    :param keys: The keys to include. Must offer the set API, since
        difference() is called on it.
    :param orig_keys: The keys as originally requested; only consulted
        when ordering is 'as-requested'.
    :param ordering: one of 'unordered', 'topological', 'groupcompress' or
        'as-requested'
    :param include_delta_closure: If True then the closure across any
        compression parents will be included (in the opaque data).
    :return: An iterator of ContentFactory objects, each of which is only
        valid until the iterator is advanced.
    """
    # Cheap: iterate
    locations = self._index.get_build_details(keys)
    unadded_keys = set(self._unadded_refs).intersection(keys)
    missing = keys.difference(locations)
    missing.difference_update(unadded_keys)
    fallback_details = self._find_from_fallback(missing)
    fallback_parent_map, key_to_source_map, source_result = fallback_details
    if ordering == 'as-requested':
        plan = self._get_as_requested_source_keys(
            orig_keys, locations, unadded_keys, key_to_source_map)
    elif ordering in ('topological', 'groupcompress'):
        # would be better to not globally sort initially but instead
        # start with one key, recurse to its oldest parent, then grab
        # everything in the same group, etc.
        parent_map = {}
        for stored_key, details in locations.iteritems():
            parent_map[stored_key] = details[2]
        for pending_key in unadded_keys:
            parent_map[pending_key] = self._unadded_refs[pending_key]
        parent_map.update(fallback_parent_map)
        plan = self._get_ordered_source_keys(
            ordering, parent_map, key_to_source_map)
    else:
        # We want to yield the keys in a semi-optimal (read-wise) ordering.
        # Otherwise we thrash the _group_cache and destroy performance
        plan = self._get_io_ordered_source_keys(
            locations, unadded_keys, source_result)
    # NOTE(review): this reports whatever is still in `missing` after the
    # fallback lookup; presumably _find_from_fallback prunes the set in
    # place - confirm against that method.
    for absent_key in missing:
        yield AbsentContentFactory(absent_key)
    # Batch up as many keys as we can until either:
    #  - we encounter an unadded ref, or
    #  - we run out of keys, or
    #  - the total bytes to retrieve for this batch > BATCH_SIZE
    batcher = _BatchingBlockFetcher(self, locations)
    for source, wanted in plan:
        if source is not self:
            # Another source takes over: emit what is batched so far, then
            # hand the keys to that source.
            for factory in batcher.yield_factories(full_flush=True):
                yield factory
            for record in source.get_record_stream(wanted, ordering,
                                                   include_delta_closure):
                yield record
            continue
        for key in wanted:
            if key not in self._unadded_refs:
                if batcher.add_key(key) > BATCH_SIZE:
                    # Ok, this batch is big enough.  Yield some results.
                    for factory in batcher.yield_factories():
                        yield factory
                continue
            # Flush batch, then yield unadded ref from
            # self._compressor.
            for factory in batcher.yield_factories(full_flush=True):
                yield factory
            text, sha1 = self._compressor.extract(key)
            parents = self._unadded_refs[key]
            yield FulltextContentFactory(key, parents, sha1, text)
    for factory in batcher.yield_factories(full_flush=True):
        yield factory

1486

1487

def get_sha1s(self, keys):
    """See VersionedFiles.get_sha1s().

    :param keys: The keys to look up; they are passed on to
        self.get_record_stream() with 'unordered' ordering.
    :return: A dict mapping key => sha1. A record that carries no sha1 has
        one computed from its fulltext. Records whose storage_kind is
        'absent' are left out of the result.
    """
    result = {}
    for record in self.get_record_stream(keys, 'unordered', True):
        # Identity test: None is a singleton, and "!= None" would defer to
        # whatever __ne__ the sha1 object happens to define.
        if record.sha1 is not None:
            result[record.key] = record.sha1
        elif record.storage_kind != 'absent':
            result[record.key] = osutils.sha_string(
                record.get_bytes_as('fulltext'))
    return result

1498

1499

def insert_record_stream(self, stream):
    """Insert a record stream into this container.

    The work is done by self._insert_record_stream(), which is a
    generator; it is drained here and the values it yields are discarded.

    :param stream: A stream of records to insert.
    :return: None
    :seealso VersionedFiles.get_record_stream:
    """
    # XXX: Setting random_id=True makes
    # test_insert_record_stream_existing_keys fail for groupcompress and
    # groupcompress-nograph, this needs to be revisited while addressing
    # 'bzr branch' performance issues.
    inserted_sha1s = self._insert_record_stream(stream, random_id=False)
    for _unused_sha1 in inserted_sha1s:
        pass

1512

1513

def _insert_record_stream(self, stream, random_id=False, nostore_sha=None,
                          reuse_blocks=True):
    """Internal core to insert a record stream into this container.

    This helper function has a different interface than insert_record_stream
    to allow add_lines to be minimal, but still return the needed data.

    This is a generator: nothing happens until it is iterated, and the
    last group is only flushed once the stream has been consumed.

    :param stream: A stream of records to insert.
    :param random_id: Passed on to self._index.add_records(). When True, a
        key seen a second time in the stream is reported with trace.note()
        and skipped.
    :param nostore_sha: If the sha1 of a given text matches nostore_sha,
        raise ExistingContent, rather than committing the new text.
    :param reuse_blocks: If the source is streaming from
        groupcompress-blocks, just insert the blocks as-is, rather than
        expanding the texts and inserting again.
    :return: An iterator over the sha1 of the inserted records. Records
        that are copied as part of a raw block do not produce a value.
    :raises errors.RevisionNotPresent: If the stream contains a record
        whose storage_kind is 'absent'.
    :seealso insert_record_stream:
    :seealso add_lines:
    """
    adapters = {}
    def get_adapter(adapter_key):
        # Adapters are created on first use and cached for this call.
        try:
            return adapters[adapter_key]
        except KeyError:
            adapter_factory = adapter_registry.get(adapter_key)
            adapter = adapter_factory(self)
            adapters[adapter_key] = adapter
            return adapter
    # This will go up to fulltexts for gc to gc fetching, which isn't
    # ideal.
    self._compressor = GroupCompressor()
    self._unadded_refs = {}
    keys_to_add = []
    def flush():
        # Write out the current group, index every key that was compressed
        # into it, then start over with an empty compressor.
        group_bytes = self._compressor.flush().to_bytes()
        _, start, length = self._access.add_raw_records(
            [(None, len(group_bytes))], group_bytes)[0]
        nodes = []
        for key, reads, refs in keys_to_add:
            nodes.append((key, "%d %d %s" % (start, length, reads), refs))
        self._index.add_records(nodes, random_id=random_id)
        self._unadded_refs = {}
        del keys_to_add[:]
        self._compressor = GroupCompressor()

    last_prefix = None
    max_fulltext_len = 0
    max_fulltext_prefix = None
    insert_manager = None
    block_start = None
    block_length = None
    # XXX: TODO: remove this, it is just for safety checking for now
    inserted_keys = set()
    for record in stream:
        # Raise an error when a record is missing.
        if record.storage_kind == 'absent':
            raise errors.RevisionNotPresent(record.key, self)
        if random_id:
            if record.key in inserted_keys:
                trace.note('Insert claimed random_id=True,'
                           ' but then inserted %r two times', record.key)
                continue
            inserted_keys.add(record.key)
        if reuse_blocks:
            # If the reuse_blocks flag is set, check to see if we can just
            # copy a groupcompress block as-is.
            if record.storage_kind == 'groupcompress-block':
                # Insert the raw block into the target repo
                insert_manager = record._manager
                insert_manager._check_rebuild_block()
                block_bytes = record._manager._block.to_bytes()
                _, start, length = self._access.add_raw_records(
                    [(None, len(block_bytes))], block_bytes)[0]
                # Drop the reference to the serialised block right away.
                del block_bytes
                block_start = start
                block_length = length
            if record.storage_kind in ('groupcompress-block',
                                       'groupcompress-block-ref'):
                # A '-ref' record points into the most recently copied
                # block, so one must already have been seen.
                if insert_manager is None:
                    raise AssertionError('No insert_manager set')
                value = "%d %d %d %d" % (block_start, block_length,
                                         record._start, record._end)
                nodes = [(record.key, value, (record.parents,))]
                # TODO: Consider buffering up many nodes to be added, not
                #       sure how much overhead this has, but we're seeing
                #       ~23s / 120s in add_records calls
                self._index.add_records(nodes, random_id=random_id)
                continue
        try:
            text = record.get_bytes_as('fulltext')
        except errors.UnavailableRepresentation:
            adapter_key = record.storage_kind, 'fulltext'
            adapter = get_adapter(adapter_key)
            text = adapter.get_bytes(record)
        if len(record.key) > 1:
            prefix = record.key[0]
            soft = (prefix == last_prefix)
        else:
            prefix = None
            soft = False
        if max_fulltext_len < len(text):
            max_fulltext_len = len(text)
            max_fulltext_prefix = prefix
        # The fourth value returned by compress() is not used here.
        (found_sha1, start_point, end_point,
         _) = self._compressor.compress(record.key,
                                        text, record.sha1, soft=soft,
                                        nostore_sha=nostore_sha)
        # delta_ratio = float(len(text)) / (end_point - start_point)
        # Check if we want to continue to include that text
        if (prefix == max_fulltext_prefix
            and end_point < 2 * max_fulltext_len):
            # As long as we are on the same file_id, we will fill at least
            # 2 * max_fulltext_len
            start_new_block = False
        elif end_point > 4*1024*1024:
            start_new_block = True
        elif (prefix is not None and prefix != last_prefix
              and end_point > 2*1024*1024):
            start_new_block = True
        else:
            start_new_block = False
        last_prefix = prefix
        if start_new_block:
            # Take this text back out of the current group, write the group
            # out, and make the text the first entry of the next group.
            self._compressor.pop_last()
            flush()
            max_fulltext_len = len(text)
            (found_sha1, start_point, end_point,
             _) = self._compressor.compress(record.key, text,
                                            record.sha1)
        if record.key[-1] is None:
            # The last key element is filled in from the content's sha1.
            key = record.key[:-1] + ('sha1:' + found_sha1,)
        else:
            key = record.key
        self._unadded_refs[key] = record.parents
        yield found_sha1
        keys_to_add.append((key, '%d %d' % (start_point, end_point),
                            (record.parents,)))
    if keys_to_add:
        flush()
    self._compressor = None

1651

1652

def iter_lines_added_or_present_in_keys(self, keys, pb=None):
    """Iterate over the lines in the versioned files from keys.

    This may return lines from other keys. Each item the returned
    iterator yields is a tuple of a line and a text version that that line
    is present in (not introduced in).

    Ordering of results is in whatever order is most suitable for the
    underlying storage format.

    If a progress bar is supplied, it may be used to indicate progress.
    The caller is responsible for cleaning up progress bars (because this
    is an iterator).

    NOTES:
     * Lines are normalised by the underlying store: they will all have \n
       terminators.
     * Lines are returned in arbitrary order.

    :param keys: The keys to walk; duplicates are collapsed.
    :param pb: Optional progress bar; its update() method is called once
        per record and once more when the walk is finished.
    :return: An iterator over (line, key).
    :raises errors.RevisionNotPresent: If a requested key is absent.
    """
    wanted = set(keys)
    total = len(wanted)
    report_progress = pb is not None
    position = 0
    # we don't care about inclusions, the caller cares.
    # but we need to setup a list of records to visit.
    # we need key, position, length
    for record in self.get_record_stream(wanted, 'unordered', True):
        # XXX: todo - optimise to use less than full texts.
        key = record.key
        if report_progress:
            pb.update('Walking content', position, total)
        position += 1
        if record.storage_kind == 'absent':
            raise errors.RevisionNotPresent(key, self)
        text = record.get_bytes_as('fulltext')
        for line in osutils.split_lines(text):
            yield line, key
    if report_progress:
        pb.update('Walking content', total, total)

1691

1692

def keys(self):
    """See VersionedFiles.keys.

    :return: A set holding the keys of self._index together with the keys
        of every entry in self._fallback_vfs.
    """
    if 'evil' in debug.debug_flags:
        trace.mutter_callsite(2, "keys scales with size of history")
    all_keys = set()
    for key_source in [self._index] + self._fallback_vfs:
        all_keys.update(key_source.keys())
    return all_keys

1701

1702

1703

class _GCGraphIndex(object):
    """Mapper from GroupCompressVersionedFiles needs into GraphIndex storage."""

    def __init__(self, graph_index, is_locked, parents=True,
        add_callback=None, track_external_parent_refs=False,
        inconsistency_fatal=True):
        """Construct a _GCGraphIndex on a graph_index.

        :param graph_index: An implementation of bzrlib.index.GraphIndex.
        :param is_locked: A callback, returns True if the index is locked and
            thus usable.
        :param parents: If True, record knits parents, if not do not record
            parents.
        :param add_callback: If not None, allow additions to the index and call
            this callback with a list of added GraphIndex nodes:
            [(node, value, node_refs), ...]
        :param track_external_parent_refs: As keys are added, keep track of the
            keys they reference, so that we can query get_missing_parents(),
            etc.
        :param inconsistency_fatal: When asked to add records that are already
            present, and the details are inconsistent with the existing
            record, raise an exception instead of warning (and skipping the
            record).
        """
        self._graph_index = graph_index
        self._is_locked = is_locked
        self._parents = parents
        self.has_graph = parents
        self._add_callback = add_callback
        self._inconsistency_fatal = inconsistency_fatal
        # Reference tracking is optional; None means "not tracking".
        self._key_dependencies = None
        if track_external_parent_refs:
            self._key_dependencies = knit._KeyRefs()

    def add_records(self, records, random_id=False):
        """Add multiple records to the index.

        Nothing is written by this method itself: the records are checked,
        possibly rewritten, and then handed to self._add_callback.

        :param records: (key, value, refs) tuples. When nothing has to be
            rewritten this object is iterated more than once and passed to
            the callback as-is, so it should be a list rather than a
            one-shot iterator.
        :param random_id: If True the ids being added were randomly generated
            and no check for existence will be performed.
        :raises errors.ReadOnlyError: If no add_callback was supplied.
        :raises errors.KnitCorrupt: If a record with parents is added to a
            parentless index, or (when inconsistency_fatal is set) a record
            is already present with different references.
        """
        if not self._add_callback:
            raise errors.ReadOnlyError(self)
        # we hope there are no repositories with inconsistent parentage
        # anymore.

        rewritten = False
        pending = {}
        for (key, value, refs) in records:
            if not self._parents and refs:
                for ref in refs:
                    if ref:
                        raise errors.KnitCorrupt(self,
                            "attempt to add node with parents "
                            "in parentless index.")
                # Only empty reference lists were given; drop them.
                refs = ()
                rewritten = True
            pending[key] = (value, refs)
        # check for dups
        if not random_id:
            for (index, key, value, node_refs) in self._get_entries(pending):
                new_details = pending[key]
                if node_refs != new_details[1]:
                    details = '%s %s %s' % (key, (value, node_refs),
                                            new_details)
                    if not self._inconsistency_fatal:
                        trace.warning("inconsistent details in skipped"
                                      " record: %s", details)
                    else:
                        raise errors.KnitCorrupt(
                            self,
                            "inconsistent details in add_records: %s"
                            % details)
                # Already present, so it must not be added a second time.
                del pending[key]
                rewritten = True
        if rewritten:
            # Rebuild the record list from what is left in pending.
            if self._parents:
                records = [(key, value, node_refs) for key, (value, node_refs)
                           in pending.iteritems()]
            else:
                records = [(key, value) for key, (value, node_refs)
                           in pending.iteritems()]
        tracker = self._key_dependencies
        if tracker is not None and self._parents:
            for key, value, refs in records:
                tracker.add_references(key, refs[0])
        self._add_callback(records)

    def _check_read(self):
        """Raise an exception if reads are not permitted."""
        if self._is_locked():
            return
        raise errors.ObjectNotLocked(self)

    def _check_write_ok(self):
        """Raise an exception if writes are not permitted."""
        if self._is_locked():
            return
        raise errors.ObjectNotLocked(self)

    def _get_entries(self, keys, check_present=False):
        """Get the entries for keys.

        Note: Callers are responsible for checking that the index is locked
        before calling this method.

        :param keys: An iterable of index key tuples.
        :param check_present: If True, raise errors.RevisionNotPresent once
            all found entries have been yielded and some key was not among
            them.
        :return: An iterator of 4-item entries; for a parentless index an
            empty tuple is supplied as the fourth item.
        """
        wanted = set(keys)
        seen = set()
        if not self._parents:
            # adapt parentless index to the rest of the code.
            for node in self._graph_index.iter_entries(wanted):
                yield node[0], node[1], node[2], ()
                seen.add(node[1])
        else:
            for node in self._graph_index.iter_entries(wanted):
                yield node
                seen.add(node[1])
        if check_present:
            absent = wanted.difference(seen)
            if absent:
                raise errors.RevisionNotPresent(absent.pop(), self)

    def get_parent_map(self, keys):
        """Get a map of the parents of keys.

        :param keys: The keys to look up parents for.
        :return: A mapping from keys to parents. Absent keys are absent from
            the mapping. For a parentless index every value is None.
        """
        self._check_read()
        parent_map = {}
        if not self._parents:
            for node in self._get_entries(keys):
                parent_map[node[1]] = None
        else:
            for node in self._get_entries(keys):
                parent_map[node[1]] = node[3][0]
        return parent_map

    def get_missing_parents(self):
        """Return the keys of missing parents.

        Uses self._key_dependencies, which is only set up when the index
        was constructed with track_external_parent_refs.
        """
        # Copied from _KnitGraphIndex.get_missing_parents
        # We may have false positives, so filter those out.
        tracker = self._key_dependencies
        present = self.get_parent_map(tracker.get_unsatisfied_refs())
        tracker.add_keys(present)
        return frozenset(tracker.get_unsatisfied_refs())

    def get_build_details(self, keys):
        """Get the various build details for keys.

        Ghosts are omitted from the result.

        :param keys: An iterable of keys.
        :return: A dict of key:
            (index_memo, compression_parent, parents, record_details).
            index_memo
                opaque structure to pass to read_records to extract the raw
                data
            compression_parent
                Content that this record is built upon; always None here
            parents
                Logical parents of this node (None for a parentless index)
            record_details
                extra information about the content which needs to be passed to
                Factory.parse_record; always ('group', None) here
        """
        self._check_read()
        details = {}
        for entry in self._get_entries(keys):
            if self._parents:
                parents = entry[3][0]
            else:
                parents = None
            details[entry[1]] = (self._node_to_position(entry),
                                 None, parents, ('group', None))
        return details

    def keys(self):
        """Get all the keys in the collection.

        The keys are not ordered.
        """
        self._check_read()
        found = []
        for node in self._graph_index.iter_all_entries():
            found.append(node[1])
        return found

    def _node_to_position(self, node):
        """Convert an index value to position details.

        :param node: An index entry whose third item is a string of four
            space separated integers.
        :return: (node[0], start, stop, basis_end, delta_end)
        """
        fields = node[2].split(' ')
        # It would be nice not to read the entire gzip.
        return (node[0], int(fields[0]), int(fields[1]), int(fields[2]),
                int(fields[3]))

    def scan_unvalidated_index(self, graph_index):
        """Inform this _GCGraphIndex that there is an unvalidated index.

        This allows this _GCGraphIndex to keep track of any missing
        compression parents we may want to have filled in to make those
        indices valid.

        :param graph_index: A GraphIndex
        """
        tracker = self._key_dependencies
        if tracker is None:
            # References are not being tracked, nothing to record.
            return
        # Add parent refs from graph_index (and discard parent refs that
        # the graph_index has).
        record_refs = tracker.add_references
        for node in graph_index.iter_all_entries():
            record_refs(node[1], node[3][0])

1926

1927

1928

1929

# Import the helpers from the _py module first, so that these names are bound
# even when the _pyx module below cannot be imported.
from bzrlib._groupcompress_py import (
    apply_delta,
    apply_delta_to_source,
    encode_base128_int,
    decode_base128_int,
    decode_copy_instruction,
    LinesDeltaIndex,
    )
# If the _pyx module (presumably the compiled Pyrex extension - confirm) can
# be imported, its helpers rebind the same-named ones imported above and
# GroupCompressor is PyrexGroupCompressor. If the import fails,
# GroupCompressor falls back to PythonGroupCompressor.
try:
    from bzrlib._groupcompress_pyx import (
        apply_delta,
        apply_delta_to_source,
        DeltaIndex,
        encode_base128_int,
        decode_base128_int,
        )
    GroupCompressor = PyrexGroupCompressor
except ImportError:
    GroupCompressor = PythonGroupCompressor

1948

Older »