 except ImportError:
 from bzrlib.lazy_import import lazy_import
 lazy_import(globals(), """
 from bzrlib import (
     graph as _mod_graph,
+from bzrlib.repofmt import pack_repo

 from bzrlib.btree_index import BTreeBuilder
 from bzrlib.lru_cache import LRUSizeCache
-from bzrlib.tsort import topo_sort
 from bzrlib.versionedfile import (
     AbsentContentFactory,
     ChunkedContentFactory,
     FulltextContentFactory,
+    VersionedFilesWithFallbacks,

 # Minimum number of uncompressed bytes to try to fetch at once when retrieving
                 self._content = ''.join(self._content_chunks)
                 self._content_chunks = None
         if self._content is None:
-            if self._z_content is None:
+            # We join self._z_content_chunks here, because if we are
+            # decompressing, then it is *very* likely that we have a single
+            if self._z_content_chunks is None:
                 raise AssertionError('No content to decompress')
-            if self._z_content == '':
+            z_content = ''.join(self._z_content_chunks)
                 self._content = ''
             elif self._compressor_name == 'lzma':
                 # We don't do partial lzma decomp yet
-                self._content = pylzma.decompress(self._z_content)
+                self._content = pylzma.decompress(z_content)
             elif self._compressor_name == 'zlib':
                 # Start a zlib decompressor
                 if num_bytes * 4 > self._content_length * 3:
                     # If we are requesting more than 3/4ths of the content,
                     # just extract the whole thing in a single pass
                     num_bytes = self._content_length
-                    self._content = zlib.decompress(self._z_content)
+                    self._content = zlib.decompress(z_content)
                     self._z_content_decompressor = zlib.decompressobj()
                     # Seed the decompressor with the uncompressed bytes, so
                     # that the rest of the code is simplified
                     self._content = self._z_content_decompressor.decompress(
-                        self._z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
+                        z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
                     if not self._z_content_decompressor.unconsumed_tail:
                         self._z_content_decompressor = None
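# Illustrative sketch (not part of this change): the partial-decompression
# pattern used above, shown standalone.  A zlib decompressobj is asked for
# only num_bytes (plus a slack window) of output; compressed input it did not
# need is left in unconsumed_tail.  An empty unconsumed_tail means the whole
# stream was decoded, so the decompressor can be dropped.  The window value
# below is assumed to match the module-level _ZLIB_DECOMP_WINDOW constant.
import zlib

_ZLIB_DECOMP_WINDOW = 32 * 1024

full_text = 'some repeated content\n' * 5000
z_content = zlib.compress(full_text)

num_bytes = 100          # how much plaintext the caller needs right now
decompressor = zlib.decompressobj()
partial = decompressor.decompress(z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
assert full_text.startswith(partial)
if not decompressor.unconsumed_tail:
    # All compressed input was consumed, so 'partial' is already the full
    # text and there is no point keeping the decompressor around.
    decompressor = None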
             # XXX: Define some GCCorrupt error ?
             raise AssertionError('Invalid bytes: (%d) != %d + %d' %
                                  (len(bytes), pos, self._z_content_length))
-        self._z_content = bytes[pos:]
+        self._z_content_chunks = (bytes[pos:],)

+    def _z_content(self):
+        """Return z_content_chunks as a simple string.
+        Meant only to be used by the test suite.
+        if self._z_content_chunks is not None:
+            return ''.join(self._z_content_chunks)

     def from_bytes(cls, bytes):

         self._content_length = length
         self._content_chunks = content_chunks
         self._content = None
-        self._z_content = None
+        self._z_content_chunks = None

     def set_content(self, content):
         """Set the content of this block."""
         self._content_length = len(content)
         self._content = content
-        self._z_content = None
+        self._z_content_chunks = None

     def _create_z_content_using_lzma(self):
         if self._content_chunks is not None:
             self._content_chunks = None
         if self._content is None:
             raise AssertionError('Nothing to compress')
-        self._z_content = pylzma.compress(self._content)
-        self._z_content_length = len(self._z_content)
+        z_content = pylzma.compress(self._content)
+        self._z_content_chunks = (z_content,)
+        self._z_content_length = len(z_content)

-    def _create_z_content_from_chunks(self):
+    def _create_z_content_from_chunks(self, chunks):
         compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
-        compressed_chunks = map(compressor.compress, self._content_chunks)
+        # Peak at this point is 1 fulltext, 1 compressed text, + zlib overhead
+        # (measured peak is maybe 30MB over the above...)
+        compressed_chunks = map(compressor.compress, chunks)
         compressed_chunks.append(compressor.flush())
-        self._z_content = ''.join(compressed_chunks)
-        self._z_content_length = len(self._z_content)
+        # Ignore empty chunks
+        self._z_content_chunks = [c for c in compressed_chunks if c]
+        self._z_content_length = sum(map(len, self._z_content_chunks))
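# Illustrative sketch (not part of this change): compressing a list of chunks
# with a single compressobj, as the new _create_z_content_from_chunks does.
# Feeding the chunks one by one avoids first joining them into one large
# fulltext string; empty outputs are dropped because compressobj.compress()
# frequently returns '' while its internal buffer fills.
import zlib

chunks = ['first chunk\n', 'second chunk\n' * 100, 'third chunk\n']
compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
compressed_chunks = map(compressor.compress, chunks)
compressed_chunks.append(compressor.flush())
z_content_chunks = [c for c in compressed_chunks if c]
z_content_length = sum(map(len, z_content_chunks))
# Round trip: joining the kept chunks yields a complete zlib stream.
assert zlib.decompress(''.join(z_content_chunks)) == ''.join(chunks)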
     def _create_z_content(self):
-        if self._z_content is not None:
+        if self._z_content_chunks is not None:
             self._create_z_content_using_lzma()
         if self._content_chunks is not None:
-            self._create_z_content_from_chunks()
-        self._z_content = zlib.compress(self._content)
-        self._z_content_length = len(self._z_content)
+            chunks = self._content_chunks
+            chunks = (self._content,)
+        self._create_z_content_from_chunks(chunks)

-        """Encode the information into a byte stream."""
+        """Create the byte stream as a series of 'chunks'"""
         self._create_z_content()
             header = self.GCB_LZ_HEADER
             header = self.GCB_HEADER
-                  '%d\n%d\n' % (self._z_content_length, self._content_length),
+        chunks = ['%s%d\n%d\n'
+                  % (header, self._z_content_length, self._content_length),
+        chunks.extend(self._z_content_chunks)
+        total_len = sum(map(len, chunks))
+        return total_len, chunks

+        """Encode the information into a byte stream."""
+        total_len, chunks = self.to_chunks()
         return ''.join(chunks)

     def _dump(self, include_text=False):
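# Illustrative sketch (not part of this change, assumes the patched
# bzrlib.groupcompress module): the intended relationship between the new
# to_chunks() and the rewritten to_bytes(), using a block whose content is
# set directly.  to_bytes() is now just a join over to_chunks(), so callers
# that can work with a chunk list avoid one large intermediate string.
from bzrlib.groupcompress import GroupCompressBlock

block = GroupCompressBlock()
block.set_content('some text worth storing\n' * 50)
total_len, chunks = block.to_chunks()
assert total_len == sum(map(len, chunks))
assert ''.join(chunks) == block.to_bytes()
# chunks[0] is the '%s%d\n%d\n' header (format marker, compressed length,
# content length); the remaining chunks hold the zlib-compressed content.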
     _full_enough_block_size = 3*1024*1024 # size at which we won't repack
     _full_enough_mixed_block_size = 2*768*1024 # 1.5MB

-    def __init__(self, block):
+    def __init__(self, block, get_compressor_settings=None):
         self._block = block
         # We need to preserve the ordering
         self._factories = []
         self._last_byte = 0
+        self._get_settings = get_compressor_settings
+        self._compressor_settings = None

+    def _get_compressor_settings(self):
+        if self._compressor_settings is not None:
+            return self._compressor_settings
+        if self._get_settings is not None:
+            settings = self._get_settings()
+            vf = GroupCompressVersionedFiles
+            settings = vf._DEFAULT_COMPRESSOR_SETTINGS
+        self._compressor_settings = settings
+        return self._compressor_settings

     def add_factory(self, key, parents, start, end):
         if not self._factories:

         new_block.set_content(self._block._content[:last_byte])
         self._block = new_block

+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
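# Illustrative sketch (not part of this change, assumes the patched
# bzrlib.groupcompress module): compressor settings reach
# _LazyGroupContentManager as a zero-argument callback and are memoized on
# first use, so any (possibly config-reading) lookup is deferred until a
# block actually has to be recompressed.
from bzrlib.groupcompress import GroupCompressBlock, _LazyGroupContentManager

block = GroupCompressBlock()
manager = _LazyGroupContentManager(
    block, get_compressor_settings=lambda: {'max_bytes_to_index': 64 * 1024})
settings = manager._get_compressor_settings()      # callback invoked here
assert manager._get_compressor_settings() is settings   # cached afterwards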
     def _rebuild_block(self):
         """Create a new GroupCompressBlock with only the referenced texts."""
-        compressor = GroupCompressor()
+        compressor = self._make_group_compressor()
         tstart = time.time()
         old_length = self._block._content_length

         # block? It seems hard to come up with a method that it would
         # expand, since we do full compression again. Perhaps based on a
         # request that ends up poorly ordered?
+        # TODO: If the content would have expanded, then we would want to
+        #       handle a case where we need to split the block.
+        #       Now that we have a user-tweakable option
+        #       (max_bytes_to_index), it is possible that one person set it
+        #       to a very low value, causing poor compression.
         delta = time.time() - tstart
         self._block = new_block
         trace.mutter('creating new compressed block on-the-fly in %.3fs'

         z_header_bytes = zlib.compress(header_bytes)
         z_header_bytes_len = len(z_header_bytes)
-        block_bytes = self._block.to_bytes()
+        block_bytes_len, block_chunks = self._block.to_chunks()
         lines.append('%d\n%d\n%d\n' % (z_header_bytes_len, header_bytes_len,
         lines.append(z_header_bytes)
-        lines.append(block_bytes)
-        del z_header_bytes, block_bytes
+        lines.extend(block_chunks)
+        del z_header_bytes, block_chunks
+        # TODO: This is a point where we will double the memory consumption. To
+        #       avoid this, we probably have to switch to a 'chunked' api
         return ''.join(lines)

     def from_bytes(cls, bytes):
         # TODO: This does extra string copying, probably better to do it a
+        #       different way. At a minimum this creates 2 copies of the
         (storage_kind, z_header_len, header_len,
          block_len, rest) = bytes.split('\n', 4)
         self.labels_deltas = {}
         self._delta_index = None # Set by the children
         self._block = GroupCompressBlock()
+            self._settings = settings

     def compress(self, key, bytes, expected_sha, nostore_sha=None, soft=False):
         """Compress lines with label key.

         After calling this, the compressor should no longer be used
-        # TODO: this causes us to 'bloat' to 2x the size of content in the
-        #       group. This has an impact for 'commit' of large objects.
-        #       One possibility is to use self._content_chunks, and be lazy and
-        #       only fill out self._content as a full string when we actually
-        #       need it. That would at least drop the peak memory consumption
-        #       for 'commit' down to ~1x the size of the largest file, at a
-        #       cost of increased complexity within this code. 2x is still <<
-        #       3x the size of the largest file, so we are doing ok.
         self._block.set_chunked_content(self.chunks, self.endpoint)
         self.chunks = None
         self._delta_index = None

 class PythonGroupCompressor(_CommonGroupCompressor):

+    def __init__(self, settings=None):
         """Create a GroupCompressor.

         Used only if the pyrex version is not available.
-        super(PythonGroupCompressor, self).__init__()
+        super(PythonGroupCompressor, self).__init__(settings)
         self._delta_index = LinesDeltaIndex([])
         # The actual content is managed by LinesDeltaIndex
         self.chunks = self._delta_index.lines
     It contains code very similar to SequenceMatcher because of having a similar
     task. However, some key differences apply:
-    - there is no junk, we want a minimal edit not a human readable diff.
-    - we don't filter very common lines (because we don't know where a good
-      range will start, and after the first text we want to be emitting minimal
-    - we chain the left side, not the right side
-    - we incrementally update the adjacency matrix as new lines are provided.
-    - we look for matches in all of the left side, so the routine which does
-      the analogous task of find_longest_match does not need to filter on the
+    * there is no junk, we want a minimal edit not a human readable diff.
+    * we don't filter very common lines (because we don't know where a good
+      range will start, and after the first text we want to be emitting minimal
+    * we chain the left side, not the right side
+    * we incrementally update the adjacency matrix as new lines are provided.
+    * we look for matches in all of the left side, so the routine which does
+      the analogous task of find_longest_match does not need to filter on the

-        super(PyrexGroupCompressor, self).__init__()
-        self._delta_index = DeltaIndex()
+    def __init__(self, settings=None):
+        super(PyrexGroupCompressor, self).__init__(settings)
+        max_bytes_to_index = self._settings.get('max_bytes_to_index', 0)
+        self._delta_index = DeltaIndex(max_bytes_to_index=max_bytes_to_index)
     def _compress(self, key, bytes, max_delta_size, soft=False):
         """see _CommonGroupCompressor._compress"""

         index = _GCGraphIndex(graph_index, lambda:True, parents=parents,
             add_callback=graph_index.add_nodes,
             inconsistency_fatal=inconsistency_fatal)
-        access = knit._DirectPackAccess({})
+        access = pack_repo._DirectPackAccess({})
         access.set_writer(writer, graph_index, (transport, 'newpack'))
         result = GroupCompressVersionedFiles(index, access, delta)
         result.stream = stream
 class _BatchingBlockFetcher(object):
     """Fetch group compress blocks in batches.

     :ivar total_bytes: int of expected number of bytes needed to fetch the
         currently pending batch.

-    def __init__(self, gcvf, locations):
+    def __init__(self, gcvf, locations, get_compressor_settings=None):
         self.gcvf = gcvf
         self.locations = locations

     def yield_factories(self, full_flush=False):
         """Yield factories for keys added since the last yield. They will be
         returned in the order they were added via add_key.

         :param full_flush: by default, some results may not be returned in case
             they can be part of the next batch. If full_flush is True, then
             all results are returned.

                     memos_to_get_stack.pop()
                     block = self.batch_memos[read_memo]
-                self.manager = _LazyGroupContentManager(block)
+                self.manager = _LazyGroupContentManager(block,
+                    get_compressor_settings=self._get_compressor_settings)
                 self.last_read_memo = read_memo
             start, end = index_memo[3:5]
             self.manager.add_factory(key, parents, start, end)

         self.total_bytes = 0
-class GroupCompressVersionedFiles(VersionedFiles):
+class GroupCompressVersionedFiles(VersionedFilesWithFallbacks):
     """A group-compress based VersionedFiles implementation."""

-    def __init__(self, index, access, delta=True, _unadded_refs=None):
+    # This controls how the GroupCompress DeltaIndex works. Basically, we
+    # compute hash pointers into the source blocks (so hash(text) => text).
+    # However, each of these references costs some memory in trade against a
+    # more accurate match result. For very large files, they either are
+    # pre-compressed and change in bulk whenever they change, or change in just
+    # local blocks. Either way, 'improved resolution' is not very helpful,
+    # versus running out of memory trying to track everything. The default max
+    # gives 100% sampling of a 1MB file.
+    _DEFAULT_MAX_BYTES_TO_INDEX = 1024 * 1024
+    _DEFAULT_COMPRESSOR_SETTINGS = {'max_bytes_to_index':
+                                    _DEFAULT_MAX_BYTES_TO_INDEX}
+    def __init__(self, index, access, delta=True, _unadded_refs=None,
         """Create a GroupCompressVersionedFiles object.

         :param index: The index object storing access and graph data.
         :param access: The access object storing raw data.
         :param delta: Whether to delta compress or just entropy compress.
         :param _unadded_refs: private parameter, don't use.
+        :param _group_cache: private parameter, don't use.
         self._index = index
         self._access = access
         if _unadded_refs is None:
             _unadded_refs = {}
         self._unadded_refs = _unadded_refs
-        self._group_cache = LRUSizeCache(max_size=50*1024*1024)
-        self._fallback_vfs = []
+        if _group_cache is None:
+            _group_cache = LRUSizeCache(max_size=50*1024*1024)
+        self._group_cache = _group_cache
+        self._immediate_fallback_vfs = []
+        self._max_bytes_to_index = None

     def without_fallbacks(self):
         """Return a clone of this object without any fallbacks configured."""
         return GroupCompressVersionedFiles(self._index, self._access,
-            self._delta, _unadded_refs=dict(self._unadded_refs))
+            self._delta, _unadded_refs=dict(self._unadded_refs),
+            _group_cache=self._group_cache)
     def add_lines(self, key, parents, lines, parent_texts=None,
                   left_matching_blocks=None, nostore_sha=None, random_id=False,

         :param key: The key tuple of the text to add.
         :param parents: The parents key tuples of the text to add.
         :param lines: A list of lines. Each line must be a bytestring. And all
-            of them except the last must be terminated with \n and contain no
-            other \n's. The last line may either contain no \n's or a single
-            terminating \n. If the lines list does not meet this constraint the add
-            routine may error or may succeed - but you will be unable to read
-            the data back accurately. (Checking the lines have been split
+            of them except the last must be terminated with \\n and contain no
+            other \\n's. The last line may either contain no \\n's or a single
+            terminating \\n. If the lines list does not meet this constraint the
+            add routine may error or may succeed - but you will be unable to
+            read the data back accurately. (Checking the lines have been split
             correctly is expensive and extremely unlikely to catch bugs so it
             is not done at runtime unless check_content is True.)
         :param parent_texts: An optional dictionary containing the opaque
         self._check_lines_not_unicode(lines)
         self._check_lines_are_lines(lines)

-    def get_known_graph_ancestry(self, keys):
-        """Get a KnownGraph instance with the ancestry of keys."""
-        # Note that this is identical to
-        # KnitVersionedFiles.get_known_graph_ancestry, but they don't share
-        parent_map, missing_keys = self._index.find_ancestry(keys)
-        for fallback in self._fallback_vfs:
-            if not missing_keys:
-            (f_parent_map, f_missing_keys) = fallback._index.find_ancestry(
-            parent_map.update(f_parent_map)
-            missing_keys = f_missing_keys
-        kg = _mod_graph.KnownGraph(parent_map)

     def get_parent_map(self, keys):
         """Get a map of the graph parents of keys.
         The returned objects should be in the order defined by 'ordering',
         which can weave between different sources.

         :param ordering: Must be one of 'topological' or 'groupcompress'
         :return: List of [(source, [keys])] tuples, such that all keys are in
             the defined order, regardless of source.

         if ordering == 'topological':
-            present_keys = topo_sort(parent_map)
+            present_keys = tsort.topo_sort(parent_map)
             # ordering == 'groupcompress'
             # XXX: This only optimizes for the target ordering. We may need

         # - we encounter an unadded ref, or
         # - we run out of keys, or
         # - the total bytes to retrieve for this batch > BATCH_SIZE
-        batcher = _BatchingBlockFetcher(self, locations)
+        batcher = _BatchingBlockFetcher(self, locations,
+            get_compressor_settings=self._get_compressor_settings)
         for source, keys in source_keys:
             if source is self:
                 for key in keys:

         for _ in self._insert_record_stream(stream, random_id=False):
+    def _get_compressor_settings(self):
+        if self._max_bytes_to_index is None:
+            # TODO: VersionedFiles don't know about their containing
+            #       repository, so they don't have much of an idea about their
+            #       location. So for now, this is only a global option.
+            c = config.GlobalConfig()
+            val = c.get_user_option('bzr.groupcompress.max_bytes_to_index')
+                except ValueError, e:
+                    trace.warning('Value for '
+                                  '"bzr.groupcompress.max_bytes_to_index"'
+                                  ' %r is not an integer'
+                val = self._DEFAULT_MAX_BYTES_TO_INDEX
+            self._max_bytes_to_index = val
+        return {'max_bytes_to_index': self._max_bytes_to_index}

+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
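# Illustrative sketch (not part of this change): how the new global option
# reaches the compressor.  The value is read once from the user's bazaar.conf
# via GlobalConfig, cached on the versionedfiles object, and handed down as a
# plain settings dict.  The 'vf' shown in the comments is a hypothetical
# GroupCompressVersionedFiles instance.
from bzrlib import config

c = config.GlobalConfig()
raw = c.get_user_option('bzr.groupcompress.max_bytes_to_index')
# 'raw' is the configured string (or None).  With e.g.
#   bzr.groupcompress.max_bytes_to_index = 2097152
# in bazaar.conf, 'vf' would then answer:
#   vf._get_compressor_settings() == {'max_bytes_to_index': 2097152}
# and vf._make_group_compressor() builds a GroupCompressor from that dict.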
     def _insert_record_stream(self, stream, random_id=False, nostore_sha=None,
                               reuse_blocks=True):
         """Internal core to insert a record stream into this container.

         # This will go up to fulltexts for gc to gc fetching, which isn't
-        self._compressor = GroupCompressor()
+        self._compressor = self._make_group_compressor()
         self._unadded_refs = {}
         keys_to_add = []

-            bytes = self._compressor.flush().to_bytes()
-            self._compressor = GroupCompressor()
+            bytes_len, chunks = self._compressor.flush().to_chunks()
+            self._compressor = self._make_group_compressor()
+            # Note: At this point we still have 1 copy of the fulltext (in
+            #       record and the var 'bytes'), and this generates 2 copies of
+            #       the compressed text (one for bytes, one in chunks)
+            # TODO: Push 'chunks' down into the _access api, so that we don't
+            #       have to double compressed memory here
+            # TODO: Figure out how to indicate that we would be happy to free
+            #       the fulltext content at this point. Note that sometimes we
+            #       will want it later (streaming CHK pages), but most of the
+            #       time we won't (everything else)
+            bytes = ''.join(chunks)
             index, start, length = self._access.add_raw_records(
                 [(None, len(bytes))], bytes)[0]
         """See VersionedFiles.keys."""
         if 'evil' in debug.debug_flags:
             trace.mutter_callsite(2, "keys scales with size of history")
-        sources = [self._index] + self._fallback_vfs
+        sources = [self._index] + self._immediate_fallback_vfs
         for source in sources:
             result.update(source.keys())
+class _GCBuildDetails(object):
+    """A blob of data about the build details.

+    This stores the minimal data, which then allows compatibility with the old
+    api, without taking as much memory.

+    __slots__ = ('_index', '_group_start', '_group_end', '_basis_end',
+                 '_delta_end', '_parents')

+    compression_parent = None

+    def __init__(self, parents, position_info):
+        self._parents = parents
+        (self._index, self._group_start, self._group_end, self._basis_end,
+         self._delta_end) = position_info

+        return '%s(%s, %s)' % (self.__class__.__name__,
+            self.index_memo, self._parents)

+    def index_memo(self):
+        return (self._index, self._group_start, self._group_end,
+                self._basis_end, self._delta_end)

+    def record_details(self):
+        return static_tuple.StaticTuple(self.method, None)

+    def __getitem__(self, offset):
+        """Compatibility thunk to act like a tuple."""
+        return self.index_memo
+        return self.compression_parent # Always None
+        return self._parents
+        return self.record_details
+        raise IndexError('offset out of range')
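# Illustrative sketch (not part of this change, assumes the new
# _GCBuildDetails class above with its 'group' method attribute): the object
# stands in for the old 4-tuple of (index_memo, compression_parent, parents,
# record_details), so callers that still index into the tuple keep working.
# The position_info values below are arbitrary placeholders.
from bzrlib.groupcompress import _GCBuildDetails

details = _GCBuildDetails(parents=(('file-id', 'rev-1'),),
                          position_info=('index', 0, 100, 0, 100))
assert details[0] == details.index_memo == ('index', 0, 100, 0, 100)
assert details[1] is None                  # compression_parent is always None
assert details[2] == (('file-id', 'rev-1'),)
# details[3] is the record_details StaticTuple, e.g. ('group', None).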
 class _GCGraphIndex(object):
     """Mapper from GroupCompressVersionedFiles needs into GraphIndex storage."""

         # repeated over and over, this creates a surplus of ints
         self._int_cache = {}
         if track_external_parent_refs:
-            self._key_dependencies = knit._KeyRefs(
+            self._key_dependencies = _KeyRefs(
                 track_new_keys=track_new_keys)
             self._key_dependencies = None

         :param keys: An iterable of keys.
         :return: A dict of key:
             (index_memo, compression_parent, parents, record_details).
-                opaque structure to pass to read_records to extract the raw
-                Content that this record is built upon, may be None
-                Logical parents of this node
-                extra information about the content which needs to be passed to
-                Factory.parse_record
+            * index_memo: opaque structure to pass to read_records to extract
+            * compression_parent: Content that this record is built upon, may
+            * parents: Logical parents of this node
+            * record_details: extra information about the content which needs
+              to be passed to Factory.parse_record
         self._check_read()
         # each, or about 7MB. Note that it might be even more when you consider
         # how PyInt is allocated in separate slabs. And you can't return a slab
         # to the OS if even 1 int on it is in use. Note though that Python uses
-        # a LIFO when re-using PyInt slots, which probably causes more
+        # a LIFO when re-using PyInt slots, which might cause more
         # fragmentation.
         start = int(bits[0])
         start = self._int_cache.setdefault(start, start)
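# Illustrative sketch (not part of this change): the _int_cache above is a
# plain interning dict.  dict.setdefault returns the int object already
# stored for an equal value, so repeated offsets parsed out of the index
# share a single PyInt instead of allocating a fresh one per row.
_int_cache = {}

def _intern_int(value, _cache=_int_cache):
    # Store on first sight, return the stored object ever after.
    return _cache.setdefault(value, value)

a = _intern_int(int('12345'))
b = _intern_int(int('12345'))
assert a == b and a is b    # equal values collapse to one object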