@@ -23 +23 @@
 except ImportError:
+from bzrlib.lazy_import import lazy_import
+lazy_import(globals(), """
 from bzrlib import (
     graph as _mod_graph,
+from bzrlib.repofmt import pack_repo
 from bzrlib.btree_index import BTreeBuilder
 from bzrlib.lru_cache import LRUSizeCache
-from bzrlib.tsort import topo_sort
 from bzrlib.versionedfile import (
     AbsentContentFactory,
     ChunkedContentFactory,
     FulltextContentFactory,
+    VersionedFilesWithFallbacks,
 # Minimum number of uncompressed bytes to try fetch at once when retrieving
@@ -135 +142 @@
                 self._content = ''.join(self._content_chunks)
                 self._content_chunks = None
         if self._content is None:
-            if self._z_content is None:
+            # We join self._z_content_chunks here, because if we are
+            # decompressing, then it is *very* likely that we have a single
+            # chunk
+            if self._z_content_chunks is None:
                 raise AssertionError('No content to decompress')
-            if self._z_content == '':
+            z_content = ''.join(self._z_content_chunks)
+            if z_content == '':
                 self._content = ''
             elif self._compressor_name == 'lzma':
                 # We don't do partial lzma decomp yet
-                self._content = pylzma.decompress(self._z_content)
+                self._content = pylzma.decompress(z_content)
             elif self._compressor_name == 'zlib':
                 # Start a zlib decompressor
                 if num_bytes * 4 > self._content_length * 3:
                     # If we are requesting more than 3/4ths of the content,
                     # just extract the whole thing in a single pass
                     num_bytes = self._content_length
-                    self._content = zlib.decompress(self._z_content)
+                    self._content = zlib.decompress(z_content)
                 else:
                     self._z_content_decompressor = zlib.decompressobj()
                     # Seed the decompressor with the uncompressed bytes, so
                     # that the rest of the code is simplified
                     self._content = self._z_content_decompressor.decompress(
-                        self._z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
+                        z_content, num_bytes + _ZLIB_DECOMP_WINDOW)
                     if not self._z_content_decompressor.unconsumed_tail:
                         self._z_content_decompressor = None
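
The rewritten branch above preserves the partial-extraction optimisation: if a
caller wants most of the block it decompresses everything in one pass,
otherwise it keeps a live decompressor around for later. A minimal standalone
sketch of that zlib pattern (names here are illustrative, not bzrlib's):

    import zlib

    def read_prefix(z_bytes, num_bytes, window=32 * 1024):
        # Decompress only about num_bytes; whatever is not consumed stays
        # in decomp.unconsumed_tail so a later call can resume the stream.
        decomp = zlib.decompressobj()
        prefix = decomp.decompress(z_bytes, num_bytes + window)
        if not decomp.unconsumed_tail:
            decomp = None  # whole stream consumed; nothing to resume
        return prefix, decomp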
@@ -207 +218 @@
             # XXX: Define some GCCorrupt error ?
             raise AssertionError('Invalid bytes: (%d) != %d + %d' %
                                  (len(bytes), pos, self._z_content_length))
-        self._z_content = bytes[pos:]
+        self._z_content_chunks = (bytes[pos:],)
+
+    @property
+    def _z_content(self):
+        """Return z_content_chunks as a simple string.
+
+        Meant only to be used by the test suite.
+        """
+        if self._z_content_chunks is not None:
+            return ''.join(self._z_content_chunks)
+        return None
 
     @classmethod
     def from_bytes(cls, bytes):
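
The new `_z_content` property keeps the old single-string attribute readable
while the real storage moves to chunks. The same compatibility-shim pattern in
isolation (class and attribute names are illustrative):

    class Blob(object):
        """Store payload as chunks; expose the legacy joined view."""

        def __init__(self, chunks):
            self._chunks = list(chunks)

        @property
        def data(self):
            # Old callers (and tests) read .data as one string; join
            # lazily, only when someone actually asks for it.
            if self._chunks is not None:
                return ''.join(self._chunks)
            return None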
@@ -269 +290 @@
         self._content_length = length
         self._content_chunks = content_chunks
         self._content = None
-        self._z_content = None
+        self._z_content_chunks = None
 
     def set_content(self, content):
         """Set the content of this block."""
         self._content_length = len(content)
         self._content = content
-        self._z_content = None
+        self._z_content_chunks = None
 
     def _create_z_content_using_lzma(self):
         if self._content_chunks is not None:
             self._content = ''.join(self._content_chunks)
             self._content_chunks = None
         if self._content is None:
             raise AssertionError('Nothing to compress')
-        self._z_content = pylzma.compress(self._content)
-        self._z_content_length = len(self._z_content)
+        z_content = pylzma.compress(self._content)
+        self._z_content_chunks = (z_content,)
+        self._z_content_length = len(z_content)
 
-    def _create_z_content_from_chunks(self):
+    def _create_z_content_from_chunks(self, chunks):
         compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)
-        compressed_chunks = map(compressor.compress, self._content_chunks)
+        # Peak memory at this point is 1 fulltext, 1 compressed text, + zlib
+        # overhead (measured peak is maybe 30MB over the above...)
+        compressed_chunks = map(compressor.compress, chunks)
         compressed_chunks.append(compressor.flush())
-        self._z_content = ''.join(compressed_chunks)
-        self._z_content_length = len(self._z_content)
+        # Ignore empty chunks
+        self._z_content_chunks = [c for c in compressed_chunks if c]
+        self._z_content_length = sum(map(len, self._z_content_chunks))
 
     def _create_z_content(self):
-        if self._z_content is not None:
+        if self._z_content_chunks is not None:
             return
         if _USE_LZMA:
             self._create_z_content_using_lzma()
             return
         if self._content_chunks is not None:
-            self._create_z_content_from_chunks()
-        else:
-            self._z_content = zlib.compress(self._content)
-            self._z_content_length = len(self._z_content)
+            chunks = self._content_chunks
+        else:
+            chunks = (self._content,)
+        self._create_z_content_from_chunks(chunks)
 
-    def to_bytes(self):
-        """Encode the information into a byte stream."""
+    def to_chunks(self):
+        """Create the byte stream as a series of 'chunks'"""
         self._create_z_content()
         if _USE_LZMA:
             header = self.GCB_LZ_HEADER
         else:
             header = self.GCB_HEADER
-        chunks = [header,
-                  '%d\n%d\n' % (self._z_content_length, self._content_length),
-                  self._z_content,
-                 ]
+        chunks = ['%s%d\n%d\n'
+                  % (header, self._z_content_length, self._content_length),
+                 ]
+        chunks.extend(self._z_content_chunks)
+        total_len = sum(map(len, chunks))
+        return total_len, chunks
+
+    def to_bytes(self):
+        """Encode the information into a byte stream."""
+        total_len, chunks = self.to_chunks()
         return ''.join(chunks)
 
     def _dump(self, include_text=False):
@@ -435 +466 @@
             # Grab and cache the raw bytes for this entry
             # and break the ref-cycle with _manager since we don't need it
             # anymore
-            self._manager._prepare_for_extract()
+            try:
+                self._manager._prepare_for_extract()
+            except zlib.error as value:
+                raise errors.DecompressCorruption("zlib: " + str(value))
             block = self._manager._block
             self._bytes = block.extract(self.key, self._start, self._end)
             # There are code paths that first extract as fulltext, and then
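
Catching `zlib.error` here turns a codec-level failure into a domain error
(`errors.DecompressCorruption`) that callers can reasonably handle. The same
pattern reduced to its essentials (the exception class is illustrative):

    import zlib

    class CorruptPayload(Exception):
        """Raised when stored data cannot be decompressed."""

    def safe_decompress(z_bytes):
        # Callers should not need to know which codec the storage used.
        try:
            return zlib.decompress(z_bytes)
        except zlib.error as e:
            raise CorruptPayload("zlib: " + str(e))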
@@ -460 +494 @@
     _full_enough_block_size = 3*1024*1024 # size at which we won't repack
     _full_enough_mixed_block_size = 2*768*1024 # 1.5MB
 
-    def __init__(self, block):
+    def __init__(self, block, get_compressor_settings=None):
         self._block = block
         # We need to preserve the ordering
         self._factories = []
         self._last_byte = 0
+        self._get_settings = get_compressor_settings
+        self._compressor_settings = None
+
+    def _get_compressor_settings(self):
+        if self._compressor_settings is not None:
+            return self._compressor_settings
+        settings = None
+        if self._get_settings is not None:
+            settings = self._get_settings()
+        if settings is None:
+            vf = GroupCompressVersionedFiles
+            settings = vf._DEFAULT_COMPRESSOR_SETTINGS
+        self._compressor_settings = settings
+        return self._compressor_settings
 
     def add_factory(self, key, parents, start, end):
         if not self._factories:
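
`_get_compressor_settings` resolves its settings once: the injected callback
wins, class defaults fill in, and the answer is memoized. The same lazy lookup
in isolation (names illustrative):

    DEFAULTS = {'max_bytes_to_index': 1024 * 1024}

    class Manager(object):
        def __init__(self, get_settings=None):
            self._get_settings = get_settings
            self._settings = None

        def settings(self):
            # Resolve on first use and cache for every later call.
            if self._settings is None:
                settings = None
                if self._get_settings is not None:
                    settings = self._get_settings()
                self._settings = settings or DEFAULTS
            return self._settings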
@@ -503 +551 @@
         new_block.set_content(self._block._content[:last_byte])
         self._block = new_block
 
+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
+
     def _rebuild_block(self):
         """Create a new GroupCompressBlock with only the referenced texts."""
-        compressor = GroupCompressor()
+        compressor = self._make_group_compressor()
         tstart = time.time()
         old_length = self._block._content_length
@@ -523 +574 @@
         # block? It seems hard to come up with a method that it would
         # expand, since we do full compression again. Perhaps based on a
         # request that ends up poorly ordered?
+        # TODO: If the content would have expanded, then we would want to
+        #       handle a case where we need to split the block.
+        #       Now that we have a user-tweakable option
+        #       (max_bytes_to_index), it is possible that one person set it
+        #       to a very low value, causing poor compression.
         delta = time.time() - tstart
         self._block = new_block
         trace.mutter('creating new compressed block on-the-fly in %.3fs'
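
The new TODO points at the missing guard: a rebuild is kept even if it turned
out larger. A simplified sketch of the keep-only-if-smaller variant it hints
at (plain zlib stands in for the block compressor; this is not bzrlib's code):

    import time
    import zlib

    def rebuild_block(old_z_bytes, wanted_texts):
        # Recompress just the still-referenced texts; fall back to the
        # old block if the rebuild unexpectedly grew.
        tstart = time.time()
        new_z_bytes = zlib.compress(''.join(wanted_texts))
        print('rebuilt block in %.3fs' % (time.time() - tstart))
        if len(new_z_bytes) >= len(old_z_bytes):
            return old_z_bytes
        return new_z_bytes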
@@ -679 +735 @@
         z_header_bytes = zlib.compress(header_bytes)
         del header_bytes
         z_header_bytes_len = len(z_header_bytes)
-        block_bytes = self._block.to_bytes()
+        block_bytes_len, block_chunks = self._block.to_chunks()
         lines.append('%d\n%d\n%d\n' % (z_header_bytes_len, header_bytes_len,
                                        block_bytes_len))
         lines.append(z_header_bytes)
-        lines.append(block_bytes)
-        del z_header_bytes, block_bytes
+        lines.extend(block_chunks)
+        del z_header_bytes, block_chunks
+        # TODO: This is a point where we will double the memory consumption. To
+        #       avoid this, we probably have to switch to a 'chunked' api
         return ''.join(lines)
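
`_wire_bytes` now keeps the block as chunks and performs exactly one join, at
the very end. The framing itself, as a standalone sketch (function name
illustrative):

    import zlib

    def frame_message(header_bytes, block_chunks):
        # Lengths go first so the reader can carve the stream apart
        # without rescanning; the block stays chunked until the join.
        z_header = zlib.compress(header_bytes)
        block_len = sum(map(len, block_chunks))
        lines = ['%d\n%d\n%d\n' % (len(z_header), len(header_bytes),
                                   block_len),
                 z_header]
        lines.extend(block_chunks)
        return ''.join(lines)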
@@ -691 +749 @@
     def from_bytes(cls, bytes):
         # TODO: This does extra string copying, probably better to do it a
+        #       different way. At a minimum this creates 2 copies of the
+        #       compressed data
         (storage_kind, z_header_len, header_len,
          block_len, rest) = bytes.split('\n', 4)
@@ -757 +816 @@
         self.labels_deltas = {}
         self._delta_index = None # Set by the children
         self._block = GroupCompressBlock()
+        if settings is None:
+            self._settings = {}
+        else:
+            self._settings = settings
 
     def compress(self, key, bytes, expected_sha, nostore_sha=None, soft=False):
         """Compress lines with label key.
@@ -855 +918 @@
         After calling this, the compressor should no longer be used
-        # TODO: this causes us to 'bloat' to 2x the size of content in the
-        #       group. This has an impact for 'commit' of large objects.
-        #       One possibility is to use self._content_chunks, and be lazy
-        #       and only fill out self._content as a full string when we
-        #       actually need it. That would at least drop the peak memory
-        #       consumption for 'commit' down to ~1x the size of the largest
-        #       file, at a cost of increased complexity within this code.
-        #       2x is still << 3x the size of the largest file, so we are
-        #       doing ok.
         self._block.set_chunked_content(self.chunks, self.endpoint)
         self.chunks = None
         self._delta_index = None
@@ -886 +941 @@
 class PythonGroupCompressor(_CommonGroupCompressor):
 
-    def __init__(self):
+    def __init__(self, settings=None):
         """Create a GroupCompressor.
 
         Used only if the pyrex version is not available.
         """
-        super(PythonGroupCompressor, self).__init__()
+        super(PythonGroupCompressor, self).__init__(settings)
         self._delta_index = LinesDeltaIndex([])
         # The actual content is managed by LinesDeltaIndex
         self.chunks = self._delta_index.lines
@@ -934 +989 @@
     It contains code very similar to SequenceMatcher, because it has a similar
     task. However, some key differences apply:
-    - there is no junk, we want a minimal edit not a human readable diff.
-    - we don't filter very common lines (because we don't know where a good
-      range will start, and after the first text we want to be emitting minmal
-      edits
-    - we chain the left side, not the right side
-    - we incrementally update the adjacency matrix as new lines are provided.
-    - we look for matches in all of the left side, so the routine which does
-      the analagous task of find_longest_match does not need to filter on the
-      left side.
+
+    * there is no junk, we want a minimal edit not a human readable diff.
+    * we don't filter very common lines (because we don't know where a good
+      range will start, and after the first text we want to be emitting
+      minimal edits)
+    * we chain the left side, not the right side
+    * we incrementally update the adjacency matrix as new lines are provided.
+    * we look for matches in all of the left side, so the routine which does
+      the analogous task of find_longest_match does not need to filter on the
+      left side.
     """
 
-    def __init__(self):
-        super(PyrexGroupCompressor, self).__init__()
-        self._delta_index = DeltaIndex()
+    def __init__(self, settings=None):
+        super(PyrexGroupCompressor, self).__init__(settings)
+        max_bytes_to_index = self._settings.get('max_bytes_to_index', 0)
+        self._delta_index = DeltaIndex(max_bytes_to_index=max_bytes_to_index)
 
     def _compress(self, key, bytes, max_delta_size, soft=False):
         """see _CommonGroupCompressor._compress"""
@@ -1027 +1084 @@
         index = _GCGraphIndex(graph_index, lambda:True, parents=parents,
             add_callback=graph_index.add_nodes,
             inconsistency_fatal=inconsistency_fatal)
-        access = knit._DirectPackAccess({})
+        access = pack_repo._DirectPackAccess({})
         access.set_writer(writer, graph_index, (transport, 'newpack'))
         result = GroupCompressVersionedFiles(index, access, delta)
         result.stream = stream
@@ -1044 +1101 @@
 class _BatchingBlockFetcher(object):
     """Fetch group compress blocks in batches.
 
     :ivar total_bytes: expected number of bytes needed to fetch the
         currently pending batch.
     """
 
-    def __init__(self, gcvf, locations):
+    def __init__(self, gcvf, locations, get_compressor_settings=None):
         self.gcvf = gcvf
         self.locations = locations
@@ -1102 +1160 @@
     def yield_factories(self, full_flush=False):
         """Yield factories for keys added since the last yield. They will be
         returned in the order they were added via add_key.
 
         :param full_flush: by default, some results may not be returned in case
             they can be part of the next batch. If full_flush is True, then
             all results are returned.
         """
@@ -1136 +1194 @@
                     memos_to_get_stack.pop()
                 else:
                     block = self.batch_memos[read_memo]
-                self.manager = _LazyGroupContentManager(block)
+                self.manager = _LazyGroupContentManager(block,
+                    get_compressor_settings=self._get_compressor_settings)
                 self.last_read_memo = read_memo
             start, end = index_memo[3:5]
             self.manager.add_factory(key, parents, start, end)
@@ -1149 +1208 @@
         self.total_bytes = 0
@@ -1152 +1211 @@
-class GroupCompressVersionedFiles(VersionedFiles):
+class GroupCompressVersionedFiles(VersionedFilesWithFallbacks):
     """A group-compress based VersionedFiles implementation."""
 
+    # This controls how the GroupCompress DeltaIndex works. Basically, we
+    # compute hash pointers into the source blocks (so hash(text) => text).
+    # However each of these references costs some memory in trade against a
+    # more accurate match result. For very large files, they either are
+    # pre-compressed and change in bulk whenever they change, or change in just
+    # local blocks. Either way, 'improved resolution' is not very helpful,
+    # versus running out of memory trying to track everything. The default max
+    # gives 100% sampling of a 1MB file.
+    _DEFAULT_MAX_BYTES_TO_INDEX = 1024 * 1024
+    _DEFAULT_COMPRESSOR_SETTINGS = {'max_bytes_to_index':
+                                        _DEFAULT_MAX_BYTES_TO_INDEX}
+
-    def __init__(self, index, access, delta=True, _unadded_refs=None):
+    def __init__(self, index, access, delta=True, _unadded_refs=None,
+                 _group_cache=None):
         """Create a GroupCompressVersionedFiles object.
 
         :param index: The index object storing access and graph data.
         :param access: The access object storing raw data.
         :param delta: Whether to delta compress or just entropy compress.
         :param _unadded_refs: private parameter, don't use.
+        :param _group_cache: private parameter, don't use.
         """
         self._index = index
         self._access = access
         self._delta = delta
         if _unadded_refs is None:
             _unadded_refs = {}
         self._unadded_refs = _unadded_refs
-        self._group_cache = LRUSizeCache(max_size=50*1024*1024)
-        self._fallback_vfs = []
+        if _group_cache is None:
+            _group_cache = LRUSizeCache(max_size=50*1024*1024)
+        self._group_cache = _group_cache
+        self._immediate_fallback_vfs = []
+        self._max_bytes_to_index = None
 
     def without_fallbacks(self):
         """Return a clone of this object without any fallbacks configured."""
         return GroupCompressVersionedFiles(self._index, self._access,
-            self._delta, _unadded_refs=dict(self._unadded_refs))
+            self._delta, _unadded_refs=dict(self._unadded_refs),
+            _group_cache=self._group_cache)
 
     def add_lines(self, key, parents, lines, parent_texts=None,
         left_matching_blocks=None, nostore_sha=None, random_id=False,
         check_content=True):
        """Add a text to the store.
@@ -1182 +1259 @@
         :param key: The key tuple of the text to add.
         :param parents: The parents key tuples of the text to add.
         :param lines: A list of lines. Each line must be a bytestring. And all
-            of them except the last must be terminated with \n and contain no
-            other \n's. The last line may either contain no \n's or a single
-            terminating \n. If the lines list does meet this constraint the add
-            routine may error or may succeed - but you will be unable to read
-            the data back accurately. (Checking the lines have been split
+            of them except the last must be terminated with \\n and contain no
+            other \\n's. The last line may either contain no \\n's or a single
+            terminating \\n. If the lines list does not meet this constraint,
+            the add routine may error or may succeed - but you will be unable
+            to read the data back accurately. (Checking the lines have been
+            split
             correctly is expensive and extremely unlikely to catch bugs so it
             is not done at runtime unless check_content is True.)
         :param parent_texts: An optional dictionary containing the opaque
@@ -1287 +1364 @@
         self._check_lines_not_unicode(lines)
         self._check_lines_are_lines(lines)
 
-    def get_known_graph_ancestry(self, keys):
-        """Get a KnownGraph instance with the ancestry of keys."""
-        # Note that this is identical to
-        # KnitVersionedFiles.get_known_graph_ancestry, but they don't share
-        # it.
-        parent_map, missing_keys = self._index.find_ancestry(keys)
-        for fallback in self._fallback_vfs:
-            if not missing_keys:
-                break
-            (f_parent_map, f_missing_keys) = fallback._index.find_ancestry(
-                missing_keys)
-            parent_map.update(f_parent_map)
-            missing_keys = f_missing_keys
-        kg = _mod_graph.KnownGraph(parent_map)
-        return kg
 
     def get_parent_map(self, keys):
         """Get a map of the graph parents of keys.
@@ -1447 +1508 @@
         The returned objects should be in the order defined by 'ordering',
         which can weave between different sources.
 
         :param ordering: Must be one of 'topological' or 'groupcompress'
         :return: List of [(source, [keys])] tuples, such that all keys are in
             the defined order, regardless of source.
         """
         if ordering == 'topological':
-            present_keys = topo_sort(parent_map)
+            present_keys = tsort.topo_sort(parent_map)
         else:
             # ordering == 'groupcompress'
             # XXX: This only optimizes for the target ordering. We may need
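
`tsort.topo_sort` takes a {key: parents} mapping and returns keys with parents
strictly before children, which is what the 'topological' ordering needs. A
tiny usage sketch:

    from bzrlib import tsort

    # For this chain the result is fully determined: ['A', 'B', 'C'].
    order = tsort.topo_sort({'A': (), 'B': ('A',), 'C': ('B',)})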
@@ -1546 +1608 @@
         #  - we encounter an unadded ref, or
         #  - we run out of keys, or
         #  - the total bytes to retrieve for this batch > BATCH_SIZE
-        batcher = _BatchingBlockFetcher(self, locations)
+        batcher = _BatchingBlockFetcher(self, locations,
+            get_compressor_settings=self._get_compressor_settings)
         for source, keys in source_keys:
             if source is self:
                 for key in keys:
@@ -1598 +1661 @@
         for _ in self._insert_record_stream(stream, random_id=False):
             pass
 
+    def _get_compressor_settings(self):
+        if self._max_bytes_to_index is None:
+            # TODO: VersionedFiles don't know about their containing
+            #       repository, so they don't have much of an idea about their
+            #       location. So for now, this is only a global option.
+            c = config.GlobalConfig()
+            val = c.get_user_option('bzr.groupcompress.max_bytes_to_index')
+            if val is not None:
+                try:
+                    val = int(val)
+                except ValueError, e:
+                    trace.warning('Value for '
+                                  '"bzr.groupcompress.max_bytes_to_index"'
+                                  ' %r is not an integer'
+                                  % (val,))
+                    val = None
+            if val is None:
+                val = self._DEFAULT_MAX_BYTES_TO_INDEX
+            self._max_bytes_to_index = val
+        return {'max_bytes_to_index': self._max_bytes_to_index}
+
+    def _make_group_compressor(self):
+        return GroupCompressor(self._get_compressor_settings())
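
For users this is a plain global option; assuming the default GlobalConfig
location (typically ~/.bazaar/bazaar.conf), it would be set as:

    [DEFAULT]
    bzr.groupcompress.max_bytes_to_index = 2097152

As the code above shows, a non-integer value is warned about and replaced by
the 1MB default rather than failing the operation.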
@@ -1601 +1688 @@
     def _insert_record_stream(self, stream, random_id=False, nostore_sha=None,
                               reuse_blocks=True):
         """Internal core to insert a record stream into this container.
@@ -1627 +1714 @@
         # This will go up to fulltexts for gc to gc fetching, which isn't
-        self._compressor = GroupCompressor()
+        self._compressor = self._make_group_compressor()
         self._unadded_refs = {}
         keys_to_add = []
         def flush():
-            bytes = self._compressor.flush().to_bytes()
-            self._compressor = GroupCompressor()
+            bytes_len, chunks = self._compressor.flush().to_chunks()
+            self._compressor = self._make_group_compressor()
+            # Note: At this point we still have 1 copy of the fulltext (in
+            #       record and the var 'bytes'), and this generates 2 copies of
+            #       the compressed text (one for bytes, one in chunks)
+            # TODO: Push 'chunks' down into the _access api, so that we don't
+            #       have to double compressed memory here
+            # TODO: Figure out how to indicate that we would be happy to free
+            #       the fulltext content at this point. Note that sometimes we
+            #       will want it later (streaming CHK pages), but most of the
+            #       time we won't (everything else)
+            bytes = ''.join(chunks)
+            del chunks
             index, start, length = self._access.add_raw_records(
                 [(None, len(bytes))], bytes)[0]
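
The reworked `flush` keeps the group chunked until `_access` forces a single
string, so the join is the very last step. Condensed (write_fn stands in for
the access layer; this is not bzrlib's API):

    def flush_group(compressor, write_fn):
        # Per the TODOs above, pushing chunks into the access layer
        # would remove even this final copy of the compressed text.
        bytes_len, chunks = compressor.flush().to_chunks()
        data = ''.join(chunks)
        del chunks
        write_fn(data)
        return bytes_len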
@@ -1802 +1900 @@
         """See VersionedFiles.keys."""
         if 'evil' in debug.debug_flags:
             trace.mutter_callsite(2, "keys scales with size of history")
-        sources = [self._index] + self._fallback_vfs
+        sources = [self._index] + self._immediate_fallback_vfs
         result = set()
         for source in sources:
             result.update(source.keys())
@@ -1891 +1989 @@
         # repeated over and over, this creates a surplus of ints
         self._int_cache = {}
         if track_external_parent_refs:
-            self._key_dependencies = knit._KeyRefs(
+            self._key_dependencies = _KeyRefs(
                 track_new_keys=track_new_keys)
         else:
             self._key_dependencies = None
@@ -2037 +2135 @@
         :param keys: An iterable of keys.
         :return: A dict of key:
             (index_memo, compression_parent, parents, record_details).
-            index_memo
-                opaque structure to pass to read_records to extract the raw
-                data
-            compression_parent
-                Content that this record is built upon, may be None
-            parents
-                Logical parents of this node
-            record_details
-                extra information about the content which needs to be passed
-                to Factory.parse_record
+
+            * index_memo: opaque structure to pass to read_records to extract
+              the raw data
+            * compression_parent: Content that this record is built upon, may
+              be None
+            * parents: Logical parents of this node
+            * record_details: extra information about the content which needs
+              to be passed to Factory.parse_record
         """
         self._check_read()