~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/groupcompress.py

Committer: Vincent Ladeuil
Date: 2017-01-30 14:30:10 UTC
mfrom: (6615.3.7 merges)
mto: This revision was merged to the branch mainline in revision 6621.
Revision ID: v.ladeuil+lp@free.fr-20170130143010-p31t1ranfeqbaeki

Merge 2.7 into trunk including fix for bug #1657238

files added:
.testr.conf

MANIFEST.in

NEWS

README_BDIST_RPM

apport

apport/README

apport/bzr-crashdb.conf

apport/source_bzr.py

bzrlib/_export_c_api.h

bzrlib/_import_c_api.h

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.h

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_termcolor.py

bzrlib/branchfmt

bzrlib/branchfmt/__init__.py

bzrlib/branchfmt/fullhistory.py

bzrlib/bzr_distutils.py

bzrlib/cethread.py

bzrlib/cleanup.py

bzrlib/cmd_test_script.py

bzrlib/cmdline.py

bzrlib/controldir.py

bzrlib/crash.py

bzrlib/doc_generate/conf.py

bzrlib/estimate_compressed_size.py

bzrlib/export_pot.py

bzrlib/filter_tree.py

bzrlib/help_topics/en/url-special-chars.txt

bzrlib/help_topics/es

bzrlib/i18n.py

bzrlib/library_state.py

bzrlib/mergetools.py

bzrlib/plugins/bash_completion

bzrlib/plugins/bash_completion/README.txt

bzrlib/plugins/bash_completion/__init__.py

bzrlib/plugins/bash_completion/bashcomp.py

bzrlib/plugins/bash_completion/tests

bzrlib/plugins/bash_completion/tests/__init__.py

bzrlib/plugins/bash_completion/tests/test_bashcomp.py

bzrlib/plugins/changelog_merge

bzrlib/plugins/changelog_merge/__init__.py

bzrlib/plugins/changelog_merge/changelog_merge.py

bzrlib/plugins/changelog_merge/tests

bzrlib/plugins/changelog_merge/tests/__init__.py

bzrlib/plugins/changelog_merge/tests/test_changelog_merge.py

bzrlib/plugins/grep

bzrlib/plugins/grep/.bzrignore

bzrlib/plugins/grep/NEWS

bzrlib/plugins/grep/__init__.py

bzrlib/plugins/grep/cmds.py

bzrlib/plugins/grep/grep.py

bzrlib/plugins/grep/test_grep.py

bzrlib/plugins/launchpad/cmds.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_api_lite.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/launchpad/test_lp_api_lite.py

bzrlib/plugins/news_merge

bzrlib/plugins/news_merge/README

bzrlib/plugins/news_merge/__init__.py

bzrlib/plugins/news_merge/news_merge.py

bzrlib/plugins/news_merge/parser.py

bzrlib/plugins/news_merge/tests

bzrlib/plugins/news_merge/tests/__init__.py

bzrlib/plugins/news_merge/tests/test_news_merge.py

bzrlib/plugins/po_merge

bzrlib/plugins/po_merge/README

bzrlib/plugins/po_merge/__init__.py

bzrlib/plugins/po_merge/po_merge.py

bzrlib/plugins/po_merge/tests

bzrlib/plugins/po_merge/tests/__init__.py

bzrlib/plugins/po_merge/tests/test_po_merge.py

bzrlib/plugins/weave_fmt

bzrlib/plugins/weave_fmt/__init__.py

bzrlib/plugins/weave_fmt/branch.py

bzrlib/plugins/weave_fmt/bzrdir.py

bzrlib/plugins/weave_fmt/test_bzrdir.py

bzrlib/plugins/weave_fmt/test_repository.py

bzrlib/plugins/weave_fmt/test_workingtree.py

bzrlib/plugins/weave_fmt/tests

bzrlib/plugins/weave_fmt/workingtree.py

bzrlib/pyutils.py

bzrlib/recordcounter.py

bzrlib/repofmt/knitpack_repo.py

bzrlib/smart/ping.py

bzrlib/smart/signals.py

bzrlib/static_tuple.py

bzrlib/tests/blackbox/test_branches.py

bzrlib/tests/blackbox/test_config.py

bzrlib/tests/blackbox/test_deleted.py

bzrlib/tests/blackbox/test_export_pot.py

bzrlib/tests/blackbox/test_lookup_revision.py

bzrlib/tests/blackbox/test_mkdir.py

bzrlib/tests/blackbox/test_ping.py

bzrlib/tests/blackbox/test_remember_option.py

bzrlib/tests/blackbox/test_repair_workingtree.py

bzrlib/tests/blackbox/test_resolve.py

bzrlib/tests/blackbox/test_rmbranch.py

bzrlib/tests/blackbox/test_script.py

bzrlib/tests/blackbox/test_shell_complete.py

bzrlib/tests/blackbox/test_verify_signatures.py

bzrlib/tests/commands/test_revert.py

bzrlib/tests/features.py

bzrlib/tests/fixtures.py

bzrlib/tests/matchers.py

bzrlib/tests/per_branch/test_config.py

bzrlib/tests/per_bzrdir

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_controldir/test_format.py

bzrlib/tests/per_controldir_colo

bzrlib/tests/per_controldir_colo/__init__.py

bzrlib/tests/per_controldir_colo/test_supported.py

bzrlib/tests/per_controldir_colo/test_unsupported.py

bzrlib/tests/per_foreign_vcs

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_foreign_vcs/test_repository.py

bzrlib/tests/per_interbranch/test_copy_content_into.py

bzrlib/tests/per_interbranch/test_fetch.py

bzrlib/tests/per_interbranch/test_get.py

bzrlib/tests/per_intertree/test_file_content_matches.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_repository/test_file_graph.py

bzrlib/tests/per_repository/test_signatures.py

bzrlib/tests/per_repository_reference/test__make_parents_provider.py

bzrlib/tests/per_repository_reference/test_commit_with_stacking.py

bzrlib/tests/per_repository_reference/test_graph.py

bzrlib/tests/per_repository_vf

bzrlib/tests/per_repository_vf/__init__.py

bzrlib/tests/per_repository_vf/test_check.py

bzrlib/tests/per_repository_vf/test_fetch.py

bzrlib/tests/per_repository_vf/test_fileid_involved.py

bzrlib/tests/per_repository_vf/test_merge_directive.py

bzrlib/tests/per_repository_vf/test_reconcile.py

bzrlib/tests/per_repository_vf/test_refresh_data.py

bzrlib/tests/per_repository_vf/test_repository.py

bzrlib/tests/per_repository_vf/test_write_group.py

bzrlib/tests/per_tree/test_export.py

bzrlib/tests/per_tree/test_ids.py

bzrlib/tests/per_tree/test_is_executable.py

bzrlib/tests/per_tree/test_locking.py

bzrlib/tests/per_uifactory

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_check_state.py

bzrlib/tests/per_workingtree/test_symlinks.py

bzrlib/tests/scenarios.py

bzrlib/tests/script.py

bzrlib/tests/test__btree_serializer.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test_cethread.py

bzrlib/tests/test_cleanup.py

bzrlib/tests/test_cmdline.py

bzrlib/tests/test_controldir.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_estimate_compressed_size.py

bzrlib/tests/test_export_pot.py

bzrlib/tests/test_features.py

bzrlib/tests/test_filter_tree.py

bzrlib/tests/test_fixtures.py

bzrlib/tests/test_https_urllib.py

bzrlib/tests/test_i18n.py

bzrlib/tests/test_import_tariff.py

bzrlib/tests/test_library_state.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_matchers.py

bzrlib/tests/test_mergetools.py

bzrlib/tests/test_patches_data/binary-after-normal.patch

bzrlib/tests/test_patches_data/binary.patch

bzrlib/tests/test_pyutils.py

bzrlib/tests/test_scenarios.py

bzrlib/tests/test_script.py

bzrlib/tests/test_server.py

bzrlib/tests/test_smart_signals.py

bzrlib/tests/test_test_server.py

bzrlib/tests/test_treeshape.py

bzrlib/tests/test_url_policy_open.py

bzrlib/tests/test_utextwrap.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_vf_search.py

bzrlib/tests/testui.py

bzrlib/transport/gio_transport.py

bzrlib/transport/pathfilter.py

bzrlib/url_policy_open.py

bzrlib/utextwrap.py

bzrlib/vf_repository.py

bzrlib/vf_search.py

bzrlib/workingtree_3.py

contrib/bash/bzr

contrib/debian

contrib/debian/default

contrib/debian/init.d

contrib/zsh/README

doc/Bazaar-Logo-For-Manuals.png

doc/developers/_static

doc/developers/_static/bzr icon 16.png

doc/developers/_static/bzr-doc.css

doc/developers/_static/bzr.ico

doc/developers/_templates

doc/developers/_templates/layout.html

doc/developers/apport.txt

doc/developers/check.txt

doc/developers/code-review.txt

doc/developers/code-style.txt

doc/developers/conf.py

doc/developers/configuration.txt

doc/developers/content-filtering.txt

doc/developers/contribution-quickstart.txt

doc/developers/documenting-changes.txt

doc/developers/feature-flags.txt

doc/developers/fetch.txt

doc/developers/implementation-notes.txt

doc/developers/index-plain.txt

doc/developers/miscellaneous-notes.txt

doc/developers/nested-trees.txt

doc/developers/new-config-rationale.txt

doc/developers/plans.txt

doc/developers/principles.txt

doc/developers/specifications.txt

doc/developers/transports.txt

doc/developers/ui.txt

doc/developers/win32_build_setup.txt

doc/developers/xdg_config_spec.txt

doc/en/admin-guide/advanced.txt

doc/en/admin-guide/backup.txt

doc/en/admin-guide/code-browsing.txt

doc/en/admin-guide/hooks-plugins.txt

doc/en/admin-guide/index-plain.txt

doc/en/admin-guide/integration.txt

doc/en/admin-guide/introduction.txt

doc/en/admin-guide/licence.txt

doc/en/admin-guide/migration.txt

doc/en/admin-guide/other-setups.txt

doc/en/admin-guide/security.txt

doc/en/admin-guide/simple-setups.txt

doc/en/admin-guide/upgrade.txt

doc/en/release-notes/bzr-0.1.txt

doc/en/release-notes/bzr-0.10.txt

doc/en/release-notes/bzr-0.11.txt

doc/en/release-notes/bzr-0.12.txt

doc/en/release-notes/bzr-0.13.txt

doc/en/release-notes/bzr-0.14.txt

doc/en/release-notes/bzr-0.15.txt

doc/en/release-notes/bzr-0.16.txt

doc/en/release-notes/bzr-0.17.txt

doc/en/release-notes/bzr-0.18.txt

doc/en/release-notes/bzr-0.6.txt

doc/en/release-notes/bzr-0.7.txt

doc/en/release-notes/bzr-0.8.txt

doc/en/release-notes/bzr-0.9.txt

doc/en/release-notes/bzr-0.90.txt

doc/en/release-notes/bzr-0.91.txt

doc/en/release-notes/bzr-0.92.txt

doc/en/release-notes/bzr-1.0.txt

doc/en/release-notes/bzr-1.1.txt

doc/en/release-notes/bzr-1.10.txt

doc/en/release-notes/bzr-1.11.txt

doc/en/release-notes/bzr-1.12.txt

doc/en/release-notes/bzr-1.13.txt

doc/en/release-notes/bzr-1.14.txt

doc/en/release-notes/bzr-1.15.txt

doc/en/release-notes/bzr-1.16.txt

doc/en/release-notes/bzr-1.17.txt

doc/en/release-notes/bzr-1.18.txt

doc/en/release-notes/bzr-1.2.txt

doc/en/release-notes/bzr-1.3.txt

doc/en/release-notes/bzr-1.4.txt

doc/en/release-notes/bzr-1.5.txt

doc/en/release-notes/bzr-1.6.txt

doc/en/release-notes/bzr-1.7.txt

doc/en/release-notes/bzr-1.8.txt

doc/en/release-notes/bzr-1.9.txt

doc/en/release-notes/bzr-2.0.txt

doc/en/release-notes/bzr-2.1.txt

doc/en/release-notes/bzr-2.2.txt

doc/en/release-notes/bzr-2.4.txt

doc/en/release-notes/bzr-2.5.txt

doc/en/release-notes/bzr-2.6.txt

doc/en/release-notes/bzr-2.7.txt

doc/en/release-notes/bzr-2.8.txt

doc/en/release-notes/release-template.txt

doc/en/release-notes/series-template.txt

doc/en/tutorials/licence.txt

doc/en/upgrade-guide/licence.txt

doc/en/user-guide/gpg_signatures.txt

doc/en/user-guide/index-plain.txt

doc/en/user-guide/licence.txt

doc/en/user-guide/switch_store.txt

doc/en/whats-new

doc/en/whats-new/template.txt

doc/en/whats-new/whats-new-in-2.1.txt

doc/en/whats-new/whats-new-in-2.2.txt

doc/en/whats-new/whats-new-in-2.3.txt

doc/en/whats-new/whats-new-in-2.4.txt

doc/en/whats-new/whats-new-in-2.5.txt

doc/en/whats-new/whats-new-in-2.6.txt

doc/en/whats-new/whats-new-in-2.7.txt

doc/en/whats-new/whats-new-in-2.8.txt

doc/es/_static

doc/es/_static/bzr icon 16.png

doc/es/_static/bzr.ico

doc/es/_static/es

doc/es/_templates

doc/es/_templates/layout.html

doc/es/conf.py

doc/es/quick-reference/index.txt

doc/es/user-guide/index-plain.txt

doc/index.es.txt

doc/index.ja.txt

doc/index.ru.txt

doc/ja

doc/ja/_static

doc/ja/_static/bzr icon 16.png

doc/ja/_static/bzr.ico

doc/ja/_templates

doc/ja/conf.py

doc/ja/index.txt

doc/ja/mini-tutorial

doc/ja/mini-tutorial/index.txt

doc/ja/tutorials

doc/ja/tutorials/centralized_workflow.txt

doc/ja/tutorials/index.txt

doc/ja/tutorials/licence.txt

doc/ja/tutorials/tutorial.txt

doc/ja/tutorials/using_bazaar_with_launchpad.txt

doc/ja/upgrade-guide

doc/ja/upgrade-guide/data_migration.txt

doc/ja/upgrade-guide/index.txt

doc/ja/upgrade-guide/overview.txt

doc/ja/upgrade-guide/tips_and_tricks.txt

doc/ja/user-guide

doc/ja/user-guide/adv_merging.txt

doc/ja/user-guide/annotating_changes.txt

doc/ja/user-guide/bazaar_workflows.txt

doc/ja/user-guide/branching_a_project.txt

doc/ja/user-guide/browsing_history.txt

doc/ja/user-guide/bug_trackers.txt

doc/ja/user-guide/bzrtools_plugin.txt

doc/ja/user-guide/central_intro.txt

doc/ja/user-guide/configuring_bazaar.txt

doc/ja/user-guide/controlling_registration.txt

doc/ja/user-guide/core_concepts.txt

doc/ja/user-guide/distributed_intro.txt

doc/ja/user-guide/entering_commands.txt

doc/ja/user-guide/filtered_views.txt

doc/ja/user-guide/getting_help.txt

doc/ja/user-guide/hooks.txt

doc/ja/user-guide/http_smart_server.txt

doc/ja/user-guide/images

doc/ja/user-guide/images/workflows_centralized.png

doc/ja/user-guide/images/workflows_centralized.svg

doc/ja/user-guide/images/workflows_gatekeeper.png

doc/ja/user-guide/images/workflows_gatekeeper.svg

doc/ja/user-guide/images/workflows_localcommit.png

doc/ja/user-guide/images/workflows_localcommit.svg

doc/ja/user-guide/images/workflows_peer.png

doc/ja/user-guide/images/workflows_peer.svg

doc/ja/user-guide/images/workflows_pqm.png

doc/ja/user-guide/images/workflows_pqm.svg

doc/ja/user-guide/images/workflows_shared.png

doc/ja/user-guide/images/workflows_shared.svg

doc/ja/user-guide/images/workflows_single.png

doc/ja/user-guide/images/workflows_single.svg

doc/ja/user-guide/index-plain.txt

doc/ja/user-guide/index.txt

doc/ja/user-guide/installing_bazaar.txt

doc/ja/user-guide/introducing_bazaar.txt

doc/ja/user-guide/licence.txt

doc/ja/user-guide/merging_changes.txt

doc/ja/user-guide/organizing_branches.txt

doc/ja/user-guide/organizing_your_workspace.txt

doc/ja/user-guide/part2_intro.txt

doc/ja/user-guide/partner_intro.txt

doc/ja/user-guide/plugins.txt

doc/ja/user-guide/publishing_a_branch.txt

doc/ja/user-guide/recording_changes.txt

doc/ja/user-guide/releasing_a_project.txt

doc/ja/user-guide/resolving_conflicts.txt

doc/ja/user-guide/reusing_a_checkout.txt

doc/ja/user-guide/reviewing_changes.txt

doc/ja/user-guide/sending_changes.txt

doc/ja/user-guide/server.txt

doc/ja/user-guide/setting_up_email.txt

doc/ja/user-guide/shared_repository_layouts.txt

doc/ja/user-guide/shelving_changes.txt

doc/ja/user-guide/solo_intro.txt

doc/ja/user-guide/specifying_revisions.txt

doc/ja/user-guide/stacked.txt

doc/ja/user-guide/starting_a_project.txt

doc/ja/user-guide/svn_plugin.txt

doc/ja/user-guide/undoing_mistakes.txt

doc/ja/user-guide/using_aliases.txt

doc/ja/user-guide/using_checkouts.txt

doc/ja/user-guide/using_gatekeepers.txt

doc/ja/user-guide/version_info.txt

doc/ja/user-guide/web_browsing.txt

doc/ja/user-guide/working_offline_central.txt

doc/ja/user-guide/writing_a_plugin.txt

doc/ja/user-guide/zen.txt

doc/ja/user-reference

doc/ja/user-reference/index.txt

doc/ru/_static

doc/ru/_static/bzr icon 16.png

doc/ru/_static/bzr.ico

doc/ru/_static/ru

doc/ru/_templates

doc/ru/_templates/layout.html

doc/ru/conf.py

doc/ru/quick-reference/index.txt

doc/ru/user-guide/index-plain.txt

po/ar.po

po/ast.po

po/bs.po

po/bzr.pot

po/ca.po

po/cs.po

po/de.po

po/el.po

po/en_AU.po

po/en_GB.po

po/es.po

po/fa.po

po/fo.po

po/fr.po

po/gl.po

po/he.po

po/id.po

po/it.po

po/ja.po

po/ko.po

po/ms.po

po/my.po

po/nb.po

po/nl.po

po/oc.po

po/pl.po

po/pt_BR.po

po/ro.po

po/ru.po

po/sco.po

po/si.po

po/sk.po

po/sr.po

po/sv.po

po/tr.po

po/ug.po

po/uk.po

po/vi.po

po/zh_CN.po

tools/fixed-in.py

tools/generate_release_notes.py

tools/package_docs.py

tools/packaging/update-control.sh

tools/subunit-sum

tools/win32/py2exe_boot_common.py

files removed:
bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_tags.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/deprecated_graph.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/textui.py

bzrlib/util/bencode.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/weave_commands.py

contrib/add-bzr-to-baz

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/zsh/_bzr

doc/BUILD-NOTES

doc/_static/en/quick-reference

doc/bazaar-vcs.org.kid

doc/en/developer-guide

doc/en/migration

doc/en/migration/index.txt

doc/en/user-guide/index.txt

doc/es/developer-guide

doc/es/release-notes

doc/es/user-reference

tools/biobench.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/trace-revisions

tools/weavebench.py

files renamed:
bzrlib/sign_my_commits.py => bzrlib/commit_signature_commands.py

bzrlib/help_topics/en/conflicts.txt => bzrlib/help_topics/en/conflict-types.txt

doc/es/user-guide/resolving_conflicts.txt => bzrlib/help_topics/es/conflict-types.txt

bzrlib/repofmt/weaverepo.py => bzrlib/plugins/weave_fmt/repository.py

bzrlib/xml4.py => bzrlib/plugins/weave_fmt/xml4.py

bzrlib/tests/per_bzrdir/ => bzrlib/tests/per_controldir/

bzrlib/tests/per_bzrdir/test_bzrdir.py => bzrlib/tests/per_controldir/test_controldir.py

bzrlib/tests/test_pack_repository.py => bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository/test_is_write_locked.py => bzrlib/tests/per_repository/test_locking.py

bzrlib/tests/per_repository/helpers.py => bzrlib/tests/per_repository_vf/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py => bzrlib/tests/per_repository_vf/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py => bzrlib/tests/per_repository_vf/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_check_reconcile.py => bzrlib/tests/per_repository_vf/test_check_reconcile.py

bzrlib/tests/per_repository/test_find_text_key_references.py => bzrlib/tests/per_repository_vf/test_find_text_key_references.py

bzrlib/tests/test_versionedfile.py => bzrlib/tests/per_versionedfile.py

bzrlib/tests/test_bencode.py => bzrlib/tests/test__bencode.py

doc/en/developer-guide/HACKING.txt => doc/developers/HACKING.txt

doc/Makefile => doc/en/Makefile

doc/_static/ => doc/en/_static/

doc/_static/en/quick-reference/Makefile => doc/en/_static/en/Makefile

doc/_static/en/quick-reference/bzr-quick-reference.pdf => doc/en/_static/en/bzr-en-quick-reference.pdf

doc/_static/en/quick-reference/bzr-quick-reference.png => doc/en/_static/en/bzr-en-quick-reference.png

doc/_static/en/quick-reference/bzr-quick-reference.svg => doc/en/_static/en/bzr-en-quick-reference.svg

doc/_templates/ => doc/en/_templates/

doc/conf.py => doc/en/conf.py

doc/contents.txt => doc/en/index.txt

doc/make.bat => doc/en/make.bat

NEWS => doc/en/release-notes/bzr-2.3.txt

doc/en/user-guide/index-for-2x.txt => doc/en/user-guide/index.txt

doc/es/quick-reference/Makefile => doc/es/_static/es/Makefile

doc/es/quick-reference/quick-start-summary.pdf => doc/es/_static/es/bzr-es-quick-reference.pdf

doc/es/quick-reference/quick-start-summary.png => doc/es/_static/es/bzr-es-quick-reference.png

doc/es/quick-reference/quick-start-summary.svg => doc/es/_static/es/bzr-es-quick-reference.svg

doc/index.es.txt => doc/es/index.txt

doc/ru/quick-reference/Makefile => doc/ru/_static/ru/Makefile

doc/ru/quick-reference/quick-start-summary.pdf => doc/ru/_static/ru/bzr-ru-quick-reference.pdf

doc/ru/quick-reference/quick-start-summary.png => doc/ru/_static/ru/bzr-ru-quick-reference.png

doc/ru/quick-reference/quick-start-summary.svg => doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/index.ru.txt => doc/ru/index.txt

files modified:
.bzrignore

COPYING.txt

INSTALL

Makefile

README

bzrlib/__init__.py

bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_dirstate_helpers_py.py

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.h

bzrlib/delta.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/https_server.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_controldir/__init__.py

bzrlib/tests/per_controldir/test_push.py

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/__init__.py

bzrlib/util/_bencode_py.py

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/simplemapi.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/default.css

doc/developers/add.txt

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/bug-handling.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/dirstate.txt

doc/developers/ec2.txt

doc/developers/groupcompress-design.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/initial-push-pull.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/packrepo.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/revision-properties.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/update.txt

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide/index.txt

doc/en/mini-tutorial/index.txt

doc/en/quick-reference/index.txt

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/index.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-guide/zen.txt

doc/en/user-reference/readme.txt

doc/es/mini-tutorial/index.txt

doc/es/user-guide/index.txt

doc/es/user-guide/version_info.txt

doc/index.txt

doc/ru/mini-tutorial/index.txt

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/zen.txt

profile_imports.py

setup.py

tools/check-newsbugs.py

tools/generate_docs.py

tools/packaging/build-packages.sh

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/win32/bazaar.url

tools/win32/build_release.py

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/info.txt

tools/win32/start_bzr.bat

Show diffs side-by-side

added added

removed removed

bzrlib/groupcompress.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

"""Core compression logic for compressing streams of related files."""

from __future__ import absolute_import

import time

import zlib

try:

import pylzma

except ImportError:

pylzma = None

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import (

annotate,

config,

debug,

errors,

graph as _mod_graph,

knit,

osutils,

pack,

static_tuple,

trace,

tsort,

)

from bzrlib.graph import Graph

from bzrlib.repofmt import pack_repo

from bzrlib.i18n import gettext

""")

from bzrlib.btree_index import BTreeBuilder

from bzrlib.lru_cache import LRUSizeCache

from bzrlib.tsort import topo_sort

from bzrlib.versionedfile import (

_KeyRefs,

adapter_registry,

AbsentContentFactory,

ChunkedContentFactory,

FulltextContentFactory,

VersionedFiles,

VersionedFilesWithFallbacks,

)

_USE_LZMA = False and (pylzma is not None)

# Minimum number of uncompressed bytes to try fetch at once when retrieving

# groupcompress blocks.

BATCH_SIZE = 2**16

# osutils.sha_string('')

_null_sha1 = 'da39a3ee5e6b4b0d3255bfef95601890afd80709'

def sort_gc_optimal(parent_map):

"""Sort and group the keys in parent_map into groupcompress order.

# groupcompress ordering is approximately reverse topological,

# properly grouped by file-id.

per_prefix_map = {}

for item in parent_map.iteritems():

key = item[0]

for key, value in parent_map.iteritems():

if isinstance(key, str) or len(key) == 1:

prefix = ''

else:

prefix = key[0]

try:

per_prefix_map[prefix].append(item)

per_prefix_map[prefix][key] = value

except KeyError:

per_prefix_map[prefix] = [item]

per_prefix_map[prefix] = {key: value}

present_keys = []

for prefix in sorted(per_prefix_map):

present_keys.extend(reversed(topo_sort(per_prefix_map[prefix])))

present_keys.extend(reversed(tsort.topo_sort(per_prefix_map[prefix])))

return present_keys

105

def __init__(self):

100

106

# map by key? or just order in file?

101

107

self._compressor_name = None

102

self._z_content = None

108

self._z_content_chunks = None

103

109

self._z_content_decompressor = None

104

110

self._z_content_length = None

105

111

self._content_length = None

118

124

:param num_bytes: Ensure that we have extracted at least num_bytes of

119

125

content. If None, consume everything

120

126

"""

121

# TODO: If we re-use the same content block at different times during

122

# get_record_stream(), it is possible that the first pass will

123

# get inserted, triggering an extract/_ensure_content() which

124

# will get rid of _z_content. And then the next use of the block

125

# will try to access _z_content (to send it over the wire), and

126

# fail because it is already extracted. Consider never releasing

127

# _z_content because of this.

127

if self._content_length is None:

128

raise AssertionError('self._content_length should never be None')

128

129

if num_bytes is None:

129

130

num_bytes = self._content_length

130

131

elif (self._content_length is not None

138

139

self._content = ''.join(self._content_chunks)

139

140

self._content_chunks = None

140

141

if self._content is None:

141

if self._z_content is None:

142

# We join self._z_content_chunks here, because if we are

143

# decompressing, then it is *very* likely that we have a single

144

# chunk

145

if self._z_content_chunks is None:

142

146

raise AssertionError('No content to decompress')

143

if self._z_content == '':

147

z_content = ''.join(self._z_content_chunks)

148

if z_content == '':

144

149

self._content = ''

145

150

elif self._compressor_name == 'lzma':

146

151

# We don't do partial lzma decomp yet

147

self._content = pylzma.decompress(self._z_content)

152

import pylzma

153

self._content = pylzma.decompress(z_content)

148

154

elif self._compressor_name == 'zlib':

149

155

# Start a zlib decompressor

150

if num_bytes is None:

151

self._content = zlib.decompress(self._z_content)

156

if num_bytes * 4 > self._content_length * 3:

157

# If we are requesting more than 3/4ths of the content,

158

# just extract the whole thing in a single pass

159

num_bytes = self._content_length

160

self._content = zlib.decompress(z_content)

152

161

else:

153

162

self._z_content_decompressor = zlib.decompressobj()

154

163

# Seed the decompressor with the uncompressed bytes, so

155

164

# that the rest of the code is simplified

156

165

self._content = self._z_content_decompressor.decompress(

157

self._z_content, num_bytes + _ZLIB_DECOMP_WINDOW)

166

z_content, num_bytes + _ZLIB_DECOMP_WINDOW)

167

if not self._z_content_decompressor.unconsumed_tail:

168

self._z_content_decompressor = None

158

169

else:

159

170

raise AssertionError('Unknown compressor: %r'

160

171

% self._compressor_name)

162

173

# 'unconsumed_tail'

163

174

164

175

# Do we have enough bytes already?

165

if num_bytes is not None and len(self._content) >= num_bytes:

166

return

167

if num_bytes is None and self._z_content_decompressor is None:

168

# We must have already decompressed everything

176

if len(self._content) >= num_bytes:

169

177

return

170

178

# If we got this far, and don't have a decompressor, something is wrong

171

179

if self._z_content_decompressor is None:

172

180

raise AssertionError(

173

181

'No decompressor to decompress %d bytes' % num_bytes)

174

182

remaining_decomp = self._z_content_decompressor.unconsumed_tail

175

if num_bytes is None:

176

if remaining_decomp:

177

# We don't know how much is left, but we'll decompress it all

178

self._content += self._z_content_decompressor.decompress(

179

remaining_decomp)

180

# Note: There's what I consider a bug in zlib.decompressobj

181

# If you pass back in the entire unconsumed_tail, only

182

# this time you don't pass a max-size, it doesn't

183

# change the unconsumed_tail back to None/''.

184

# However, we know we are done with the whole stream

185

self._z_content_decompressor = None

186

# XXX: Why is this the only place in this routine we set this?

187

self._content_length = len(self._content)

188

else:

189

if not remaining_decomp:

190

raise AssertionError('Nothing left to decompress')

191

needed_bytes = num_bytes - len(self._content)

192

# We always set max_size to 32kB over the minimum needed, so that

193

# zlib will give us as much as we really want.

194

# TODO: If this isn't good enough, we could make a loop here,

195

# that keeps expanding the request until we get enough

196

self._content += self._z_content_decompressor.decompress(

197

remaining_decomp, needed_bytes + _ZLIB_DECOMP_WINDOW)

198

if len(self._content) < num_bytes:

199

raise AssertionError('%d bytes wanted, only %d available'

200

% (num_bytes, len(self._content)))

201

if not self._z_content_decompressor.unconsumed_tail:

202

# The stream is finished

203

self._z_content_decompressor = None

183

if not remaining_decomp:

184

raise AssertionError('Nothing left to decompress')

185

needed_bytes = num_bytes - len(self._content)

186

# We always set max_size to 32kB over the minimum needed, so that

187

# zlib will give us as much as we really want.

188

# TODO: If this isn't good enough, we could make a loop here,

189

# that keeps expanding the request until we get enough

190

self._content += self._z_content_decompressor.decompress(

191

remaining_decomp, needed_bytes + _ZLIB_DECOMP_WINDOW)

192

if len(self._content) < num_bytes:

193

raise AssertionError('%d bytes wanted, only %d available'

194

% (num_bytes, len(self._content)))

195

if not self._z_content_decompressor.unconsumed_tail:

196

# The stream is finished

197

self._z_content_decompressor = None

204

198

205

199

def _parse_bytes(self, bytes, pos):

206

200

"""Read the various lengths from the header.

222

216

# XXX: Define some GCCorrupt error ?

223

217

raise AssertionError('Invalid bytes: (%d) != %d + %d' %

224

218

(len(bytes), pos, self._z_content_length))

225

self._z_content = bytes[pos:]

219

self._z_content_chunks = (bytes[pos:],)

220

221

@property

222

def _z_content(self):

223

"""Return z_content_chunks as a simple string.

224

225

Meant only to be used by the test suite.

226

"""

227

if self._z_content_chunks is not None:

228

return ''.join(self._z_content_chunks)

229

return None

226

230

227

231

@classmethod

228

232

def from_bytes(cls, bytes):

284

288

self._content_length = length

285

289

self._content_chunks = content_chunks

286

290

self._content = None

287

self._z_content = None

291

self._z_content_chunks = None

288

292

289

293

def set_content(self, content):

290

294

"""Set the content of this block."""

291

295

self._content_length = len(content)

292

296

self._content = content

293

self._z_content = None

294

295

def _create_z_content_using_lzma(self):

296

if self._content_chunks is not None:

297

self._content = ''.join(self._content_chunks)

298

self._content_chunks = None

299

if self._content is None:

300

raise AssertionError('Nothing to compress')

301

self._z_content = pylzma.compress(self._content)

302

self._z_content_length = len(self._z_content)

303

304

def _create_z_content_from_chunks(self):

297

self._z_content_chunks = None

298

299

def _create_z_content_from_chunks(self, chunks):

305

300

compressor = zlib.compressobj(zlib.Z_DEFAULT_COMPRESSION)

306

compressed_chunks = map(compressor.compress, self._content_chunks)

301

# Peak in this point is 1 fulltext, 1 compressed text, + zlib overhead

302

# (measured peak is maybe 30MB over the above...)

303

compressed_chunks = map(compressor.compress, chunks)

307

304

compressed_chunks.append(compressor.flush())

308

self._z_content = ''.join(compressed_chunks)

309

self._z_content_length = len(self._z_content)

305

# Ignore empty chunks

306

self._z_content_chunks = [c for c in compressed_chunks if c]

307

self._z_content_length = sum(map(len, self._z_content_chunks))

310

308

311

309

def _create_z_content(self):

312

if self._z_content is not None:

313

return

314

if _USE_LZMA:

315

self._create_z_content_using_lzma()

310

if self._z_content_chunks is not None:

316

311

return

317

312

if self._content_chunks is not None:

318

self._create_z_content_from_chunks()

319

return

320

self._z_content = zlib.compress(self._content)

321

self._z_content_length = len(self._z_content)

313

chunks = self._content_chunks

314

else:

315

chunks = (self._content,)

316

self._create_z_content_from_chunks(chunks)

317

318

def to_chunks(self):

319

"""Create the byte stream as a series of 'chunks'"""

320

self._create_z_content()

321

header = self.GCB_HEADER

322

chunks = ['%s%d\n%d\n'

323

% (header, self._z_content_length, self._content_length),

324

]

325

chunks.extend(self._z_content_chunks)

326

total_len = sum(map(len, chunks))

327

return total_len, chunks

322

328

323

329

def to_bytes(self):

324

330

"""Encode the information into a byte stream."""

325

self._create_z_content()

326

if _USE_LZMA:

327

header = self.GCB_LZ_HEADER

328

else:

329

header = self.GCB_HEADER

330

chunks = [header,

331

'%d\n%d\n' % (self._z_content_length, self._content_length),

332

self._z_content,

333

]

331

total_len, chunks = self.to_chunks()

334

332

return ''.join(chunks)

335

333

336

334

def _dump(self, include_text=False):

450

448

# Grab and cache the raw bytes for this entry

451

449

# and break the ref-cycle with _manager since we don't need it

452

450

# anymore

453

self._manager._prepare_for_extract()

451

try:

452

self._manager._prepare_for_extract()

453

except zlib.error as value:

454

raise errors.DecompressCorruption("zlib: " + str(value))

454

455

block = self._manager._block

455

456

self._bytes = block.extract(self.key, self._start, self._end)

456

457

# There are code paths that first extract as fulltext, and then

457

458

# extract as storage_kind (smart fetch). So we don't break the

458

459

# refcycle here, but instead in manager.get_record_stream()

459

# self._manager = None

460

if storage_kind == 'fulltext':

461

return self._bytes

462

else:

468

class _LazyGroupContentManager(object):

469

"""This manages a group of _LazyGroupCompressFactory objects."""

470

471

def __init__(self, block):

471

_max_cut_fraction = 0.75 # We allow a block to be trimmed to 75% of

472

# current size, and still be considered

473

# reusable

474

_full_block_size = 4*1024*1024

475

_full_mixed_block_size = 2*1024*1024

476

_full_enough_block_size = 3*1024*1024 # size at which we won't repack

477

_full_enough_mixed_block_size = 2*768*1024 # 1.5MB

478

479

def __init__(self, block, get_compressor_settings=None):

472

480

self._block = block

473

481

# We need to preserve the ordering

474

482

self._factories = []

475

483

self._last_byte = 0

484

self._get_settings = get_compressor_settings

485

self._compressor_settings = None

486

487

def _get_compressor_settings(self):

488

if self._compressor_settings is not None:

489

return self._compressor_settings

490

settings = None

491

if self._get_settings is not None:

492

settings = self._get_settings()

493

if settings is None:

494

vf = GroupCompressVersionedFiles

495

settings = vf._DEFAULT_COMPRESSOR_SETTINGS

496

self._compressor_settings = settings

497

return self._compressor_settings

476

498

477

499

def add_factory(self, key, parents, start, end):

478

500

if not self._factories:

511

533

new_block.set_content(self._block._content[:last_byte])

512

534

self._block = new_block

513

535

536

def _make_group_compressor(self):

537

return GroupCompressor(self._get_compressor_settings())

538

514

539

def _rebuild_block(self):

515

540

"""Create a new GroupCompressBlock with only the referenced texts."""

516

compressor = GroupCompressor()

541

compressor = self._make_group_compressor()

517

542

tstart = time.time()

518

543

old_length = self._block._content_length

519

544

end_point = 0

531

556

# block? It seems hard to come up with a method that it would

532

557

# expand, since we do full compression again. Perhaps based on a

533

558

# request that ends up poorly ordered?

559

# TODO: If the content would have expanded, then we would want to

560

# handle a case where we need to split the block.

561

# Now that we have a user-tweakable option

562

# (max_bytes_to_index), it is possible that one person set it

563

# to a very low value, causing poor compression.

534

564

delta = time.time() - tstart

535

565

self._block = new_block

536

566

trace.mutter('creating new compressed block on-the-fly in %.3fs'

545

575

# time (self._block._content) is a little expensive.

546

576

self._block._ensure_content(self._last_byte)

547

577

548

def _check_rebuild_block(self):

578

def _check_rebuild_action(self):

549

579

"""Check to see if our block should be repacked."""

550

580

total_bytes_used = 0

551

581

last_byte_used = 0

552

582

for factory in self._factories:

553

583

total_bytes_used += factory._end - factory._start

554

last_byte_used = max(last_byte_used, factory._end)

555

# If we are using most of the bytes from the block, we have nothing

556

# else to check (currently more than 1/2)

584

if last_byte_used < factory._end:

585

last_byte_used = factory._end

586

# If we are using more than half of the bytes from the block, we have

587

# nothing else to check

557

588

if total_bytes_used * 2 >= self._block._content_length:

558

return

559

# Can we just strip off the trailing bytes? If we are going to be

560

# transmitting more than 50% of the front of the content, go ahead

589

return None, last_byte_used, total_bytes_used

590

# We are using less than 50% of the content. Is the content we are

591

# using at the beginning of the block? If so, we can just trim the

592

# tail, rather than rebuilding from scratch.

561

593

if total_bytes_used * 2 > last_byte_used:

562

self._trim_block(last_byte_used)

563

return

594

return 'trim', last_byte_used, total_bytes_used

564

595

565

596

# We are using a small amount of the data, and it isn't just packed

566

597

# nicely at the front, so rebuild the content.

573

604

# expanding many deltas into fulltexts, as well.

574

605

# If we build a cheap enough 'strip', then we could try a strip,

575

606

# if that expands the content, we then rebuild.

576

self._rebuild_block()

607

return 'rebuild', last_byte_used, total_bytes_used

608

609

def check_is_well_utilized(self):
    """Is the current block considered 'well utilized'?

    This heuristic asks whether the block looks like a fully developed
    group, rather than just a loose collection of data.

    :return: True when the block is judged full enough to be reused as-is,
        False otherwise.
    """
    if len(self._factories) == 1:
        # A single-entry block could be improved by combining it with other
        # groups, so don't look any deeper. Even groups larger than the max
        # size could compress well with adjacent versions of the same thing.
        return False
    # Only the byte total is needed here; the suggested action and the
    # last-byte offset are ignored.
    _, _, bytes_in_use = self._check_rebuild_action()
    content_length = self._block._content_length
    if bytes_in_use < content_length * self._max_cut_fraction:
        # The block wants to trim itself small enough that we treat it as
        # under-utilized.
        return False
    # TODO: This code is meant to be the twin of _insert_record_stream's
    #       'start_new_block' logic. It would probably be better to factor
    #       that logic out into a shared location so the two stay together.
    # A block is assumed to be properly utilized whenever it is >75% of the
    # size of a 'full' block. In normal operation a block is considered full
    # at 4MB of same-file content, so anything >3MB is 'full enough'.
    # The exception is large-object content (a single file >4MB, etc.), where
    # a block may grow to 2 x largest_content and so may be under-utilized.
    # Since this is 'pack-on-the-fly' it is probably reasonable not to repack
    # large blobs here. Because all 1-item blocks return False above, they
    # will be repacked; the treatment of large objects may be worth
    # revisiting in the future.
    if content_length >= self._full_enough_block_size:
        return True
    # A smaller block may still count as 'full' when it holds mixed content
    # (the current rule is 2MB of mixed content). Mixed means some factory's
    # key prefix differs from the first factory's prefix.
    first_prefix = None
    is_mixed = False
    for factory in self._factories:
        this_prefix = factory.key[:-1]
        if first_prefix is None:
            first_prefix = this_prefix
            continue
        if this_prefix != first_prefix:
            is_mixed = True
            break
    if is_mixed and content_length >= self._full_enough_mixed_block_size:
        return True
    # The content failed both the mixed check and the single-content check,
    # so it is not fully utilized.
    # TODO: one other constraint is not checked: that the entries in the
    #       block are in the appropriate order. Entries inserted in exactly
    #       reverse groupcompress order would still be accepted. That case
    #       is assumed to be rare, since fetches should always happen in
    #       'groupcompress' order.
    return False

670

671

def _check_rebuild_block(self):

672

action, last_byte_used, total_bytes_used = self._check_rebuild_action()

673

if action is None:

674

return

675

if action == 'trim':

676

self._trim_block(last_byte_used)

677

elif action == 'rebuild':

678

self._rebuild_block()

679

else:

680

raise ValueError('unknown rebuild action: %r' % (action,))

577

681

578

682

def _wire_bytes(self):

579

683

"""Return a byte stream suitable for transmitting over the wire."""

613

717

z_header_bytes = zlib.compress(header_bytes)

614

718

del header_bytes

615

719

z_header_bytes_len = len(z_header_bytes)

616

block_bytes = self._block.to_bytes()

720

block_bytes_len, block_chunks = self._block.to_chunks()

617

721

lines.append('%d\n%d\n%d\n' % (z_header_bytes_len, header_bytes_len,

618

len(block_bytes)))

722

block_bytes_len))

619

723

lines.append(z_header_bytes)

620

lines.append(block_bytes)

621

del z_header_bytes, block_bytes

724

lines.extend(block_chunks)

725

del z_header_bytes, block_chunks

726

# TODO: This is a point where we will double the memory consumption. To

727

# avoid this, we probably have to switch to a 'chunked' api

622

728

return ''.join(lines)

623

729

624

730

@classmethod

625

731

def from_bytes(cls, bytes):

626

732

# TODO: This does extra string copying, probably better to do it a

627

# different way

733

# different way. At a minimum this creates 2 copies of the

734

# compressed content

628

735

(storage_kind, z_header_len, header_len,

629

736

block_len, rest) = bytes.split('\n', 4)

630

737

del bytes

682

789

683

790

class _CommonGroupCompressor(object):

684

791

685

def __init__(self):

792

def __init__(self, settings=None):

686

793

"""Create a GroupCompressor."""

687

794

self.chunks = []

688

795

self._last = None

691

798

self.labels_deltas = {}

692

799

self._delta_index = None # Set by the children

693

800

self._block = GroupCompressBlock()

801

if settings is None:

802

self._settings = {}

803

else:

804

self._settings = settings

694

805

695

806

def compress(self, key, bytes, expected_sha, nostore_sha=None, soft=False):

696

807

"""Compress lines with label key.

788

899

789

900

After calling this, the compressor should no longer be used

790

901

"""

791

# TODO: this causes us to 'bloat' to 2x the size of content in the

792

# group. This has an impact for 'commit' of large objects.

793

# One possibility is to use self._content_chunks, and be lazy and

794

# only fill out self._content as a full string when we actually

795

# need it. That would at least drop the peak memory consumption

796

# for 'commit' down to ~1x the size of the largest file, at a

797

# cost of increased complexity within this code. 2x is still <<

798

# 3x the size of the largest file, so we are doing ok.

799

902

self._block.set_chunked_content(self.chunks, self.endpoint)

800

903

self.chunks = None

801

904

self._delta_index = None

819

922

820

923

class PythonGroupCompressor(_CommonGroupCompressor):

821

924

822

def __init__(self):

925

def __init__(self, settings=None):

823

926

"""Create a GroupCompressor.

824

927

825

928

Used only if the pyrex version is not available.

826

929

"""

827

super(PythonGroupCompressor, self).__init__()

930

super(PythonGroupCompressor, self).__init__(settings)

828

931

self._delta_index = LinesDeltaIndex([])

829

932

# The actual content is managed by LinesDeltaIndex

830

933

self.chunks = self._delta_index.lines

867

970

868

971

It contains code very similar to SequenceMatcher because of having a similar

869

972

task. However some key differences apply:

870

- there is no junk, we want a minimal edit not a human readable diff.

871

- we don't filter very common lines (because we don't know where a good

872

range will start, and after the first text we want to be emitting minmal

873

edits only.

874

- we chain the left side, not the right side

875

- we incrementally update the adjacency matrix as new lines are provided.

876

- we look for matches in all of the left side, so the routine which does

877

the analagous task of find_longest_match does not need to filter on the

878

left side.

973

974

* there is no junk, we want a minimal edit not a human readable diff.

975

* we don't filter very common lines (because we don't know where a good

976

range will start, and after the first text we want to be emitting minimal

977

edits only.

978

* we chain the left side, not the right side

979

* we incrementally update the adjacency matrix as new lines are provided.

980

* we look for matches in all of the left side, so the routine which does

981

the analogous task of find_longest_match does not need to filter on the

982

left side.

879

983

"""

880

984

881

def __init__(self):

882

super(PyrexGroupCompressor, self).__init__()

883

self._delta_index = DeltaIndex()

985

def __init__(self, settings=None):

986

super(PyrexGroupCompressor, self).__init__(settings)

987

max_bytes_to_index = self._settings.get('max_bytes_to_index', 0)

988

self._delta_index = DeltaIndex(max_bytes_to_index=max_bytes_to_index)

884

989

885

990

def _compress(self, key, bytes, max_delta_size, soft=False):

886

991

"""see _CommonGroupCompressor._compress"""

961

1066

index = _GCGraphIndex(graph_index, lambda:True, parents=parents,

962

1067

add_callback=graph_index.add_nodes,

963

1068

inconsistency_fatal=inconsistency_fatal)

964

access = knit._DirectPackAccess({})

1069

access = pack_repo._DirectPackAccess({})

965

1070

access.set_writer(writer, graph_index, (transport, 'newpack'))

966

1071

result = GroupCompressVersionedFiles(index, access, delta)

967

1072

result.stream = stream

975

1080

versioned_files.stream.close()

976

1081

977

1082

978

class GroupCompressVersionedFiles(VersionedFiles):

1083

class _BatchingBlockFetcher(object):

1084

"""Fetch group compress blocks in batches.

1085

1086

:ivar total_bytes: int of expected number of bytes needed to fetch the

1087

currently pending batch.

1088

"""

1089

1090

def __init__(self, gcvf, locations, get_compressor_settings=None):

1091

self.gcvf = gcvf

1092

self.locations = locations

1093

self.keys = []

1094

self.batch_memos = {}

1095

self.memos_to_get = []

1096

self.total_bytes = 0

1097

self.last_read_memo = None

1098

self.manager = None

1099

self._get_compressor_settings = get_compressor_settings

1100

1101

def add_key(self, key):

1102

"""Add another to key to fetch.

1103

1104

:return: The estimated number of bytes needed to fetch the batch so

1105

far.

1106

"""

1107

self.keys.append(key)

1108

index_memo, _, _, _ = self.locations[key]

1109

read_memo = index_memo[0:3]

1110

# Three possibilities for this read_memo:

1111

# - it's already part of this batch; or

1112

# - it's not yet part of this batch, but is already cached; or

1113

# - it's not yet part of this batch and will need to be fetched.

1114

if read_memo in self.batch_memos:

1115

# This read memo is already in this batch.

1116

return self.total_bytes

1117

try:

1118

cached_block = self.gcvf._group_cache[read_memo]

1119

except KeyError:

1120

# This read memo is new to this batch, and the data isn't cached

1121

# either.

1122

self.batch_memos[read_memo] = None

1123

self.memos_to_get.append(read_memo)

1124

byte_length = read_memo[2]

1125

self.total_bytes += byte_length

1126

else:

1127

# This read memo is new to this batch, but cached.

1128

# Keep a reference to the cached block in batch_memos because it's

1129

# certain that we'll use it when this batch is processed, but

1130

# there's a risk that it would fall out of _group_cache between now

1131

# and then.

1132

self.batch_memos[read_memo] = cached_block

1133

return self.total_bytes

1134

1135

def _flush_manager(self):

1136

if self.manager is not None:

1137

for factory in self.manager.get_record_stream():

1138

yield factory

1139

self.manager = None

1140

self.last_read_memo = None

1141

1142

def yield_factories(self, full_flush=False):

1143

"""Yield factories for keys added since the last yield. They will be

1144

returned in the order they were added via add_key.

1145

1146

:param full_flush: by default, some results may not be returned in case

1147

they can be part of the next batch. If full_flush is True, then

1148

all results are returned.

1149

"""

1150

if self.manager is None and not self.keys:

1151

return

1152

# Fetch all memos in this batch.

1153

blocks = self.gcvf._get_blocks(self.memos_to_get)

1154

# Turn blocks into factories and yield them.

1155

memos_to_get_stack = list(self.memos_to_get)

1156

memos_to_get_stack.reverse()

1157

for key in self.keys:

1158

index_memo, _, parents, _ = self.locations[key]

1159

read_memo = index_memo[:3]

1160

if self.last_read_memo != read_memo:

1161

# We are starting a new block. If we have a

1162

# manager, we have found everything that fits for

1163

# now, so yield records

1164

for factory in self._flush_manager():

1165

yield factory

1166

# Now start a new manager.

1167

if memos_to_get_stack and memos_to_get_stack[-1] == read_memo:

1168

# The next block from _get_blocks will be the block we

1169

# need.

1170

block_read_memo, block = blocks.next()

1171

if block_read_memo != read_memo:

1172

raise AssertionError(

1173

"block_read_memo out of sync with read_memo"

1174

"(%r != %r)" % (block_read_memo, read_memo))

1175

self.batch_memos[read_memo] = block

1176

memos_to_get_stack.pop()

1177

else:

1178

block = self.batch_memos[read_memo]

1179

self.manager = _LazyGroupContentManager(block,

1180

get_compressor_settings=self._get_compressor_settings)

1181

self.last_read_memo = read_memo

1182

start, end = index_memo[3:5]

1183

self.manager.add_factory(key, parents, start, end)

1184

if full_flush:

1185

for factory in self._flush_manager():

1186

yield factory

1187

del self.keys[:]

1188

self.batch_memos.clear()

1189

del self.memos_to_get[:]

1190

self.total_bytes = 0

1191

1192

1193

class GroupCompressVersionedFiles(VersionedFilesWithFallbacks):

979

1194

"""A group-compress based VersionedFiles implementation."""

980

1195

981

def __init__(self, index, access, delta=True):

1196

# This controls how the GroupCompress DeltaIndex works. Basically, we

1197

# compute hash pointers into the source blocks (so hash(text) => text).

1198

# However each of these references costs some memory in trade against a

1199

# more accurate match result. For very large files, they either are

1200

# pre-compressed and change in bulk whenever they change, or change in just

1201

# local blocks. Either way, 'improved resolution' is not very helpful,

1202

# versus running out of memory trying to track everything. The default max

1203

# gives 100% sampling of a 1MB file.

1204

_DEFAULT_MAX_BYTES_TO_INDEX = 1024 * 1024

1205

_DEFAULT_COMPRESSOR_SETTINGS = {'max_bytes_to_index':

1206

_DEFAULT_MAX_BYTES_TO_INDEX}

1207

1208

def __init__(self, index, access, delta=True, _unadded_refs=None,

1209

_group_cache=None):

982

1210

"""Create a GroupCompressVersionedFiles object.

983

1211

984

1212

:param index: The index object storing access and graph data.

985

1213

:param access: The access object storing raw data.

986

1214

:param delta: Whether to delta compress or just entropy compress.

1215

:param _unadded_refs: private parameter, don't use.

1216

:param _group_cache: private parameter, don't use.

987

1217

"""

988

1218

self._index = index

989

1219

self._access = access

990

1220

self._delta = delta

991

self._unadded_refs = {}

992

self._group_cache = LRUSizeCache(max_size=50*1024*1024)

993

self._fallback_vfs = []

1221

if _unadded_refs is None:

1222

_unadded_refs = {}

1223

self._unadded_refs = _unadded_refs

1224

if _group_cache is None:

1225

_group_cache = LRUSizeCache(max_size=50*1024*1024)

1226

self._group_cache = _group_cache

1227

self._immediate_fallback_vfs = []

1228

self._max_bytes_to_index = None

1229

1230

def without_fallbacks(self):
    """Return a clone of this object without any fallbacks configured.

    The clone uses the same index, access object, delta flag and group
    cache, and receives its own copy of the unadded-refs dict.
    """
    unadded_refs_copy = dict(self._unadded_refs)
    return GroupCompressVersionedFiles(
        self._index, self._access, self._delta,
        _unadded_refs=unadded_refs_copy,
        _group_cache=self._group_cache)

994

1235

995

1236

def add_lines(self, key, parents, lines, parent_texts=None,

996

1237

left_matching_blocks=None, nostore_sha=None, random_id=False,

1000

1241

:param key: The key tuple of the text to add.

1001

1242

:param parents: The parents key tuples of the text to add.

1002

1243

:param lines: A list of lines. Each line must be a bytestring. And all

1003

of them except the last must be terminated with \n and contain no

1004

other \n's. The last line may either contain no \n's or a single

1005

terminating \n. If the lines list does meet this constraint the add

1006

routine may error or may succeed - but you will be unable to read

1007

the data back accurately. (Checking the lines have been split

1244

of them except the last must be terminated with \\n and contain no

1245

other \\n's. The last line may either contain no \\n's or a single

1246

terminating \\n. If the lines list does not meet this constraint the

1247

add routine may error or may succeed - but you will be unable to

1248

read the data back accurately. (Checking the lines have been split

1008

1249

correctly is expensive and extremely unlikely to catch bugs so it

1009

1250

is not done at runtime unless check_content is True.)

1010

1251

:param parent_texts: An optional dictionary containing the opaque

1065

1306

1066

1307

:param a_versioned_files: A VersionedFiles object.

1067

1308

"""

1068

self._fallback_vfs.append(a_versioned_files)

1309

self._immediate_fallback_vfs.append(a_versioned_files)

1069

1310

1070

1311

def annotate(self, key):

1071

1312

"""See VersionedFiles.annotate."""

1075

1316

def get_annotator(self):

1076

1317

return annotate.Annotator(self)

1077

1318

1078

def check(self, progress_bar=None):

1319

def check(self, progress_bar=None, keys=None):

1079

1320

"""See VersionedFiles.check()."""

1080

keys = self.keys()

1081

for record in self.get_record_stream(keys, 'unordered', True):

1082

record.get_bytes_as('fulltext')

1321

if keys is None:

1322

keys = self.keys()

1323

for record in self.get_record_stream(keys, 'unordered', True):

1324

record.get_bytes_as('fulltext')

1325

else:

1326

return self.get_record_stream(keys, 'unordered', True)

1327

1328

def clear_cache(self):
    """See VersionedFiles.clear_cache()"""
    # Drop cached blocks first, then the caches held by the index.
    self._group_cache.clear()
    index = self._index
    index._graph_index.clear_cache()
    index._int_cache.clear()

1083

1333

1084

1334

def _check_add(self, key, lines, random_id, check_content):

1085

1335

"""check that version_id and lines are safe to add."""

1116

1366

and so on.

1117

1367

"""

1118

1368

result = {}

1119

sources = [self._index] + self._fallback_vfs

1369

sources = [self._index] + self._immediate_fallback_vfs

1120

1370

source_results = []

1121

1371

missing = set(keys)

1122

1372

for source in sources:

1128

1378

missing.difference_update(set(new_result))

1129

1379

return result, source_results

1130

1380

1131

def _get_block(self, index_memo):

1132

read_memo = index_memo[0:3]

1133

# get the group:

1134

try:

1135

block = self._group_cache[read_memo]

1136

except KeyError:

1137

# read the group

1138

zdata = self._access.get_raw_records([read_memo]).next()

1139

# decompress - whole thing - this is not a bug, as it

1140

# permits caching. We might want to store the partially

1141

# decompresed group and decompress object, so that recent

1142

# texts are not penalised by big groups.

1143

block = GroupCompressBlock.from_bytes(zdata)

1144

self._group_cache[read_memo] = block

1145

# cheapo debugging:

1146

# print len(zdata), len(plain)

1147

# parse - requires split_lines, better to have byte offsets

1148

# here (but not by much - we only split the region for the

1149

# recipe, and we often want to end up with lines anyway.

1150

return block

1381

def _get_blocks(self, read_memos):

1382

"""Get GroupCompressBlocks for the given read_memos.

1383

1384

:returns: a series of (read_memo, block) pairs, in the order they were

1385

originally passed.

1386

"""

1387

cached = {}

1388

for read_memo in read_memos:

1389

try:

1390

block = self._group_cache[read_memo]

1391

except KeyError:

1392

pass

1393

else:

1394

cached[read_memo] = block

1395

not_cached = []

1396

not_cached_seen = set()

1397

for read_memo in read_memos:

1398

if read_memo in cached:

1399

# Don't fetch what we already have

1400

continue

1401

if read_memo in not_cached_seen:

1402

# Don't try to fetch the same data twice

1403

continue

1404

not_cached.append(read_memo)

1405

not_cached_seen.add(read_memo)

1406

raw_records = self._access.get_raw_records(not_cached)

1407

for read_memo in read_memos:

1408

try:

1409

yield read_memo, cached[read_memo]

1410

except KeyError:

1411

# Read the block, and cache it.

1412

zdata = raw_records.next()

1413

block = GroupCompressBlock.from_bytes(zdata)

1414

self._group_cache[read_memo] = block

1415

cached[read_memo] = block

1416

yield read_memo, block

1151

1417

1152

1418

def get_missing_compression_parent_keys(self):

1153

1419

"""Return the keys of missing compression parents.

1207

1473

parent_map = {}

1208

1474

key_to_source_map = {}

1209

1475

source_results = []

1210

for source in self._fallback_vfs:

1476

for source in self._immediate_fallback_vfs:

1211

1477

if not missing:

1212

1478

break

1213

1479

source_parents = source.get_parent_map(missing)

1223

1489

1224

1490

The returned objects should be in the order defined by 'ordering',

1225

1491

which can weave between different sources.

1492

1226

1493

:param ordering: Must be one of 'topological' or 'groupcompress'

1227

1494

:return: List of [(source, [keys])] tuples, such that all keys are in

1228

1495

the defined order, regardless of source.

1229

1496

"""

1230

1497

if ordering == 'topological':

1231

present_keys = topo_sort(parent_map)

1498

present_keys = tsort.topo_sort(parent_map)

1232

1499

else:

1233

1500

# ordering == 'groupcompress'

1234

1501

# XXX: This only optimizes for the target ordering. We may need

1319

1586

unadded_keys, source_result)

1320

1587

for key in missing:

1321

1588

yield AbsentContentFactory(key)

1322

manager = None

1323

last_read_memo = None

1324

# TODO: This works fairly well at batching up existing groups into a

1325

# streamable format, and possibly allowing for taking one big

1326

# group and splitting it when it isn't fully utilized.

1327

# However, it doesn't allow us to find under-utilized groups and

1328

# combine them into a bigger group on the fly.

1329

# (Consider the issue with how chk_map inserts texts

1330

# one-at-a-time.) This could be done at insert_record_stream()

1331

# time, but it probably would decrease the number of

1332

# bytes-on-the-wire for fetch.

1589

# Batch up as many keys as we can until either:

1590

# - we encounter an unadded ref, or

1591

# - we run out of keys, or

1592

# - the total bytes to retrieve for this batch > BATCH_SIZE

1593

batcher = _BatchingBlockFetcher(self, locations,

1594

get_compressor_settings=self._get_compressor_settings)

1333

1595

for source, keys in source_keys:

1334

1596

if source is self:

1335

1597

for key in keys:

1336

1598

if key in self._unadded_refs:

1337

if manager is not None:

1338

for factory in manager.get_record_stream():

1339

yield factory

1340

last_read_memo = manager = None

1599

# Flush batch, then yield unadded ref from

1600

# self._compressor.

1601

for factory in batcher.yield_factories(full_flush=True):

1602

yield factory

1341

1603

bytes, sha1 = self._compressor.extract(key)

1342

1604

parents = self._unadded_refs[key]

1343

1605

yield FulltextContentFactory(key, parents, sha1, bytes)

1344

else:

1345

index_memo, _, parents, (method, _) = locations[key]

1346

read_memo = index_memo[0:3]

1347

if last_read_memo != read_memo:

1348

# We are starting a new block. If we have a

1349

# manager, we have found everything that fits for

1350

# now, so yield records

1351

if manager is not None:

1352

for factory in manager.get_record_stream():

1353

yield factory

1354

# Now start a new manager

1355

block = self._get_block(index_memo)

1356

manager = _LazyGroupContentManager(block)

1357

last_read_memo = read_memo

1358

start, end = index_memo[3:5]

1359

manager.add_factory(key, parents, start, end)

1606

continue

1607

if batcher.add_key(key) > BATCH_SIZE:

1608

# Ok, this batch is big enough. Yield some results.

1609

for factory in batcher.yield_factories():

1610

yield factory

1360

1611

else:

1361

if manager is not None:

1362

for factory in manager.get_record_stream():

1363

yield factory

1364

last_read_memo = manager = None

1612

for factory in batcher.yield_factories(full_flush=True):

1613

yield factory

1365

1614

for record in source.get_record_stream(keys, ordering,

1366

1615

include_delta_closure):

1367

1616

yield record

1368

if manager is not None:

1369

for factory in manager.get_record_stream():

1370

yield factory

1617

for factory in batcher.yield_factories(full_flush=True):

1618

yield factory

1371

1619

1372

1620

def get_sha1s(self, keys):

1373

1621

"""See VersionedFiles.get_sha1s()."""

1395

1643

for _ in self._insert_record_stream(stream, random_id=False):

1396

1644

pass

1397

1645

1646

def _get_compressor_settings(self):

1647

if self._max_bytes_to_index is None:

1648

# TODO: VersionedFiles don't know about their containing

1649

# repository, so they don't have much of an idea about their

1650

# location. So for now, this is only a global option.

1651

c = config.GlobalConfig()

1652

val = c.get_user_option('bzr.groupcompress.max_bytes_to_index')

1653

if val is not None:

1654

try:

1655

val = int(val)

1656

except ValueError, e:

1657

trace.warning('Value for '

1658

'"bzr.groupcompress.max_bytes_to_index"'

1659

' %r is not an integer'

1660

% (val,))

1661

val = None

1662

if val is None:

1663

val = self._DEFAULT_MAX_BYTES_TO_INDEX

1664

self._max_bytes_to_index = val

1665

return {'max_bytes_to_index': self._max_bytes_to_index}

1666

1667

def _make_group_compressor(self):
    """Build a GroupCompressor using this object's compressor settings."""
    compressor_settings = self._get_compressor_settings()
    return GroupCompressor(compressor_settings)

1669

1398

1670

def _insert_record_stream(self, stream, random_id=False, nostore_sha=None,

1399

1671

reuse_blocks=True):

1400

1672

"""Internal core to insert a record stream into this container.

1423

1695

return adapter

1424

1696

# This will go up to fulltexts for gc to gc fetching, which isn't

1425

1697

# ideal.

1426

self._compressor = GroupCompressor()

1698

self._compressor = self._make_group_compressor()

1427

1699

self._unadded_refs = {}

1428

1700

keys_to_add = []

1429

1701

def flush():

1430

bytes = self._compressor.flush().to_bytes()

1702

bytes_len, chunks = self._compressor.flush().to_chunks()

1703

self._compressor = self._make_group_compressor()

1704

# Note: At this point we still have 1 copy of the fulltext (in

1705

# record and the var 'bytes'), and this generates 2 copies of

1706

# the compressed text (one for bytes, one in chunks)

1707

# TODO: Push 'chunks' down into the _access api, so that we don't

1708

# have to double compressed memory here

1709

# TODO: Figure out how to indicate that we would be happy to free

1710

# the fulltext content at this point. Note that sometimes we

1711

# will want it later (streaming CHK pages), but most of the

1712

# time we won't (everything else)

1713

bytes = ''.join(chunks)

1714

del chunks

1431

1715

index, start, length = self._access.add_raw_records(

1432

1716

[(None, len(bytes))], bytes)[0]

1433

1717

nodes = []

1436

1720

self._index.add_records(nodes, random_id=random_id)

1437

1721

self._unadded_refs = {}

1438

1722

del keys_to_add[:]

1439

self._compressor = GroupCompressor()

1440

1723

1441

1724

last_prefix = None

1442

1725

max_fulltext_len = 0

1446

1729

block_length = None

1447

1730

# XXX: TODO: remove this, it is just for safety checking for now

1448

1731

inserted_keys = set()

1732

reuse_this_block = reuse_blocks

1449

1733

for record in stream:

1450

1734

# Raise an error when a record is missing.

1451

1735

if record.storage_kind == 'absent':

1452

1736

raise errors.RevisionNotPresent(record.key, self)

1453

1737

if random_id:

1454

1738

if record.key in inserted_keys:

1455

trace.note('Insert claimed random_id=True,'

1456

' but then inserted %r two times', record.key)

1739

trace.note(gettext('Insert claimed random_id=True,'

1740

' but then inserted %r two times'), record.key)

1457

1741

continue

1458

1742

inserted_keys.add(record.key)

1459

1743

if reuse_blocks:

1460

1744

# If the reuse_blocks flag is set, check to see if we can just

1461

1745

# copy a groupcompress block as-is.

1746

# We only check on the first record (groupcompress-block) not

1747

# on all of the (groupcompress-block-ref) entries.

1748

# The reuse_this_block flag is then kept for as long as

1749

if record.storage_kind == 'groupcompress-block':

1750

# Check to see if we really want to re-use this block

1751

insert_manager = record._manager

1752

reuse_this_block = insert_manager.check_is_well_utilized()

1753

else:

1754

reuse_this_block = False

1755

if reuse_this_block:

1756

# We still want to reuse this block

1462

1757

if record.storage_kind == 'groupcompress-block':

1463

1758

# Insert the raw block into the target repo

1464

1759

insert_manager = record._manager

1465

insert_manager._check_rebuild_block()

1466

1760

bytes = record._manager._block.to_bytes()

1467

1761

_, start, length = self._access.add_raw_records(

1468

1762

[(None, len(bytes))], bytes)[0]

1473

1767

'groupcompress-block-ref'):

1474

1768

if insert_manager is None:

1475

1769

raise AssertionError('No insert_manager set')

1770

if insert_manager is not record._manager:

1771

raise AssertionError('insert_manager does not match'

1772

' the current record, we cannot be positive'

1773

' that the appropriate content was inserted.'

1774

)

1476

1775

value = "%d %d %d %d" % (block_start, block_length,

1477

1776

record._start, record._end)

1478

1777

nodes = [(record.key, value, (record.parents,))]

1528

1827

key = record.key

1529

1828

self._unadded_refs[key] = record.parents

1530

1829

yield found_sha1

1531

keys_to_add.append((key, '%d %d' % (start_point, end_point),

1532

(record.parents,)))

1830

as_st = static_tuple.StaticTuple.from_sequence

1831

if record.parents is not None:

1832

parents = as_st([as_st(p) for p in record.parents])

1833

else:

1834

parents = None

1835

refs = static_tuple.StaticTuple(parents)

1836

keys_to_add.append((key, '%d %d' % (start_point, end_point), refs))

1533

1837

if len(keys_to_add):

1534

1838

flush()

1535

1839

self._compressor = None

1578

1882

"""See VersionedFiles.keys."""

1579

1883

if 'evil' in debug.debug_flags:

1580

1884

trace.mutter_callsite(2, "keys scales with size of history")

1581

sources = [self._index] + self._fallback_vfs

1885

sources = [self._index] + self._immediate_fallback_vfs

1582

1886

result = set()

1583

1887

for source in sources:

1584

1888

result.update(source.keys())

1585

1889

return result

1586

1890

1587

1891

1892

class _GCBuildDetails(object):

1893

"""A blob of data about the build details.

1894

1895

This stores the minimal data, which then allows compatibility with the old

1896

api, without taking as much memory.

1897

"""

1898

1899

__slots__ = ('_index', '_group_start', '_group_end', '_basis_end',

1900

'_delta_end', '_parents')

1901

1902

method = 'group'

1903

compression_parent = None

1904

1905

def __init__(self, parents, position_info):

1906

self._parents = parents

1907

(self._index, self._group_start, self._group_end, self._basis_end,

1908

self._delta_end) = position_info

1909

1910

def __repr__(self):

1911

return '%s(%s, %s)' % (self.__class__.__name__,

1912

self.index_memo, self._parents)

1913

1914

@property

1915

def index_memo(self):

1916

return (self._index, self._group_start, self._group_end,

1917

self._basis_end, self._delta_end)

1918

1919

@property

1920

def record_details(self):

1921

return static_tuple.StaticTuple(self.method, None)

1922

1923

def __getitem__(self, offset):

1924

"""Compatibility thunk to act like a tuple."""

1925

if offset == 0:

1926

return self.index_memo

1927

elif offset == 1:

1928

return self.compression_parent # Always None

1929

elif offset == 2:

1930

return self._parents

1931

elif offset == 3:

1932

return self.record_details

1933

else:

1934

raise IndexError('offset out of range')

1935

1936

def __len__(self):

1937

return 4

1938

1939

1588

1940

class _GCGraphIndex(object):

1589

1941

"""Mapper from GroupCompressVersionedFiles needs into GraphIndex storage."""

1590

1942

1591

1943

def __init__(self, graph_index, is_locked, parents=True,

1592

1944

add_callback=None, track_external_parent_refs=False,

1593

inconsistency_fatal=True):

1945

inconsistency_fatal=True, track_new_keys=False):

1594

1946

"""Construct a _GCGraphIndex on a graph_index.

1595

1947

1596

1948

:param graph_index: An implementation of bzrlib.index.GraphIndex.

1615

1967

self.has_graph = parents

1616

1968

self._is_locked = is_locked

1617

1969

self._inconsistency_fatal = inconsistency_fatal

1970

# GroupCompress records tend to have the same 'group' start + offset

1971

# repeated over and over, this creates a surplus of ints

1972

self._int_cache = {}

1618

1973

if track_external_parent_refs:

1619

self._key_dependencies = knit._KeyRefs()

1974

self._key_dependencies = _KeyRefs(

1975

track_new_keys=track_new_keys)

1620

1976

else:

1621

1977

self._key_dependencies = None

1622

1978

1655

2011

if not random_id:

1656

2012

present_nodes = self._get_entries(keys)

1657

2013

for (index, key, value, node_refs) in present_nodes:

1658

if node_refs != keys[key][1]:

1659

details = '%s %s %s' % (key, (value, node_refs), keys[key])

2014

# Sometimes these are passed as a list rather than a tuple

2015

node_refs = static_tuple.as_tuples(node_refs)

2016

passed = static_tuple.as_tuples(keys[key])

2017

if node_refs != passed[1]:

2018

details = '%s %s %s' % (key, (value, node_refs), passed)

1660

2019

if self._inconsistency_fatal:

1661

2020

raise errors.KnitCorrupt(self, "inconsistent details"

1662

2021

" in add_records: %s" %

1676

2035

result.append((key, value))

1677

2036

records = result

1678

2037

key_dependencies = self._key_dependencies

1679

if key_dependencies is not None and self._parents:

1680

for key, value, refs in records:

1681

parents = refs[0]

1682

key_dependencies.add_references(key, parents)

2038

if key_dependencies is not None:

2039

if self._parents:

2040

for key, value, refs in records:

2041

parents = refs[0]

2042

key_dependencies.add_references(key, parents)

2043

else:

2044

for key, value, refs in records:

2045

new_keys.add_key(key)

1683

2046

self._add_callback(records)

1684

2047

1685

2048

def _check_read(self):

1716

2079

if missing_keys:

1717

2080

raise errors.RevisionNotPresent(missing_keys.pop(), self)

1718

2081

2082

def find_ancestry(self, keys):
    """See CombinedGraphIndex.find_ancestry"""
    # NOTE(review): the literal 0 presumably selects the parents reference
    # list (other code here reads parents from entry[3][0]) -- confirm
    # against the graph index API.
    graph_index = self._graph_index
    return graph_index.find_ancestry(keys, 0)

2085

1719

2086

def get_parent_map(self, keys):

1720

2087

"""Get a map of the parents of keys.

1721

2088

1738

2105

"""Return the keys of missing parents."""

1739

2106

# Copied from _KnitGraphIndex.get_missing_parents

1740

2107

# We may have false positives, so filter those out.

1741

self._key_dependencies.add_keys(

2108

self._key_dependencies.satisfy_refs_for_keys(

1742

2109

self.get_parent_map(self._key_dependencies.get_unsatisfied_refs()))

1743

2110

return frozenset(self._key_dependencies.get_unsatisfied_refs())

1744

2111

1750

2117

:param keys: An iterable of keys.

1751

2118

:return: A dict of key:

1752

2119

(index_memo, compression_parent, parents, record_details).

1753

index_memo

1754

opaque structure to pass to read_records to extract the raw

1755

data

1756

compression_parent

1757

Content that this record is built upon, may be None

1758

parents

1759

Logical parents of this node

1760

record_details

1761

extra information about the content which needs to be passed to

1762

Factory.parse_record

2120

2121

* index_memo: opaque structure to pass to read_records to extract

2122

the raw data

2123

* compression_parent: Content that this record is built upon, may

2124

be None

2125

* parents: Logical parents of this node

2126

* record_details: extra information about the content which needs

2127

to be passed to Factory.parse_record

1763

2128

"""

1764

2129

self._check_read()

1765

2130

result = {}

1770

2135

parents = None

1771

2136

else:

1772

2137

parents = entry[3][0]

1773

method = 'group'

1774

result[key] = (self._node_to_position(entry),

1775

None, parents, (method, None))

2138

details = _GCBuildDetails(parents, self._node_to_position(entry))

2139

result[key] = details

1776

2140

return result

1777

2141

1778

2142

def keys(self):

1787

2151

"""Convert an index value to position details."""

1788

2152

bits = node[2].split(' ')

1789

2153

# It would be nice not to read the entire gzip.

2154

# start and stop are put into _int_cache because they are very common.

2155

# They define the 'group' that an entry is in, and many groups can have

2156

# thousands of objects.

2157

# Branching Launchpad, for example, saves ~600k integers, at 12 bytes

2158

# each, or about 7MB. Note that it might be even more when you consider

2159

# how PyInt is allocated in separate slabs. And you can't return a slab

2160

# to the OS if even 1 int on it is in use. Note though that Python uses

2161

# a LIFO when re-using PyInt slots, which might cause more

2162

# fragmentation.

1790

2163

start = int(bits[0])

2164

start = self._int_cache.setdefault(start, start)

1791

2165

stop = int(bits[1])

2166

stop = self._int_cache.setdefault(stop, stop)

1792

2167

basis_end = int(bits[2])

1793

2168

delta_end = int(bits[3])

1794

return node[0], start, stop, basis_end, delta_end

2169

# We can't use StaticTuple here, because node[0] is a BTreeGraphIndex

2170

# instance...

2171

return (node[0], start, stop, basis_end, delta_end)

1795

2172

1796

2173

def scan_unvalidated_index(self, graph_index):
    """Inform this _GCGraphIndex that there is an unvalidated index.

    This allows this _GCGraphIndex to keep track of any missing
    compression parents we may want to have filled in to make those
    indices valid.  It also allows _GCGraphIndex to track any new keys.

    :param graph_index: A GraphIndex
    """
    key_dependencies = self._key_dependencies
    if key_dependencies is None:
        # Dependency tracking is disabled; do not touch graph_index at all.
        return
    # Bind the method once; the index is walked exactly one time.
    add_refs = key_dependencies.add_references
    for node in graph_index.iter_all_entries():
        # Add parent refs from graph_index (and discard parent refs
        # that the graph_index has).
        add_refs(node[1], node[3][0])

1812

2189

1813

2190

1814

2191

from bzrlib._groupcompress_py import (

1828

2205

decode_base128_int,

1829

2206

)

1830

2207

GroupCompressor = PyrexGroupCompressor

1831

except ImportError:

2208

except ImportError, e:

2209

osutils.failed_to_load_extension(e)

1832

2210

GroupCompressor = PythonGroupCompressor

1833

2211

Older »