~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/repofmt/groupcompress_repo.py

Committer: John Ferlito
Date: 2009-09-02 04:31:45 UTC
mto: (4665.7.1 serve-init)
mto: This revision was merged to the branch mainline in revision 4913.
Revision ID: johnf@inodes.org-20090902043145-gxdsfw03ilcwbyn5

Add a debian init script for bzr --serve

files added:
bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/benchmarks/bench_tags.py

bzrlib/bencode.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/clean_tree.py

bzrlib/crash.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/groupcompress.py

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/diverged-branches.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/inventory_delta.py

bzrlib/plugins/launchpad/test_lp_login.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/python-compat.h

bzrlib/rename_map.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/smart/packrepository.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/fake_command.py

bzrlib/tests/features.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/https_server.py

bzrlib/tests/per_branch/test_create_clone.py

bzrlib/tests/per_branch/test_dotted_revno_to_revision_id.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_revision_id_to_dotted_revno.py

bzrlib/tests/per_bzrdir/test_push.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_merge_directive.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_get_record_stream.py

bzrlib/tests/per_repository_reference/test_get_rev_id_for_revno.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_workingtree/test_annotate_iter.py

bzrlib/tests/per_workingtree/test_check.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_export.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_lock.py

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart_request.py

bzrlib/util/bencode.py

bzrlib/views.py

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

contrib/debian

contrib/debian/default

contrib/debian/init.d

doc/BUILD-NOTES

doc/Makefile

doc/_static

doc/_static/bzr icon 16.png

doc/_static/bzr.ico

doc/_static/en

doc/_static/en/quick-reference

doc/_templates

doc/_templates/index.html

doc/_templates/layout.html

doc/conf.py

doc/contents.txt

doc/developers/apport.txt

doc/developers/btree_index_prefetch.txt

doc/developers/bug-handling.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/check.txt

doc/developers/colocated-branches.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/ec2.txt

doc/developers/groupcompress-design.txt

doc/developers/improved_chk_index.txt

doc/developers/lca_tree_merging.txt

doc/developers/overview.txt

doc/en/migration

doc/en/migration/index.txt

doc/en/quick-reference/index.txt

doc/en/tutorials/index.txt

doc/en/upgrade-guide

doc/en/upgrade-guide/data_migration.txt

doc/en/upgrade-guide/index.txt

doc/en/upgrade-guide/overview.txt

doc/en/upgrade-guide/tips_and_tricks.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/index-for-2x.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/shelving_changes.txt

doc/es/quick-reference/quick-start-summary.pdf

doc/es/quick-reference/quick-start-summary.png

doc/index.ru.txt

doc/make.bat

doc/news-template.txt

doc/ru

doc/ru/mini-tutorial

doc/ru/mini-tutorial/index.txt

doc/ru/quick-reference

doc/ru/quick-reference/Makefile

doc/ru/quick-reference/quick-start-summary.pdf

doc/ru/quick-reference/quick-start-summary.png

doc/ru/quick-reference/quick-start-summary.svg

doc/ru/tutorials

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/core_concepts.txt

doc/ru/user-guide/images

doc/ru/user-guide/images/workflows_centralized.png

doc/ru/user-guide/images/workflows_centralized.svg

doc/ru/user-guide/images/workflows_gatekeeper.png

doc/ru/user-guide/images/workflows_gatekeeper.svg

doc/ru/user-guide/images/workflows_localcommit.png

doc/ru/user-guide/images/workflows_localcommit.svg

doc/ru/user-guide/images/workflows_peer.png

doc/ru/user-guide/images/workflows_peer.svg

doc/ru/user-guide/images/workflows_pqm.png

doc/ru/user-guide/images/workflows_pqm.svg

doc/ru/user-guide/images/workflows_shared.png

doc/ru/user-guide/images/workflows_shared.svg

doc/ru/user-guide/images/workflows_single.png

doc/ru/user-guide/images/workflows_single.svg

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/stacked.txt

doc/ru/user-guide/using_checkouts.txt

doc/ru/user-guide/zen.txt

tools/check-newsbugs.py

tools/packaging/lp-upload-release

tools/prepare_for_latex.py

tools/rst2pdf.py

tools/time_graph.py

tools/win32/bootstrap.py

tools/win32/build_release.py

tools/win32/buildout-templates

tools/win32/buildout-templates/bin

tools/win32/buildout-templates/bin/build-installer.bat.in

tools/win32/buildout.cfg

files removed:
bzrlib/_walkdirs_win32.h

bzrlib/help_topics/en/hooks.txt

bzrlib/tests/test_http_implementations.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/tests/test_bencode.py

doc/developers/performance-contributing.txt

files renamed:
bzrlib/_btree_serializer_c.pyx => bzrlib/_btree_serializer_pyx.pyx

bzrlib/_dirstate_helpers_c.h => bzrlib/_dirstate_helpers_pyx.h

bzrlib/_dirstate_helpers_c.pyx => bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_knit_load_data_c.pyx => bzrlib/_knit_load_data_pyx.pyx

tools/doc_generate/ => bzrlib/doc_generate/

bzrlib/tests/ftp_server.py => bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/branch_implementations/ => bzrlib/tests/per_branch/

bzrlib/tests/bzrdir_implementations/ => bzrlib/tests/per_bzrdir/

bzrlib/tests/interrepository_implementations/ => bzrlib/tests/per_interrepository/

bzrlib/tests/intertree_implementations/ => bzrlib/tests/per_intertree/

bzrlib/tests/inventory_implementations/ => bzrlib/tests/per_inventory/

bzrlib/tests/test_pack_repository.py => bzrlib/tests/per_pack_repository.py

bzrlib/tests/repository_implementations/ => bzrlib/tests/per_repository/

bzrlib/tests/test_transport_implementations.py => bzrlib/tests/per_transport.py

bzrlib/tests/tree_implementations/ => bzrlib/tests/per_tree/

bzrlib/tests/test_versionedfile.py => bzrlib/tests/per_versionedfile.py

bzrlib/tests/workingtree_implementations/ => bzrlib/tests/per_workingtree/

bzrlib/util/bencode.py => bzrlib/util/_bencode_py.py

doc/en/quick-reference/Makefile => doc/_static/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf => doc/_static/en/quick-reference/bzr-quick-reference.pdf

doc/en/quick-reference/quick-start-summary.png => doc/_static/en/quick-reference/bzr-quick-reference.png

doc/en/quick-reference/quick-start-summary.svg => doc/_static/en/quick-reference/bzr-quick-reference.svg

doc/developers/HACKING.txt => doc/en/developer-guide/HACKING.txt

doc/es/guia-desarrollador/ => doc/es/developer-guide/

doc/es/referencia-rapida/ => doc/es/quick-reference/

doc/es/referencia-rapida/referencia-rapida.svg => doc/es/quick-reference/quick-start-summary.svg

doc/es/notas-version/ => doc/es/release-notes/

doc/es/guia-usuario/ => doc/es/user-guide/

doc/es/referencia/ => doc/es/user-reference/

generate_docs.py => tools/generate_docs.py

files modified:
.bzrignore

Makefile

NEWS

bzrlib/__init__.py

bzrlib/_btree_serializer_py.py

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/chunk_writer.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/readdir.h

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/file_utils.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_break_lock.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_commit.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_http.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_locking.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_sprout.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_branch/test_uncommit.py

bzrlib/tests/per_branch/test_update.py

bzrlib/tests/per_bzrdir/__init__.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_interrepository/test_interrepository.py

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_intertree/test_compare.py

bzrlib/tests/per_inventory/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_annotate_iter.py

bzrlib/tests/per_tree/test_get_file_mtime.py

bzrlib/tests/per_tree/test_get_root_id.py

bzrlib/tests/per_tree/test_get_symlink_target.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_list_files.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_tree/test_revision_tree.py

bzrlib/tests/per_tree/test_test_trees.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_tree/test_walkdirs.py

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_add.py

bzrlib/tests/per_workingtree/test_add_reference.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_basis_tree.py

bzrlib/tests/per_workingtree/test_break_lock.py

bzrlib/tests/per_workingtree/test_changes_from.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_flush.py

bzrlib/tests/per_workingtree/test_get_file_mtime.py

bzrlib/tests/per_workingtree/test_get_parent_ids.py

bzrlib/tests/per_workingtree/test_inv.py

bzrlib/tests/per_workingtree/test_is_control_filename.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_locking.py

bzrlib/tests/per_workingtree/test_merge_from_branch.py

bzrlib/tests/per_workingtree/test_mkdir.py

bzrlib/tests/per_workingtree/test_move.py

bzrlib/tests/per_workingtree/test_nested_specifics.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_put_file.py

bzrlib/tests/per_workingtree/test_read_working_inventory.py

bzrlib/tests/per_workingtree/test_readonly.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_rename_one.py

bzrlib/tests/per_workingtree/test_revision_tree.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_uncommit.py

bzrlib/tests/per_workingtree/test_unversion.py

bzrlib/tests/per_workingtree/test_walkdirs.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/treeshape.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/simplemapi.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

contrib/bzr_access

contrib/newinventory.py

contrib/pwclient.full

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/container-format.txt

doc/developers/development-repo.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/inventory.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/network-protocol.txt

doc/developers/performance-roadmap.txt

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/releasing.txt

doc/developers/revision-properties.txt

doc/developers/testing.txt

doc/en/mini-tutorial/index.txt

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/writing_a_plugin.txt

doc/es/mini-tutorial/index.txt

doc/es/quick-reference/Makefile

doc/index.es.txt

doc/index.txt

profile_imports.py

setup.py

tools/bzr_epydoc_uid.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/package_mf.py

tools/packaging/build-packages.sh

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/weavebench.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/ostools.py

Show diffs side-by-side

added added

removed removed

bzrlib/repofmt/groupcompress_repo.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Repository formats using CHK inventories and groupcompress compression."""

import time

from bzrlib import (

bzrdir,

chk_map,

chk_serializer,

debug,

errors,

index as _mod_index,

inventory,

knit,

osutils,

pack,

remote,

revision as _mod_revision,

trace,

ui,

)

from bzrlib.btree_index import (

BTreeGraphIndex,

BTreeBuilder,

)

from bzrlib.groupcompress import (

_GCGraphIndex,

GroupCompressVersionedFiles,

)

from bzrlib.repofmt.pack_repo import (

Pack,

NewPack,

KnitPackRepository,

KnitPackStreamSource,

PackRootCommitBuilder,

RepositoryPackCollection,

RepositoryFormatPack,

ResumedPack,

Packer,

)

class GCPack(NewPack):
    """A pack being written for a groupcompress repository.

    ``__init__`` replaces the NewPack constructor so that different index
    builder shapes are handed to ``Pack.__init__``, and
    ``_check_references`` is overridden to perform no checks.
    """

    def __init__(self, pack_collection, upload_suffix='', file_mode=None):
        """Create a GCPack instance.

        :param pack_collection: A PackCollection into which this is being
            inserted.
        :param upload_suffix: An optional suffix to be given to any temporary
            files created during the pack creation. e.g '.autopack'
        :param file_mode: An optional file mode to create the new files with.
        """
        # Replaces NewPack.__init__ in order to:
        #  - change inventory reference list length to 1
        #  - change texts reference lists to 1
        # TODO: patch this to be parameterised

        # The relative locations of the packs are constrained, but all are
        # passed in because the caller has them, so as to avoid object churn.
        make_index = pack_collection._index_builder_class
        # from brisbane-core: only build a chk index when the collection
        # itself carries one.
        chk_index = None
        if pack_collection.chk_index is not None:
            chk_index = make_index(reference_lists=0)
        # Revisions: parents list, no text compression.
        revision_index = make_index(reference_lists=1)
        # Inventory: a single reference list is requested here (the comment
        # inherited from NewPack spoke of a 2-list index).
        inventory_index = make_index(reference_lists=1)
        # Texts: per file graph, for all fileids - so one reference list
        # and two elements in the key tuple.
        text_index = make_index(reference_lists=1, key_elements=2)
        # Signatures: Just blobs to store, no compression, no parents
        # listing.
        signature_index = make_index(reference_lists=0)
        # CHK based storage - just blobs, no compression or parents.
        Pack.__init__(self, revision_index, inventory_index, text_index,
                      signature_index, chk_index=chk_index)
        self._pack_collection = pack_collection
        # When we make readonly indices, we need this.
        self.index_class = pack_collection._index_class
        # where should the new pack be opened
        self.upload_transport = pack_collection._upload_transport
        # where are indices written out to
        self.index_transport = pack_collection._index_transport
        # where is the pack renamed to when it is finished?
        self.pack_transport = pack_collection._pack_transport
        # What file mode to upload the pack and indices with.
        self._file_mode = file_mode
        # tracks the content written to the .pack file.
        self._hash = osutils.md5()
        # Index sizes in bytes, filled in once the pack is finalised
        # (original comment: a four-tuple of rev, inv, text, sigs).
        self.index_sizes = None
        # How much data to cache when writing packs. Note that this is not
        # synchronised with reads, because it's not in the transport layer, so
        # is not safe unless the client knows it won't be reading from the pack
        # under creation.
        self._cache_limit = 0
        # the temporary pack file name.
        self.random_name = osutils.rand_chars(20) + upload_suffix
        # when was this pack started ?
        self.start_time = time.time()
        # open an output stream for the data added to the pack.
        self.write_stream = self.upload_transport.open_write_stream(
            self.random_name, mode=self._file_mode)
        if 'pack' in debug.debug_flags:
            trace.mutter('%s: create_pack: pack stream open: %s%s t+%6.3fs',
                         time.ctime(), self.upload_transport.base,
                         self.random_name,
                         time.time() - self.start_time)
        # A list of byte sequences to be written to the new pack, and the
        # aggregate size of them. Stored as a list rather than separate
        # variables so that the _write_data closure below can update them.
        self._buffer = [[], 0]

        # robertc says- this is a closure rather than a method on the object
        # so that the variables are locals, and faster than accessing object
        # members.
        def _write_data(bytes, flush=False, _buffer=self._buffer,
                        _write=self.write_stream.write,
                        _update=self._hash.update):
            _buffer[0].append(bytes)
            _buffer[1] += len(bytes)
            # Flush once the buffered size exceeds the cache limit, or when
            # the caller explicitly asks for it.
            if _buffer[1] > self._cache_limit or flush:
                bytes = ''.join(_buffer[0])
                _write(bytes)
                _update(bytes)
                _buffer[:] = [[], 0]

        # expose this on self, for the occasion when clients want to add data.
        self._write_data = _write_data
        # a pack writer object to serialise pack records.
        self._writer = pack.ContainerWriter(self._write_data)
        self._writer.begin()
        # what state is the pack in? (open, finished, aborted)
        self._state = 'open'
        # no name until we finish writing the content
        self.name = None

    def _check_references(self):
        """Make sure our external references are present.

        Packs are allowed to have deltas whose base is not in the pack, but it
        must be present somewhere in this collection.  It is not allowed to
        have deltas based on a fallback repository.
        (See <https://bugs.launchpad.net/bzr/+bug/288751>)

        This implementation intentionally does nothing.
        """
        # Groupcompress packs don't have any external references, arguably CHK
        # pages have external references, but we cannot 'cheaply' determine
        # them without actually walking all of the chk pages.

171

172

173

class ResumedGCPack(ResumedPack):
    """Resumed-pack variant whose reference checks are no-ops."""

    def _check_references(self):
        """Make sure our external compression parents are present.

        Deliberately empty.
        """
        # See GCPack._check_references for why this is empty

    def _get_external_refs(self, index):
        """Return the external references of ``index``: always an empty set."""
        # GC repositories don't have compression parents external to a given
        # pack file
        no_external_refs = set()
        return no_external_refs

183

184

185

class GCCHKPacker(Packer):

186

"""This class understand what it takes to collect a GCCHK repo."""

187

188

def __init__(self, pack_collection, packs, suffix, revision_ids=None,
             reload_func=None):
    """Set up a packer for a collection that has a chk index.

    All arguments are forwarded unchanged to the base Packer constructor.

    :raises AssertionError: if ``pack_collection.chk_index`` is None.
    """
    super(GCCHKPacker, self).__init__(
        pack_collection, packs, suffix,
        revision_ids=revision_ids, reload_func=reload_func)
    self._pack_collection = pack_collection
    # ATM, We only support this for GCCHK repositories
    if pack_collection.chk_index is None:
        raise AssertionError('pack_collection.chk_index should not be None')
    # Whether _get_chk_streams should also collect text references.
    self._gather_text_refs = False
    # Root keys of the two CHK maps, appended to in first-seen order by
    # _get_filtered_inv_stream.
    self._chk_id_roots = []
    self._chk_p_id_roots = []
    self._text_refs = None
    # set by .pack() if self.revision_ids is not None
    self.revision_keys = None

203

204

def _get_progress_stream(self, source_vf, keys, message, pb):
    """Return a lazy record stream for ``keys`` that reports progress.

    :param source_vf: object providing ``get_record_stream``.
    :param keys: the keys to request; ``len(keys)`` is the progress total.
    :param message: text passed to ``pb.update`` for every record.
    :param pb: a progress bar, or None to skip reporting.
    :return: a generator; the underlying stream is only requested once
        iteration starts.
    """
    def _records_with_progress():
        records = source_vf.get_record_stream(keys, 'groupcompress', True)
        position = 0
        for record in records:
            position += 1
            if pb is not None:
                pb.update(message, position, len(keys))
            yield record
    return _records_with_progress()

212

213

def _get_filtered_inv_stream(self, source_vf, keys, message, pb=None):
    """Stream inventory records while collecting their CHK root keys.

    Every record is deserialised as a CHKInventory; the key of its
    ``id_to_entry`` map is appended to ``self._chk_id_roots`` and the key of
    its ``parent_id_basename_to_file_id`` map to ``self._chk_p_id_roots``,
    each only the first time it is seen by this stream.

    :param message: accepted for signature compatibility; progress is
        always reported under the fixed label 'inv'.
    :param pb: optional progress bar.
    :return: a generator yielding the records unchanged.
    :raises AssertionError: (during iteration) if an inventory has no
        parent_id_basename_to_file_id map.
    """
    key_count = len(keys)

    def _inventory_records():
        seen_id_roots = set()
        seen_p_id_roots = set()
        records = source_vf.get_record_stream(keys, 'groupcompress', True)
        for position, record in enumerate(records):
            # Inventories should always be with revisions; assume success.
            fulltext = record.get_bytes_as('fulltext')
            chk_inv = inventory.CHKInventory.deserialise(
                None, fulltext, record.key)
            if pb is not None:
                pb.update('inv', position, key_count)
            id_root = chk_inv.id_to_entry.key()
            if id_root not in seen_id_roots:
                self._chk_id_roots.append(id_root)
                seen_id_roots.add(id_root)
            p_id_map = chk_inv.parent_id_basename_to_file_id
            if p_id_map is None:
                raise AssertionError('Parent id -> file_id map not set')
            p_id_root = p_id_map.key()
            if p_id_root not in seen_p_id_roots:
                seen_p_id_roots.add(p_id_root)
                self._chk_p_id_roots.append(p_id_root)
            yield record
        # All inventory records are processed; the de-duplication sets are
        # no longer needed.
        seen_id_roots.clear()
        seen_p_id_roots.clear()

    return _inventory_records()

244

245

def _get_chk_streams(self, source_vf, keys, pb=None):
    """Yield record streams covering the CHK pages in ``keys``.

    This is a generator of generators/streams.  In order it yields:

    1. one stream per tree level for pages reachable from
       ``self._chk_id_roots``;
    2. one stream per tree level for pages reachable from those entries of
       ``self._chk_p_id_roots`` that are still unvisited;
    3. if any keys remain and ``self.revision_ids`` is None, a single
       'unordered' stream of the leftovers.

    Side effects: ``self._chk_id_roots`` and ``self._chk_p_id_roots`` are
    deleted as they are consumed.  When ``self._gather_text_refs`` is set,
    ``self._text_refs`` is replaced by a set that is filled with
    ``(file_id, revision_id)`` pairs parsed from id_to_entry leaf nodes.

    :param source_vf: object providing ``get_record_stream``.
    :param keys: all chk keys available in the source.
    :param pb: optional progress bar, updated once per non-absent record.
    """
    # We want to stream the keys from 'id_roots', and things they
    # reference, and then stream things from p_id_roots and things they
    # reference, and then any remaining keys that we didn't get to.

    # We also group referenced texts together, so if one root references a
    # text with prefix 'a', and another root references a node with prefix
    # 'a', we want to yield those nodes before we yield the nodes for 'b'
    # This keeps 'similar' nodes together.

    # Note: We probably actually want multiple streams here, to help the
    #       client understand that the different levels won't compress well
    #       against each other.
    #       Test the difference between using one Group per level, and
    #       using 1 Group per prefix. (so '' (root) would get a group, then
    #       all the references to search-key 'a' would get a group, etc.)
    total_keys = len(keys)
    remaining_keys = set(keys)
    # One-element list so the nested generators can increment it.
    counter = [0]
    if self._gather_text_refs:
        # bytes_to_info is only bound on this path; handle_leaf_node is only
        # invoked for the first root set, which passes
        # self._gather_text_refs as parse_leaf_nodes.
        bytes_to_info = inventory.CHKInventory._bytes_to_utf8name_key
        self._text_refs = set()
    def _get_referenced_stream(root_keys, parse_leaf_nodes=False):
        cur_keys = root_keys
        while cur_keys:
            keys_by_search_prefix = {}
            remaining_keys.difference_update(cur_keys)
            next_keys = set()
            def handle_internal_node(node):
                for prefix, value in node._items.iteritems():
                    # We don't want to request the same key twice, and we
                    # want to order it by the first time it is seen.
                    # Even further, we don't want to request a key which is
                    # not in this group of pack files (it should be in the
                    # repo, but it doesn't have to be in the group being
                    # packed.)
                    # TODO: consider how to treat externally referenced chk
                    #       pages as 'external_references' so that we
                    #       always fill them in for stacked branches
                    if value not in next_keys and value in remaining_keys:
                        keys_by_search_prefix.setdefault(prefix,
                            []).append(value)
                        next_keys.add(value)
            def handle_leaf_node(node):
                # Store is None, because we know we have a LeafNode, and we
                # just want its entries
                for file_id, bytes in node.iteritems(None):
                    name_utf8, file_id, revision_id = bytes_to_info(bytes)
                    self._text_refs.add((file_id, revision_id))
            def next_stream():
                # Reads cur_keys lazily: the stream is requested on first
                # iteration, using whatever cur_keys is bound to then.
                stream = source_vf.get_record_stream(cur_keys,
                                                     'as-requested', True)
                for record in stream:
                    if record.storage_kind == 'absent':
                        # An absent CHK record: we assume that the missing
                        # record is in a different pack - e.g. a page not
                        # altered by the commit we're packing.
                        continue
                    bytes = record.get_bytes_as('fulltext')
                    # We don't care about search_key_func for this code,
                    # because we only care about external references.
                    node = chk_map._deserialise(bytes, record.key,
                                                search_key_func=None)
                    # NOTE(review): common_base is not read anywhere below.
                    common_base = node._search_prefix
                    if isinstance(node, chk_map.InternalNode):
                        handle_internal_node(node)
                    elif parse_leaf_nodes:
                        handle_leaf_node(node)
                    counter[0] += 1
                    if pb is not None:
                        pb.update('chk node', counter[0], total_keys)
                    yield record
            yield next_stream()
            # Double check that we won't be emitting any keys twice
            # If we get rid of the pre-calculation of all keys, we could
            # turn this around and do
            # next_keys.difference_update(seen_keys)
            # However, we also may have references to chk pages in another
            # pack file during autopack. We filter earlier, so we should no
            # longer need to do this
            # next_keys = next_keys.intersection(remaining_keys)
            # Build the next level's request list, grouped by sorted prefix.
            cur_keys = []
            for prefix in sorted(keys_by_search_prefix):
                cur_keys.extend(keys_by_search_prefix.pop(prefix))
    for stream in _get_referenced_stream(self._chk_id_roots,
                                         self._gather_text_refs):
        yield stream
    del self._chk_id_roots
    # while it isn't really possible for chk_id_roots to not be in the
    # local group of packs, it is possible that the tree shape has not
    # changed recently, so we need to filter _chk_p_id_roots by the
    # available keys
    chk_p_id_roots = [key for key in self._chk_p_id_roots
                      if key in remaining_keys]
    del self._chk_p_id_roots
    for stream in _get_referenced_stream(chk_p_id_roots, False):
        yield stream
    if remaining_keys:
        trace.mutter('There were %d keys in the chk index, %d of which'
                     ' were not referenced', total_keys,
                     len(remaining_keys))
        # Unreferenced pages are only carried over when no explicit
        # revision_ids were given.
        if self.revision_ids is None:
            stream = source_vf.get_record_stream(remaining_keys,
                                                 'unordered', True)
            yield stream

350

351

def _build_vf(self, index_name, parents, delta, for_write=False):
    """Build a VersionedFiles instance on top of this group of packs.

    :param index_name: index name without the '_index' suffix, e.g. 'text'.
    :param parents: passed to _GCGraphIndex as ``parents``.
    :param delta: passed to GroupCompressVersionedFiles as ``delta``.
    :param for_write: when true the result writes into ``self.new_pack``;
        otherwise it reads from the combined indices of ``self.packs``.
    :raises AssertionError: if ``for_write`` is set but no new pack exists.
    """
    attr_name = index_name + '_index'
    pack_for_index = {}
    access = knit._DirectPackAccess(pack_for_index)
    if not for_write:
        # Read side: combine the matching index of every source pack.
        sub_indices = []
        for old_pack in self.packs:
            sub_index = getattr(old_pack, attr_name)
            pack_for_index[sub_index] = old_pack.access_tuple()
            sub_indices.append(sub_index)
        index = _mod_index.CombinedGraphIndex(sub_indices)
        add_callback = None
    else:
        # Write side: use new_pack
        if self.new_pack is None:
            raise AssertionError('No new pack has been set')
        index = getattr(self.new_pack, attr_name)
        pack_for_index[index] = self.new_pack.access_tuple()
        index.set_optimize(for_size=True)
        access.set_writer(self.new_pack._writer, index,
                          self.new_pack.access_tuple())
        add_callback = index.add_nodes
    graph_index = _GCGraphIndex(
        index,
        add_callback=add_callback,
        parents=parents,
        is_locked=self._pack_collection.repo.is_locked)
    return GroupCompressVersionedFiles(graph_index, access=access,
                                       delta=delta)

382

383

def _build_vfs(self, index_name, parents, delta):
    """Build the source and target VersionedFiles.

    :return: a ``(source_vf, target_vf)`` tuple; the source is built with
        ``for_write=False`` first, then the target with ``for_write=True``.
    """
    return (
        self._build_vf(index_name, parents, delta, for_write=False),
        self._build_vf(index_name, parents, delta, for_write=True),
    )

390

391

def _copy_stream(self, source_vf, target_vf, keys, message, vf_to_stream,
                 pb_offset):
    """Copy the records for ``keys`` from ``source_vf`` into ``target_vf``.

    :param message: noun used in log and progress output (e.g. 'texts').
    :param vf_to_stream: callable ``(source_vf, keys, message, pb)``
        returning the record stream to insert.
    :param pb_offset: value passed to ``self.pb.update`` for this phase.
    """
    trace.mutter('repacking %d %s', len(keys), message)
    self.pb.update('repacking %s' % (message,), pb_offset)
    nested_pb = ui.ui_factory.nested_progress_bar()
    try:
        records = vf_to_stream(source_vf, keys, message, nested_pb)
        inserter = target_vf._insert_record_stream(
            records, random_id=True, reuse_blocks=False)
        # The inserter is lazy; drain it so every record is written.
        for _ignored in inserter:
            pass
    finally:
        nested_pb.finished()

404

405

def _copy_revision_texts(self):
    """Copy revision records into the new pack.

    If ``self.revision_keys`` is empty or None, it is first set to every
    key in the source revisions.
    """
    revisions_from, revisions_to = self._build_vfs('revision', True, False)
    if not self.revision_keys:
        # We are doing a full fetch, aka 'pack'
        self.revision_keys = revisions_from.keys()
    self._copy_stream(revisions_from, revisions_to, self.revision_keys,
                      'revisions', self._get_progress_stream, 1)

412

413

def _copy_inventory_texts(self):
    """Copy every source inventory into the new pack.

    :raises ValueError: if any key in ``self.revision_keys`` has no
        inventory in the source.
    """
    inv_source, inv_target = self._build_vfs('inventory', True, True)
    # It is not sufficient to just use self.revision_keys, as stacked
    # repositories can have more inventories than they have revisions.
    # One alternative would be to do something with
    # get_parent_map(self.revision_keys), but that shouldn't be any faster
    # than this.
    all_inventory_keys = inv_source.keys()
    absent = set(self.revision_keys).difference(all_inventory_keys)
    if absent:
        absent = sorted(absent)
        raise ValueError('We are missing inventories for revisions: %s'
                         % (absent,))
    self._copy_stream(inv_source, inv_target, all_inventory_keys,
                      'inventories', self._get_filtered_inv_stream, 2)

428

429

def _copy_chk_texts(self):
    """Copy CHK pages into the new pack, one stream at a time.

    The streams come from ``self._get_chk_streams``; each is inserted into
    the target separately.
    """
    chk_source, chk_target = self._build_vfs('chk', False, False)
    # TODO: This is technically spurious... if it is a performance issue,
    #       remove it
    all_chk_keys = chk_source.keys()
    trace.mutter('repacking chk: %d id_to_entry roots,'
                 ' %d p_id_map roots, %d total keys',
                 len(self._chk_id_roots), len(self._chk_p_id_roots),
                 len(all_chk_keys))
    self.pb.update('repacking chk', 3)
    nested_pb = ui.ui_factory.nested_progress_bar()
    try:
        chk_streams = self._get_chk_streams(chk_source, all_chk_keys,
                                            pb=nested_pb)
        for chk_stream in chk_streams:
            inserter = chk_target._insert_record_stream(
                chk_stream, random_id=True, reuse_blocks=False)
            # Drain the lazy inserter so the records are actually written.
            for _ignored in inserter:
                pass
    finally:
        nested_pb.finished()

449

450

def _copy_text_texts(self):
    """Copy every text present in the source packs into the new pack."""
    texts_from, texts_to = self._build_vfs('text', True, True)
    # XXX: We don't walk the chk map to determine referenced (file_id,
    #      revision_id) keys.  We don't do it yet because you really need
    #      to filter out the ones that are present in the parents of the
    #      rev just before the ones you are copying, otherwise the filter
    #      is grabbing too many keys...
    every_text_key = texts_from.keys()
    self._copy_stream(texts_from, texts_to, every_text_key,
                      'texts', self._get_progress_stream, 4)

460

461

def _copy_signature_texts(self):
    """Copy the signatures of the revisions being packed.

    Only signature keys that are also in ``self.revision_keys`` are copied.
    """
    source_vf, target_vf = self._build_vfs('signature', False, False)
    # intersection() returns a new set rather than filtering in place, so
    # the result must be kept; previously it was discarded and every
    # signature in the source packs was copied.
    signature_keys = source_vf.keys().intersection(self.revision_keys)
    self._copy_stream(source_vf, target_vf, signature_keys,
                      'signatures', self._get_progress_stream, 5)

467

468

def _create_pack_from_packs(self):
    """Write a new pack holding the content of ``self.packs``.

    :return: the finished new pack, or None when the pack was aborted
        (either ``_use_pack`` rejected it, or the single source pack
        already has the name the new pack would get).
    """
    self.pb.update('repacking', 0, 7)
    self.new_pack = self.open_pack()
    # Is this necessary for GC ?
    self.new_pack.set_write_cache_size(1024*1024)
    # The copy phases run in a fixed order: revisions, inventories, chk
    # pages, texts, signatures.
    self._copy_revision_texts()
    self._copy_inventory_texts()
    self._copy_chk_texts()
    self._copy_text_texts()
    self._copy_signature_texts()
    self.new_pack._check_references()
    if not self._use_pack(self.new_pack):
        self.new_pack.abort()
        return None
    self.new_pack.finish_content()
    if len(self.packs) == 1:
        only_pack = self.packs[0]
        already_optimal = (
            only_pack.name == self.new_pack._hash.hexdigest())
        if already_optimal:
            # The single old pack was already optimally packed.
            trace.mutter('single pack %s was already optimally packed',
                         only_pack.name)
            self.new_pack.abort()
            return None
    self.pb.update('finishing repack', 6, 7)
    self.new_pack.finish()
    self._pack_collection.allocate(self.new_pack)
    return self.new_pack

495

496

497

class GCCHKReconcilePacker(GCCHKPacker):

498

"""A packer which regenerates indices etc as it copies.

499

500

This is used by ``bzr reconcile`` to cause parent text pointers to be

501

regenerated.

502

"""

503

504

def __init__(self, *args, **kwargs):
    """Initialise as GCCHKPacker does, then switch on text-ref gathering.

    All arguments are passed straight through to the parent constructor.
    """
    super(GCCHKReconcilePacker, self).__init__(*args, **kwargs)
    # Flipped to True by the copy steps when the rewritten data differs
    # from the source; consulted by _use_pack.
    self._data_changed = False
    # Overrides the False set by the parent constructor.
    self._gather_text_refs = True

508

509

def _copy_inventory_texts(self):
    """Copy only the inventories named by ``self.revision_keys``.

    Marks the data as changed when the source's inventory keys do not
    compare equal to ``self.revision_keys``.
    """
    inv_source, inv_target = self._build_vfs('inventory', True, True)
    self._copy_stream(inv_source, inv_target, self.revision_keys,
                      'inventories', self._get_filtered_inv_stream, 2)
    source_keys = inv_source.keys()
    if source_keys != self.revision_keys:
        self._data_changed = True

515

516

def _copy_text_texts(self):
    """Generate what texts we should have and then copy.

    The texts considered are the ``(file_id, revision_id)`` keys in
    ``self._text_refs``.  For each one the parents recorded in the source
    are compared with the parents from the repository's generated text key
    index; records whose parents differ are re-inserted with the corrected
    parents.  ``self._data_changed`` is set whenever a key is absent from
    the generated index or its parents had to be corrected.
    """
    source_vf, target_vf = self._build_vfs('text', True, True)
    trace.mutter('repacking %d texts', len(self._text_refs))
    self.pb.update("repacking texts", 4)
    # we have three major tasks here:
    # 1) generate the ideal index
    repo = self._pack_collection.repo
    # We want the one we just wrote, so base it on self.new_pack
    revision_vf = self._build_vf('revision', True, False, for_write=True)
    ancestor_keys = revision_vf.get_parent_map(revision_vf.keys())
    # Strip keys back into revision_ids.
    ancestors = dict((k[0], tuple([p[0] for p in parents]))
                     for k, parents in ancestor_keys.iteritems())
    del ancestor_keys
    # TODO: _generate_text_key_index should be much cheaper to generate from
    #       a chk repository, rather than the current implementation
    ideal_index = repo._generate_text_key_index(None, ancestors)
    file_id_parent_map = source_vf.get_parent_map(self._text_refs)
    # 2) generate a keys list that contains all the entries that can
    #    be used as-is, with corrected parents.
    # NOTE(review): ok_keys and discarded_keys are only appended to in this
    # method; nothing below reads them, and the record stream in step 3
    # requests every key in self._text_refs, discarded ones included.
    ok_keys = []
    new_parent_keys = {} # (key, parent_keys)
    discarded_keys = []
    NULL_REVISION = _mod_revision.NULL_REVISION
    for key in self._text_refs:
        # 0 - index
        # 1 - key
        # 2 - value
        # 3 - refs
        try:
            ideal_parents = tuple(ideal_index[key])
        except KeyError:
            # The generated index has no entry for this text.
            discarded_keys.append(key)
            self._data_changed = True
        else:
            # A lone NULL_REVISION parent is treated as "no parents".
            if ideal_parents == (NULL_REVISION,):
                ideal_parents = ()
            source_parents = file_id_parent_map[key]
            if ideal_parents == source_parents:
                # no change needed.
                ok_keys.append(key)
            else:
                # We need to change the parent graph, but we don't need to
                # re-insert the text (since we don't pun the compression
                # parent with the parents list)
                self._data_changed = True
                new_parent_keys[key] = ideal_parents
    # we're finished with some data.
    del ideal_index
    del file_id_parent_map
    # 3) bulk copy the data, updating records than need it
    def _update_parents_for_texts():
        stream = source_vf.get_record_stream(self._text_refs,
                                             'groupcompress', False)
        for record in stream:
            # Overwrite the parents on records that need correcting.
            if record.key in new_parent_keys:
                record.parents = new_parent_keys[record.key]
            yield record
    target_vf.insert_record_stream(_update_parents_for_texts())

576

577

def _use_pack(self, new_pack):
    """Decide whether the reconciled pack should replace the old ones.

    :return: the (falsy) result of ``new_pack.data_inserted()`` when nothing
        was inserted, otherwise ``self._data_changed``.
    """
    inserted = new_pack.data_inserted()
    if not inserted:
        return inserted
    return self._data_changed

580

581

582

class GCRepositoryPackCollection(RepositoryPackCollection):
    """Pack collection that creates GCPack / ResumedGCPack packs."""

    pack_factory = GCPack
    resumed_pack_factory = ResumedGCPack

    def _execute_pack_operations(self, pack_operations,
                                 _packer_class=GCCHKPacker,
                                 reload_func=None):
        """Execute a series of pack operations.

        :param pack_operations: A list of [revision_count, packs_to_combine].
        :param _packer_class: The class of packer to use (default:
            GCCHKPacker).
        :param reload_func: Passed through to the packer.
        :return: None.
        """
        # XXX: Copied across from RepositoryPackCollection simply because we
        #      want a different default for _packer_class ... :(
        for revision_count, packs in pack_operations:
            # we may have no-ops from the setup logic
            if len(packs) == 0:
                continue
            # Honour the caller's packer class; this used to be hard-coded
            # to GCCHKPacker, silently ignoring the parameter.
            packer = _packer_class(self, packs, '.autopack',
                                   reload_func=reload_func)
            try:
                result = packer.pack()
            except errors.RetryWithNewPacks:
                # An exception is propagating out of this context, make sure
                # this packer has cleaned up. Packer() doesn't set its new_pack
                # state into the RepositoryPackCollection object, so we only
                # have access to it directly here.
                if packer.new_pack is not None:
                    packer.new_pack.abort()
                raise
            if result is None:
                # The packer produced nothing: stop without saving names.
                return
            for old_pack in packs:
                self._remove_pack_from_memory(old_pack)
        # record the newly available packs and stop advertising the old
        # packs
        self._save_pack_names(clear_obsolete_packs=True)
        # Move the old packs out of the way now they are no longer referenced.
        for revision_count, packs in pack_operations:
            self._obsolete_packs(packs)

624

625

626

class CHKInventoryRepository(KnitPackRepository):

627

"""subclass of KnitPackRepository that uses CHK based inventories."""

628

629

def __init__(self, _format, a_bzrdir, control_files, _commit_builder_class,
             _serializer):
    """Overridden to change pack collection class.

    After the base constructor runs, the pack collection and the five
    versioned-file stores (inventories, revisions, signatures, texts,
    chk_bytes) are replaced with groupcompress-backed ones.
    """
    KnitPackRepository.__init__(self, _format, a_bzrdir, control_files,
                                _commit_builder_class, _serializer)
    # and now replace everything it did :)
    index_transport = self._transport.clone('indices')
    upload_transport = self._transport.clone('upload')
    pack_transport = self._transport.clone('packs')
    self._pack_collection = GCRepositoryPackCollection(
        self,
        self._transport, index_transport,
        upload_transport,
        pack_transport,
        _format.index_builder_class,
        _format.index_class,
        use_chk_index=self._format.supports_chks,
        )
    collection = self._pack_collection

    inventory_index = collection.inventory_index
    self.inventories = GroupCompressVersionedFiles(
        _GCGraphIndex(inventory_index.combined_index,
                      add_callback=inventory_index.add_callback,
                      parents=True, is_locked=self.is_locked,
                      inconsistency_fatal=False),
        access=inventory_index.data_access)

    revision_index = collection.revision_index
    self.revisions = GroupCompressVersionedFiles(
        _GCGraphIndex(revision_index.combined_index,
                      add_callback=revision_index.add_callback,
                      parents=True, is_locked=self.is_locked,
                      track_external_parent_refs=True),
        access=revision_index.data_access,
        delta=False)

    signature_index = collection.signature_index
    self.signatures = GroupCompressVersionedFiles(
        _GCGraphIndex(signature_index.combined_index,
                      add_callback=signature_index.add_callback,
                      parents=False, is_locked=self.is_locked,
                      inconsistency_fatal=False),
        access=signature_index.data_access,
        delta=False)

    text_index = collection.text_index
    self.texts = GroupCompressVersionedFiles(
        _GCGraphIndex(text_index.combined_index,
                      add_callback=text_index.add_callback,
                      parents=True, is_locked=self.is_locked,
                      inconsistency_fatal=False),
        access=text_index.data_access)

    # No parents, individual CHK pages don't have specific ancestry
    chk_index = collection.chk_index
    self.chk_bytes = GroupCompressVersionedFiles(
        _GCGraphIndex(chk_index.combined_index,
                      add_callback=chk_index.add_callback,
                      parents=False, is_locked=self.is_locked,
                      inconsistency_fatal=False),
        access=chk_index.data_access)
    # The search key function is looked up by the name the serializer
    # declares and attached to the chk store.
    search_key_name = self._format._serializer.search_key_name
    self.chk_bytes._search_key_func = chk_map.search_key_registry.get(
        search_key_name)
    # True when the repository object is 'write locked' (as opposed to the
    # physical lock only taken out around changes to the pack-names list.)
    # Another way to represent this would be a decorator around the control
    # files object that presents logical locks as physical ones - if this
    # gets ugly consider that alternative design. RBC 20071011
    self._write_lock_count = 0
    self._transaction = None
    # for tests
    self._reconcile_does_inventory_gc = True
    self._reconcile_fixes_text_parents = True
    self._reconcile_backsup_inventory = False

691

692

def _add_inventory_checked(self, revision_id, inv, parents):
    """Add inv to the repository after checking the inputs.

    The inventory is converted to a CHKInventory stored in
    ``self.chk_bytes`` and its lines are added without content checking.

    This function can be overridden to allow different inventory styles.

    :seealso: add_inventory, for the contract.
    :return: whatever ``self._inventory_add_lines`` returns.
    """
    # make inventory
    serializer = self._format._serializer
    chk_inventory = inventory.CHKInventory.from_inventory(
        self.chk_bytes, inv,
        maximum_size=serializer.maximum_size,
        search_key_name=serializer.search_key_name)
    serialised_lines = chk_inventory.to_lines()
    return self._inventory_add_lines(
        revision_id, parents, serialised_lines, check_content=False)

707

708

def _create_inv_from_null(self, delta, revision_id):
    """Build a new CHKInventory from a delta against NULL_REVISION.

    This is a simplified form of create_by_apply_delta which knows that all
    the old values must be None, so everything is a create.

    :param delta: iterable of ``(old_path, new_path, file_id, entry)``.
    :param revision_id: revision id assigned to the new inventory.
    :return: the populated CHKInventory.
    :raises ValueError: if an item has an old_path or lacks a new_path.
    """
    serializer = self._format._serializer
    new_inv = inventory.CHKInventory(serializer.search_key_name)
    new_inv.revision_id = revision_id
    entry_to_bytes = new_inv._entry_to_bytes
    entries_by_id = {}
    ids_by_parent_and_name = {}
    for old_path, new_path, file_id, entry in delta:
        if old_path is not None:
            raise ValueError('Invalid delta, somebody tried to delete %r'
                             ' from the NULL_REVISION'
                             % ((old_path, file_id),))
        if new_path is None:
            raise ValueError('Invalid delta, delta from NULL_REVISION has'
                             ' no new_path %r' % (file_id,))
        if new_path != '':
            name_utf8 = entry.name.encode('utf-8')
            parent_and_name = (entry.parent_id, name_utf8)
        else:
            # The empty path is the tree root.
            new_inv.root_id = file_id
            parent_and_name = ('', '')
        serialised_entry = entry_to_bytes(entry)
        # Populate Caches?
        # new_inv._path_to_fileid_cache[new_path] = file_id
        entries_by_id[(file_id,)] = serialised_entry
        ids_by_parent_and_name[parent_and_name] = file_id

    new_inv._populate_from_dicts(self.chk_bytes, entries_by_id,
                                 ids_by_parent_and_name,
                                 maximum_size=serializer.maximum_size)
    return new_inv

743

744

def add_inventory_by_delta(self, basis_revision_id, delta, new_revision_id,
                           parents, basis_inv=None, propagate_caches=False):
    """Add a new inventory expressed as a delta against another revision.

    :param basis_revision_id: The inventory id the delta was created
        against.
    :param delta: The inventory delta (see Inventory.apply_delta for
        details).
    :param new_revision_id: The revision id that the inventory is being
        added for.
    :param parents: The revision ids of the parents that revision_id is
        known to have and are in the repository already. These are supplied
        for repositories that depend on the inventory graph for revision
        graph access, as well as for those that pun ancestry with delta
        compression.
    :param basis_inv: The basis inventory if it is already known,
        otherwise None.
    :param propagate_caches: If True, the caches for this inventory are
        copied to and updated for the result if possible.

    :returns: (validator, new_inv)
        The validator(which is a sha1 digest, though what is sha'd is
        repository format specific) of the serialized inventory, and the
        resulting inventory.
    :raises AssertionError: if the repository is not in a write group.
    """
    if not self.is_in_write_group():
        raise AssertionError("%r not in write group" % (self,))
    _mod_revision.check_not_reserved_id(new_revision_id)
    basis_tree = None
    if basis_inv is None:
        if basis_revision_id == _mod_revision.NULL_REVISION:
            # No basis at all: build the inventory directly from the delta.
            new_inv = self._create_inv_from_null(delta, new_revision_id)
            inv_lines = new_inv.to_lines()
            return self._inventory_add_lines(new_revision_id, parents,
                inv_lines, check_content=False), new_inv
        basis_tree = self.revision_tree(basis_revision_id)
        basis_tree.lock_read()
    try:
        if basis_tree is not None:
            # Read the inventory inside the try block so the read lock is
            # released even if loading it raises.
            basis_inv = basis_tree.inventory
        result = basis_inv.create_by_apply_delta(delta, new_revision_id,
            propagate_caches=propagate_caches)
        inv_lines = result.to_lines()
        return self._inventory_add_lines(new_revision_id, parents,
            inv_lines, check_content=False), result
    finally:
        if basis_tree is not None:
            basis_tree.unlock()

792

793

def deserialise_inventory(self, revision_id, bytes):
    """Turn serialised inventory bytes into a CHKInventory.

    :param revision_id: The revision id the inventory belongs to; it is
        wrapped into the one-element key tuple handed to the deserialiser.
    :param bytes: The serialised form of the inventory.
    :return: Whatever inventory.CHKInventory.deserialise produces for this
        repository's chk_bytes store, the given bytes and the key.
    """
    inv_key = (revision_id,)
    return inventory.CHKInventory.deserialise(self.chk_bytes, bytes, inv_key)

796

797

def _iter_inventories(self, revision_ids, ordering):
    """Yield one CHKInventory per requested revision id.

    :param revision_ids: The revision ids whose inventories are wanted.
    :param ordering: Ordering passed to get_record_stream; None is treated
        as 'unordered'.
    :raises errors.NoSuchRevision: if the record stream reports any of the
        requested inventories as absent.

    All fulltexts are collected first, so the inventories are always
    yielded in the order of revision_ids regardless of the stream order.
    """
    if ordering is None:
        ordering = 'unordered'
    wanted_keys = [(rev_id,) for rev_id in revision_ids]
    fulltexts = {}
    for rec in self.inventories.get_record_stream(wanted_keys, ordering, True):
        if rec.storage_kind == 'absent':
            raise errors.NoSuchRevision(self, rec.key)
        fulltexts[rec.key] = rec.get_bytes_as('fulltext')
    for inv_key in wanted_keys:
        yield inventory.CHKInventory.deserialise(
            self.chk_bytes, fulltexts[inv_key], inv_key)

811

812

def _iter_inventory_xmls(self, revision_ids, ordering):
    """Yield (serialised inventory, revision id) pairs.

    There is no native 'xml' inventory here, so this method does not really
    make sense for this repository.  Older working trees and older bundles
    still want it, so it is supplied to let get_inventory_xml work.  Bundles
    currently use the serializer directly, which is not ideal either, but
    repositories offer no xml iteration interface at all.
    _iter_inventory_xmls could become part of the contract, even if it
    stays private.

    :param revision_ids: The revision ids to serialise inventories for.
    :param ordering: Passed through to iter_inventories.
    """
    serialise = self._serializer.write_inventory_to_string
    for inv in self.iter_inventories(revision_ids, ordering=ordering):
        text = serialise(inv)
        yield text, inv.revision_id

822

823

def _find_present_inventory_keys(self, revision_keys):
    """Return the subset of revision_keys known to self.inventories.

    :param revision_keys: Keys to look up via inventories.get_parent_map.
    :return: A new set holding every key of the returned parent map.
    """
    return set(self.inventories.get_parent_map(revision_keys))

827

828

def fileids_altered_by_revision_ids(self, revision_ids, _inv_weave=None):
    """Find the file ids and versions affected by revisions.

    :param revision_ids: an iterable containing revision ids.  It is only
        iterated once, so a one-shot iterator is acceptable.
    :param _inv_weave: Not referenced by this implementation; kept in the
        signature so existing callers keep working.
    :return: a dictionary mapping altered file-ids to a set of
        revision_ids. Each altered file-id has the exact revision_ids that
        altered it listed explicitly.
    """
    rich_root = self.supports_rich_root()
    bytes_to_info = inventory.CHKInventory._bytes_to_utf8name_key
    file_id_revisions = {}
    pb = ui.ui_factory.nested_progress_bar()
    try:
        revision_keys = [(r,) for r in revision_ids]
        parent_keys = self._find_parent_keys_of_revisions(revision_keys)
        # TODO: instead of using _find_present_inventory_keys, change the
        #       code paths to allow missing inventories to be tolerated.
        #       However, we only want to tolerate missing parent
        #       inventories, not missing inventories for revision_ids
        present_parent_inv_keys = self._find_present_inventory_keys(
            parent_keys)
        present_parent_inv_ids = set(
            [k[-1] for k in present_parent_inv_keys])
        uninteresting_root_keys = set()
        interesting_root_keys = set()
        # Build this from revision_keys rather than iterating revision_ids
        # a second time: revision_ids may be an iterator that the list
        # comprehension above has already exhausted.
        inventories_to_read = set([k[-1] for k in revision_keys])
        inventories_to_read.update(present_parent_inv_ids)
        for inv in self.iter_inventories(inventories_to_read):
            entry_chk_root_key = inv.id_to_entry.key()
            # Roots of present parent inventories mark content that was
            # already there; everything else is a root to examine.
            if inv.revision_id in present_parent_inv_ids:
                uninteresting_root_keys.add(entry_chk_root_key)
            else:
                interesting_root_keys.add(entry_chk_root_key)

        chk_bytes = self.chk_bytes
        for record, items in chk_map.iter_interesting_nodes(chk_bytes,
                    interesting_root_keys, uninteresting_root_keys,
                    pb=pb):
            for _name, value_bytes in items:
                (name_utf8, file_id, revision_id) = bytes_to_info(
                    value_bytes)
                # Entries with an empty name are skipped when the
                # repository does not support rich roots.
                if not rich_root and name_utf8 == '':
                    continue
                file_id_revisions.setdefault(file_id, set()).add(
                    revision_id)
    finally:
        pb.finished()
    return file_id_revisions

879

880

def find_text_key_references(self):
    """Find the text key references within the repository.

    :return: A dictionary mapping text keys ((fileid, revision_id) tuples)
        to whether they were referred to by the inventory of the
        revision_id that they contain. The inventory texts from all present
        revision ids are assessed to generate this report.
    """
    # XXX: Slow version but correct: rewrite as a series of delta
    # examinations/direct tree traversal. Note that that will require care
    # as a common node is reachable both from the inventory that added it,
    # and others afterwards.
    #
    # The original also computed self.revisions.keys() here and never used
    # the result; that dead lookup has been dropped.
    result = {}
    rich_roots = self.supports_rich_root()
    pb = ui.ui_factory.nested_progress_bar()
    try:
        all_revs = self.all_revision_ids()
        total = len(all_revs)
        for pos, inv in enumerate(self.iter_inventories(all_revs)):
            pb.update("Finding text references", pos, total)
            for _, entry in inv.iter_entries():
                # Without rich roots the root entry is not reported.
                if not rich_roots and entry.file_id == inv.root_id:
                    continue
                key = (entry.file_id, entry.revision)
                # Record the key as seen; it only becomes True when the
                # inventory of its own revision refers to it.
                result.setdefault(key, False)
                if entry.revision == inv.revision_id:
                    result[key] = True
        return result
    finally:
        pb.finished()

911

912

def _reconcile_pack(self, collection, packs, extension, revs, pb):
    """Run a GCCHKReconcilePacker over the given packs.

    :param collection: Passed to the GCCHKReconcilePacker constructor.
    :param packs: Passed to the GCCHKReconcilePacker constructor.
    :param extension: Passed to the GCCHKReconcilePacker constructor.
    :param revs: Not used by this implementation.
    :param pb: Handed to the packer's pack() call.
    :return: The result of the packer's pack() call.
    """
    return GCCHKReconcilePacker(collection, packs, extension).pack(pb)

915

916

def _get_source(self, to_format):
    """Return a source for streaming from this repository.

    :param to_format: The format of the repository being streamed to.
    :return: A GroupCHKStreamSource when both formats share a serializer,
        otherwise whatever the parent class provides.
    """
    same_serializer = (self._format._serializer == to_format._serializer)
    if not same_serializer:
        return super(CHKInventoryRepository, self)._get_source(to_format)
    # The formats need to match exactly, because details such as the chk
    # page layout could differ otherwise.  Comparing serializers is
    # deliberately a little looser than an exact format match so that
    # CHK2 <-> 2a transfers will work.
    return GroupCHKStreamSource(self, to_format)

925

926

927

class GroupCHKStreamSource(KnitPackStreamSource):
    """Stream source for when source and target are both GroupCHK repos."""

    def __init__(self, from_repository, to_format):
        """Create a StreamSource streaming from from_repository."""
        super(GroupCHKStreamSource, self).__init__(from_repository, to_format)
        self._revision_keys = None
        self._text_keys = None
        # Filled in while the inventory stream is consumed, and reset to
        # None once the matching chk stream has been fully consumed.
        self._chk_id_roots = None
        self._chk_p_id_roots = None

    def _get_inventory_stream(self, inventory_keys, allow_absent=False):
        """Get a stream of inventory texts.

        Once the returned stream has been consumed, self._chk_id_roots and
        self._chk_p_id_roots hold the distinct root keys of the id_to_entry
        and parent_id_basename_to_file_id maps, in first-seen order.

        :param inventory_keys: Keys of the inventories to stream.
        :param allow_absent: If True, absent records are skipped silently;
            otherwise they raise errors.NoSuchRevision.
        :return: The tuple ('inventories', record generator).
        """
        self._chk_id_roots = []
        self._chk_p_id_roots = []

        def _filtered_inv_stream():
            # The sets only exist for fast duplicate detection; the lists
            # on self keep the order in which roots were first seen.
            seen_id_roots = set()
            seen_p_id_roots = set()
            inventories = self.from_repository.inventories
            records = inventories.get_record_stream(
                inventory_keys, 'unordered', True)
            for record in records:
                if record.storage_kind == 'absent':
                    if not allow_absent:
                        raise errors.NoSuchRevision(self, record.key)
                    continue
                fulltext = record.get_bytes_as('fulltext')
                chk_inv = inventory.CHKInventory.deserialise(
                    None, fulltext, record.key)
                id_root = chk_inv.id_to_entry.key()
                if id_root not in seen_id_roots:
                    self._chk_id_roots.append(id_root)
                    seen_id_roots.add(id_root)
                p_id_map = chk_inv.parent_id_basename_to_file_id
                if p_id_map is None:
                    raise AssertionError('Parent id -> file_id map not set')
                p_id_root = p_id_map.key()
                if p_id_root not in seen_p_id_roots:
                    seen_p_id_roots.add(p_id_root)
                    self._chk_p_id_roots.append(p_id_root)
                yield record
            # Every inventory record has been processed; the helper sets
            # are no longer needed.
            seen_id_roots.clear()
            seen_p_id_roots.clear()

        return ('inventories', _filtered_inv_stream())

    def _get_filtered_chk_streams(self, excluded_revision_keys):
        """Yield two ('chk_bytes', record generator) streams.

        The first covers the id_to_entry pages reachable from
        self._chk_id_roots and records a (file_id, revision_id) text key in
        self._text_keys for every item seen.  The second covers the
        parent_id_basename_to_file_id pages reachable from
        self._chk_p_id_roots.  Each generator resets its root list on self
        to None once it has been fully consumed.

        :param excluded_revision_keys: A set of revision keys whose
            inventories (when present) supply the uninteresting roots.
            NULL_REVISION is discarded from it in place.
        """
        self._text_keys = set()
        excluded_revision_keys.discard(_mod_revision.NULL_REVISION)
        uninteresting_root_keys = set()
        uninteresting_pid_root_keys = set()
        if excluded_revision_keys:
            # filter out any excluded revisions whose inventories are not
            # actually present
            # TODO: Update Repository.iter_inventories() to add
            #       ignore_missing=True
            from_repo = self.from_repository
            present_keys = from_repo._find_present_inventory_keys(
                excluded_revision_keys)
            present_ids = [k[-1] for k in present_keys]
            for inv in from_repo.iter_inventories(present_ids):
                uninteresting_root_keys.add(inv.id_to_entry.key())
                uninteresting_pid_root_keys.add(
                    inv.parent_id_basename_to_file_id.key())
        bytes_to_info = inventory.CHKInventory._bytes_to_utf8name_key
        chk_bytes = self.from_repository.chk_bytes

        def _filter_id_to_entry():
            nodes = chk_map.iter_interesting_nodes(
                chk_bytes, self._chk_id_roots, uninteresting_root_keys)
            for record, items in nodes:
                for _name, value in items:
                    # Note: we don't care about name_utf8, because we are
                    # always rich-root = True
                    _, file_id, revision_id = bytes_to_info(value)
                    self._text_keys.add((file_id, revision_id))
                if record is not None:
                    yield record
            # Consumed
            self._chk_id_roots = None

        def _get_parent_id_basename_to_file_id_pages():
            nodes = chk_map.iter_interesting_nodes(
                chk_bytes, self._chk_p_id_roots, uninteresting_pid_root_keys)
            for record, items in nodes:
                if record is not None:
                    yield record
            # Consumed
            self._chk_p_id_roots = None

        yield 'chk_bytes', _filter_id_to_entry()
        yield 'chk_bytes', _get_parent_id_basename_to_file_id_pages()

    def get_stream(self, search):
        """Yield the streams needed to transfer the revisions in search.

        Order: the revision text streams, the inventory stream, the two
        filtered chk streams, and finally the text stream.

        :param search: Object whose get_keys() gives the revision ids.
        """
        revision_ids = search.get_keys()
        for info in self._fetch_revision_texts(revision_ids):
            yield info
        self._revision_keys = [(rev_id,) for rev_id in revision_ids]
        yield self._get_inventory_stream(self._revision_keys)
        # TODO: The keys to exclude might be part of the search recipe
        # For now, exclude all parents that are at the edge of ancestry, for
        # which we have inventories
        edge_parent_keys = self.from_repository._find_parent_keys_of_revisions(
            self._revision_keys)
        for info in self._get_filtered_chk_streams(edge_parent_keys):
            yield info
        yield self._get_text_stream()

    def get_stream_for_missing_keys(self, missing_keys):
        """Yield streams that fill in inventories the target is missing.

        :param missing_keys: Keys whose first element must be
            'inventories'; the remainder is the inventory key.
        :raises AssertionError: if a key is not an inventory key, or if the
            chk root lists left by get_stream() are still non-empty.
        """
        # missing keys can only occur when we are byte copying and not
        # translating (because translation means we don't send
        # unreconstructable deltas ever).
        missing_inventory_keys = set()
        for key in missing_keys:
            prefix = key[0]
            if prefix != 'inventories':
                raise AssertionError('The only missing keys we should'
                    ' be filling in are inventory keys, not %s'
                    % (prefix,))
            missing_inventory_keys.add(key[1:])
        if self._chk_id_roots or self._chk_p_id_roots:
            raise AssertionError('Cannot call get_stream_for_missing_keys'
                ' untill all of get_stream() has been consumed.')
        # Yield the inventory stream, so we can find the chk stream
        # Some of the missing_keys will be missing because they are ghosts.
        # As such, we can ignore them. The Sink is required to verify there
        # are no unavailable texts when the ghost inventories are not filled
        # in.
        yield self._get_inventory_stream(missing_inventory_keys,
                                         allow_absent=True)
        # We use the empty set for excluded_revision_keys, to make it clear
        # that we want to transmit all referenced chk pages.
        for info in self._get_filtered_chk_streams(set()):
            yield info

1064

1065

1066

class RepositoryFormatCHK1(RepositoryFormatPack):
    """A hashed CHK+group compress pack repository."""

    repository_class = CHKInventoryRepository
    supports_external_lookups = True
    supports_chks = True
    # Original note: "For right now, setting this to True gives us
    # InterModel1And2 rather than InterDifferingSerializer".
    # NOTE(review): presumably this is about rich_root_data -- confirm.
    _commit_builder_class = PackRootCommitBuilder
    rich_root_data = True
    _serializer = chk_serializer.chk_serializer_255_bigpage
    _commit_inv_deltas = True

    # Index classes used by this format.
    index_builder_class = BTreeBuilder
    index_class = BTreeGraphIndex

    # A delta that references a text we have not seen yet cannot be
    # unpacked.  The two ways around that are working in fulltexts or
    # requiring topological sorting.  Fulltexts are more optimal for local
    # operations, because the source can be smart about extracting
    # multiple in-a-row (and sharing strings).  Topological is better for
    # remote, because we access less data.
    _fetch_order = 'unordered'
    # Essentially ignored by the groupcompress code.
    _fetch_uses_deltas = False
    fast_deltas = True
    pack_compresses = True

    def _get_matching_bzrdir(self):
        """Return the bzrdir format registered as 'development6-rich-root'."""
        return bzrdir.format_registry.make_bzrdir('development6-rich-root')

    def _ignore_setting_bzrdir(self, format):
        """Setter for _matchingbzrdir that discards the assigned value."""
        pass

    _matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

    def get_format_string(self):
        """See RepositoryFormat.get_format_string()."""
        return ('Bazaar development format - group compression and chk inventory'
                ' (needs bzr.dev from 1.14)\n')

    def get_format_description(self):
        """See RepositoryFormat.get_format_description()."""
        return ("Development repository format - rich roots, group compression"
                " and chk inventories")

1109

1110

1111

class RepositoryFormatCHK2(RepositoryFormatCHK1):
    """A CHK repository that uses the bencode revision serializer."""

    _serializer = chk_serializer.chk_bencode_serializer

    def _get_matching_bzrdir(self):
        """Return the bzrdir format registered as 'development7-rich-root'."""
        return bzrdir.format_registry.make_bzrdir('development7-rich-root')

    def _ignore_setting_bzrdir(self, format):
        """Setter for _matchingbzrdir that discards the assigned value."""
        pass

    # Declared again here so the property is bound to this class's getter.
    _matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

    def get_format_string(self):
        """See RepositoryFormat.get_format_string()."""
        return ('Bazaar development format - chk repository with bencode '
                'revision serialization (needs bzr.dev from 1.16)\n')

1128

1129

1130

class RepositoryFormat2a(RepositoryFormatCHK2):
    """A CHK repository that uses the bencode revision serializer.

    This is the same as RepositoryFormatCHK2 but with a public name.
    """

    _serializer = chk_serializer.chk_bencode_serializer

    def _get_matching_bzrdir(self):
        """Return the bzrdir format registered as '2a'."""
        return bzrdir.format_registry.make_bzrdir('2a')

    def _ignore_setting_bzrdir(self, format):
        """Setter for _matchingbzrdir that discards the assigned value."""
        pass

    # Declared again here so the property is bound to this class's getter.
    _matchingbzrdir = property(_get_matching_bzrdir, _ignore_setting_bzrdir)

    def get_format_string(self):
        """See RepositoryFormat.get_format_string()."""
        return 'Bazaar repository format 2a (needs bzr 1.16 or later)\n'

Older »