~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/repofmt/groupcompress_repo.py

Committer: Canonical.com Patch Queue Manager
Date: 2008-03-16 14:01:20 UTC
mfrom: (3280.2.5 integration)
Revision ID: pqm@pqm.ubuntu.com-20080316140120-i3yq8yr1l66m11h7

Start 1.4 development

files added:
bzrlib/help_topics/en/hooks.txt

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_http_implementations.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/xml6.py

tools/win32/survey.txt

files removed:
bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_chunks_to_lines_py.py

bzrlib/_chunks_to_lines_pyx.pyx

bzrlib/_groupcompress_py.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/btree_index.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/delta.h

bzrlib/diff-delta.c

bzrlib/fifo_cache.py

bzrlib/filters

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/groupcompress.py

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/eol.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/inventory_delta.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/plugins/netrc_credential_store

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/netrc_credential_store/tests

bzrlib/plugins/netrc_credential_store/tests/__init__.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/push.py

bzrlib/python-compat.h

bzrlib/readdir.h

bzrlib/rename_map.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_clean_tree.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_dump_btree.py

bzrlib/tests/blackbox/test_filesystem_cicp.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_create_clone.py

bzrlib/tests/branch_implementations/test_dotted_revno_to_revision_id.py

bzrlib/tests/branch_implementations/test_iter_merge_sorted_revisions.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_revision_id_to_dotted_revno.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/bzrdir_implementations/test_push.py

bzrlib/tests/fake_command.py

bzrlib/tests/file_utils.py

bzrlib/tests/ftp_server

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/https_server.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/per_interbranch

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interbranch/test_update_revisions.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_add_inventory_by_delta.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_refresh_data.py

bzrlib/tests/per_repository_chk

bzrlib/tests/per_repository_chk/__init__.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_chk/test_unsupported.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/ssl_certs

bzrlib/tests/ssl_certs/__init__.py

bzrlib/tests/ssl_certs/ca.crt

bzrlib/tests/ssl_certs/ca.key

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_eol_filters.py

bzrlib/tests/test_export.py

bzrlib/tests/test_fifo_cache.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patches_data/diff-7

bzrlib/tests/test_patches_data/mod-7

bzrlib/tests/test_patches_data/orig-7

bzrlib/tests/test_rename_map.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/tree_implementations/test_get_file_with_stat.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/tests/workingtree_implementations/test_content_filters.py

bzrlib/tests/workingtree_implementations/test_eol_conversion.py

bzrlib/tests/workingtree_implementations/test_views.py

bzrlib/transport/ftp

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/log.py

bzrlib/transport/nosmart.py

bzrlib/views.py

bzrlib/xml5.py

bzrlib/xml6.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_ssh_path_limiter

contrib/convert_to_1.9.py

doc/developers/btree_index_prefetch.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/cycle.txt

doc/developers/ec2.txt

doc/developers/groupcompress-design.txt

doc/developers/improved_chk_index.txt

doc/developers/integration.txt

doc/developers/lca_tree_merging.txt

doc/developers/overview.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/organizing_your_workspace.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/web_browsing.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

doc/news-template.txt

tools/check-newsbugs.py

tools/packaging

tools/packaging/build-packages.sh

tools/packaging/lp-upload-release

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/prepare_for_latex.py

tools/rst2pdf.py

tools/win32/build_release.py

tools/win32/run_script.py

files renamed:
bzrlib/tests/ftp_server/medusa_based.py => bzrlib/tests/ftp_server.py

bzrlib/tests/per_repository/ => bzrlib/tests/repository_implementations/

bzrlib/tests/test_revisionspec.py => bzrlib/tests/test_revisionnamespaces.py

bzrlib/transport/ftp/__init__.py => bzrlib/transport/ftp.py

bzrlib/xml8.py => bzrlib/xml5.py

doc/en/developer-guide/HACKING.txt => doc/developers/HACKING.txt

doc/en/user-guide/part2_intro.txt => doc/en/user-guide/best_practice_intro.txt

doc/en/user-guide/zen.txt => doc/en/user-guide/revnos.txt

files modified:
.bzrignore

Makefile

NEWS

bzr.ico

bzrlib/__init__.py

bzrlib/_dirstate_helpers_c.h

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_c.c

bzrlib/_patiencediff_py.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_dirstate.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test__generate_text_key_index.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_find_text_key_references.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_is_write_locked.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/bencode.py

bzrlib/util/configobj/configobj.py

bzrlib/util/simplemapi.py

bzrlib/util/tests/test_bencode.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml7.py

bzrlib/xml_serializer.py

contrib/bzr_access

contrib/newinventory.py

contrib/pwclient.full

doc/default.css

doc/developers/api-versioning.txt

doc/developers/authentication-ring.txt

doc/developers/container-format.txt

doc/developers/development-repo.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/inventory.txt

doc/developers/lca-merge.txt

doc/developers/merge-scaling.txt

doc/developers/network-protocol.txt

doc/developers/performance-contributing.txt

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/repository.txt

doc/developers/revision-properties.txt

doc/en/mini-tutorial/index.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_aliases.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/writing_a_plugin.txt

doc/index.txt

generate_docs.py

profile_imports.py

setup.py

tools/bzr_epydoc_uid.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/package_mf.py

tools/rst2html.py

tools/weavebench.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

Show diffs side-by-side

added added

removed removed

bzrlib/repofmt/groupcompress_repo.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Repository formats using CHK inventories and groupcompress compression."""

import time

from bzrlib import (

bzrdir,

chk_map,

chk_serializer,

debug,

errors,

index as _mod_index,

inventory,

knit,

osutils,

pack,

remote,

repository,

revision as _mod_revision,

trace,

ui,

)

from bzrlib.btree_index import (

BTreeGraphIndex,

BTreeBuilder,

)

from bzrlib.index import GraphIndex, GraphIndexBuilder

from bzrlib.groupcompress import (

_GCGraphIndex,

GroupCompressVersionedFiles,

)

from bzrlib.repofmt.pack_repo import (

Pack,

NewPack,

KnitPackRepository,

KnitPackStreamSource,

PackRootCommitBuilder,

RepositoryPackCollection,

RepositoryFormatPack,

ResumedPack,

Packer,

)

class GCPack(NewPack):
    """A NewPack whose constructor builds the indices used by GC packs.

    The constructor below replaces NewPack's rather than extending it: it
    calls Pack.__init__ directly and then performs the upload-stream and
    writer setup itself.
    """

    def __init__(self, pack_collection, upload_suffix='', file_mode=None):
        """Create a new, open pack that is being written to.

        :param pack_collection: A PackCollection into which this is being
            inserted.
        :param upload_suffix: An optional suffix to be given to any temporary
            files created during the pack creation. e.g '.autopack'
        :param file_mode: An optional file mode to create the new files with.
        """
        # replaced from NewPack to:
        # - change inventory reference list length to 1
        # - change texts reference lists to 1
        # TODO: patch this to be parameterised

        # The relative locations of the packs are constrained, but all are
        # passed in because the caller has them, so as to avoid object churn.
        index_builder_class = pack_collection._index_builder_class
        # from brisbane-core
        # Only build a chk index when the collection itself has one.
        if pack_collection.chk_index is not None:
            chk_index = index_builder_class(reference_lists=0)
        else:
            chk_index = None
        Pack.__init__(self,
            # Revisions: parents list, no text compression.
            index_builder_class(reference_lists=1),
            # Inventory: a single reference list (see the "replaced from
            # NewPack" note above; the old knit layout used two lists).
            index_builder_class(reference_lists=1),
            # Texts: per file graph, for all fileids - so one reference list
            # and two elements in the key tuple.
            index_builder_class(reference_lists=1, key_elements=2),
            # Signatures: Just blobs to store, no compression, no parents
            # listing.
            index_builder_class(reference_lists=0),
            # CHK based storage - just blobs, no compression or parents.
            chk_index=chk_index
            )
        self._pack_collection = pack_collection
        # When we make readonly indices, we need this.
        self.index_class = pack_collection._index_class
        # where should the new pack be opened
        self.upload_transport = pack_collection._upload_transport
        # where are indices written out to
        self.index_transport = pack_collection._index_transport
        # where is the pack renamed to when it is finished?
        self.pack_transport = pack_collection._pack_transport
        # What file mode to upload the pack and indices with.
        self._file_mode = file_mode
        # tracks the content written to the .pack file.
        self._hash = osutils.md5()
        # a four-tuple with the length in bytes of the indices, once the pack
        # is finalised. (rev, inv, text, sigs)
        # NOTE(review): a chk index may also be passed to Pack.__init__ above;
        # confirm whether this tuple gains a fifth entry in that case.
        self.index_sizes = None
        # How much data to cache when writing packs. Note that this is not
        # synchronised with reads, because it's not in the transport layer, so
        # is not safe unless the client knows it won't be reading from the pack
        # under creation.
        self._cache_limit = 0
        # the temporary pack file name.
        self.random_name = osutils.rand_chars(20) + upload_suffix
        # when was this pack started ?
        self.start_time = time.time()
        # open an output stream for the data added to the pack.
        self.write_stream = self.upload_transport.open_write_stream(
            self.random_name, mode=self._file_mode)
        if 'pack' in debug.debug_flags:
            trace.mutter('%s: create_pack: pack stream open: %s%s t+%6.3fs',
                time.ctime(), self.upload_transport.base, self.random_name,
                time.time() - self.start_time)
        # A list of byte sequences to be written to the new pack, and the
        # aggregate size of them.  Stored as a list rather than separate
        # variables so that the _write_data closure below can update them.
        self._buffer = [[], 0]
        # create a callable for adding data
        #
        # robertc says- this is a closure rather than a method on the object
        # so that the variables are locals, and faster than accessing object
        # members.
        # The default arguments are bound once, here, to the buffer list, the
        # stream's write method and the hash's update method.
        def _write_data(bytes, flush=False, _buffer=self._buffer,
            _write=self.write_stream.write, _update=self._hash.update):
            _buffer[0].append(bytes)
            _buffer[1] += len(bytes)
            # buffer cap
            # self._cache_limit is looked up on every call, so changing it
            # after construction affects subsequent writes.
            if _buffer[1] > self._cache_limit or flush:
                bytes = ''.join(_buffer[0])
                _write(bytes)
                _update(bytes)
                # Reset in place so self._buffer and the bound default keep
                # referring to the same list object.
                _buffer[:] = [[], 0]
        # expose this on self, for the occasion when clients want to add data.
        self._write_data = _write_data
        # a pack writer object to serialise pack records.
        self._writer = pack.ContainerWriter(self._write_data)
        self._writer.begin()
        # what state is the pack in? (open, finished, aborted)
        self._state = 'open'

    def _check_references(self):
        """Make sure our external references are present.

        Packs are allowed to have deltas whose base is not in the pack, but it
        must be present somewhere in this collection.  It is not allowed to
        have deltas based on a fallback repository.
        (See <https://bugs.launchpad.net/bzr/+bug/288751>)

        This implementation performs no checks and returns None.
        """
        # Groupcompress packs don't have any external references, arguably CHK
        # pages have external references, but we cannot 'cheaply' determine
        # them without actually walking all of the chk pages.

171

172

173

class ResumedGCPack(ResumedPack):
    """ResumedPack variant for groupcompress packs.

    Both reference hooks are overridden so that no external compression
    parents are ever reported or checked.
    """

    def _check_references(self):
        """Check external compression parents; a no-op for GC packs."""
        # Deliberately empty: GCPack._check_references documents the reason.

    def _get_external_refs(self, index):
        """Return the external references of ``index`` (always empty)."""
        # A GC repository never has compression parents that live outside
        # the pack file holding the child, so there is nothing to collect.
        return set()

183

184

185

class GCCHKPacker(Packer):
    """This class understands what it takes to collect a GCCHK repo.

    Content is copied from the source packs into a single new pack in the
    order: revisions, inventories, chk pages, texts, signatures.
    """

    def __init__(self, pack_collection, packs, suffix, revision_ids=None,
                 reload_func=None):
        """Set up the packer.

        :param pack_collection: The collection being packed; it must have a
            chk index.
        :param packs: The packs to combine.
        :param suffix: Suffix handed through to the base Packer.
        :param revision_ids: Optional revision ids, handed to the base Packer.
        :param reload_func: Optional callable handed to the base Packer.
        :raises AssertionError: if pack_collection.chk_index is None.
        """
        super(GCCHKPacker, self).__init__(pack_collection, packs, suffix,
                                          revision_ids=revision_ids,
                                          reload_func=reload_func)
        self._pack_collection = pack_collection
        # ATM, We only support this for GCCHK repositories
        if pack_collection.chk_index is None:
            raise AssertionError('pack_collection.chk_index should not be None')
        # Subclasses set this to True to have _get_chk_streams parse leaf
        # nodes and record the (file_id, revision_id) pairs they reference.
        self._gather_text_refs = False
        # Root keys found while streaming inventories; filled in by
        # _get_filtered_inv_stream and consumed by _get_chk_streams.
        self._chk_id_roots = []
        self._chk_p_id_roots = []
        self._text_refs = None
        # set by .pack() if self.revision_ids is not None
        self.revision_keys = None

    def _get_progress_stream(self, source_vf, keys, message, pb):
        """Return a record stream for keys that reports progress to pb.

        :param source_vf: VersionedFiles to read from.
        :param keys: Keys to request (len() is taken for the progress total).
        :param message: Progress message passed to pb.update.
        :param pb: Progress bar, or None to skip progress reporting.
        """
        def pb_stream():
            substream = source_vf.get_record_stream(keys, 'groupcompress', True)
            for idx, record in enumerate(substream):
                if pb is not None:
                    pb.update(message, idx + 1, len(keys))
                yield record
        return pb_stream()

    def _get_filtered_inv_stream(self, source_vf, keys, message, pb=None):
        """Filter the texts of inventories, to find the chk pages.

        Each inventory record is deserialised as it streams past so that the
        root keys of its id_to_entry and parent_id_basename_to_file_id maps
        can be appended (first occurrence only, in stream order) to
        self._chk_id_roots and self._chk_p_id_roots.

        :param message: Accepted so the signature matches
            _get_progress_stream; progress is reported as 'inv'.
        :raises AssertionError: (while iterating) if an inventory has no
            parent_id_basename_to_file_id map.
        """
        total_keys = len(keys)
        def _filtered_inv_stream():
            # Sets give O(1) duplicate detection; the lists on self keep the
            # first-seen ordering.
            id_roots_set = set()
            p_id_roots_set = set()
            stream = source_vf.get_record_stream(keys, 'groupcompress', True)
            for idx, record in enumerate(stream):
                bytes = record.get_bytes_as('fulltext')
                chk_inv = inventory.CHKInventory.deserialise(None, bytes,
                                                             record.key)
                if pb is not None:
                    pb.update('inv', idx, total_keys)
                key = chk_inv.id_to_entry.key()
                if key not in id_roots_set:
                    self._chk_id_roots.append(key)
                    id_roots_set.add(key)
                p_id_map = chk_inv.parent_id_basename_to_file_id
                if p_id_map is None:
                    raise AssertionError('Parent id -> file_id map not set')
                key = p_id_map.key()
                if key not in p_id_roots_set:
                    p_id_roots_set.add(key)
                    self._chk_p_id_roots.append(key)
                yield record
            # We have finished processing all of the inventory records, we
            # don't need these sets anymore
            id_roots_set.clear()
            p_id_roots_set.clear()
        return _filtered_inv_stream()

    def _get_chk_streams(self, source_vf, keys, pb=None):
        """Yield record streams covering the chk pages in keys.

        Each yielded stream must be fully consumed before the next one is
        requested: the keys for the following stream are collected while the
        current one is being iterated.

        Note that self._chk_id_roots and self._chk_p_id_roots are deleted
        once they have been used.
        """
        # We want to stream the keys from 'id_roots', and things they
        # reference, and then stream things from p_id_roots and things they
        # reference, and then any remaining keys that we didn't get to.

        # We also group referenced texts together, so if one root references a
        # text with prefix 'a', and another root references a node with prefix
        # 'a', we want to yield those nodes before we yield the nodes for 'b'
        # This keeps 'similar' nodes together.

        # Note: We probably actually want multiple streams here, to help the
        #       client understand that the different levels won't compress well
        #       against each other.
        #       Test the difference between using one Group per level, and
        #       using 1 Group per prefix. (so '' (root) would get a group, then
        #       all the references to search-key 'a' would get a group, etc.)
        total_keys = len(keys)
        remaining_keys = set(keys)
        # A one-element list so the nested generators can update the count.
        counter = [0]
        if self._gather_text_refs:
            bytes_to_info = inventory.CHKInventory._bytes_to_utf8name_key
            self._text_refs = set()
        def _get_referenced_stream(root_keys, parse_leaf_nodes=False):
            cur_keys = root_keys
            while cur_keys:
                keys_by_search_prefix = {}
                remaining_keys.difference_update(cur_keys)
                next_keys = set()
                def handle_internal_node(node):
                    for prefix, value in node._items.iteritems():
                        # We don't want to request the same key twice, and we
                        # want to order it by the first time it is seen.
                        # Even further, we don't want to request a key which is
                        # not in this group of pack files (it should be in the
                        # repo, but it doesn't have to be in the group being
                        # packed.)
                        # TODO: consider how to treat externally referenced chk
                        #       pages as 'external_references' so that we
                        #       always fill them in for stacked branches
                        if value not in next_keys and value in remaining_keys:
                            keys_by_search_prefix.setdefault(prefix,
                                []).append(value)
                            next_keys.add(value)
                def handle_leaf_node(node):
                    # Store is None, because we know we have a LeafNode, and we
                    # just want its entries
                    for file_id, bytes in node.iteritems(None):
                        name_utf8, file_id, revision_id = bytes_to_info(bytes)
                        self._text_refs.add((file_id, revision_id))
                def next_stream():
                    stream = source_vf.get_record_stream(cur_keys,
                                                         'as-requested', True)
                    for record in stream:
                        bytes = record.get_bytes_as('fulltext')
                        # We don't care about search_key_func for this code,
                        # because we only care about external references.
                        node = chk_map._deserialise(bytes, record.key,
                                                    search_key_func=None)
                        if isinstance(node, chk_map.InternalNode):
                            handle_internal_node(node)
                        elif parse_leaf_nodes:
                            handle_leaf_node(node)
                        counter[0] += 1
                        if pb is not None:
                            pb.update('chk node', counter[0], total_keys)
                        yield record
                yield next_stream()
                # Double check that we won't be emitting any keys twice
                # If we get rid of the pre-calculation of all keys, we could
                # turn this around and do
                # next_keys.difference_update(seen_keys)
                # However, we also may have references to chk pages in another
                # pack file during autopack. We filter earlier, so we should no
                # longer need to do this
                # next_keys = next_keys.intersection(remaining_keys)
                cur_keys = []
                for prefix in sorted(keys_by_search_prefix):
                    cur_keys.extend(keys_by_search_prefix.pop(prefix))
        for stream in _get_referenced_stream(self._chk_id_roots,
                                             self._gather_text_refs):
            yield stream
        del self._chk_id_roots
        # while it isn't really possible for chk_id_roots to not be in the
        # local group of packs, it is possible that the tree shape has not
        # changed recently, so we need to filter _chk_p_id_roots by the
        # available keys
        chk_p_id_roots = [key for key in self._chk_p_id_roots
                          if key in remaining_keys]
        del self._chk_p_id_roots
        for stream in _get_referenced_stream(chk_p_id_roots, False):
            yield stream
        if remaining_keys:
            trace.mutter('There were %d keys in the chk index, %d of which'
                         ' were not referenced', total_keys,
                         len(remaining_keys))
            # Unreferenced pages are only carried over when no explicit
            # revision_ids were requested.
            if self.revision_ids is None:
                stream = source_vf.get_record_stream(remaining_keys,
                                                     'unordered', True)
                yield stream

    def _build_vf(self, index_name, parents, delta, for_write=False):
        """Build a VersionedFiles instance on top of this group of packs.

        :param index_name: Index name without the '_index' suffix, e.g.
            'revision'.
        :param parents: Passed to _GCGraphIndex as ``parents``.
        :param delta: Passed to GroupCompressVersionedFiles as ``delta``.
        :param for_write: If True build on self.new_pack (writable),
            otherwise on a combined index over self.packs (read only).
        :raises AssertionError: if for_write is True and no new pack is set.
        """
        index_name = index_name + '_index'
        index_to_pack = {}
        access = knit._DirectPackAccess(index_to_pack)
        if for_write:
            # Use new_pack
            if self.new_pack is None:
                raise AssertionError('No new pack has been set')
            index = getattr(self.new_pack, index_name)
            index_to_pack[index] = self.new_pack.access_tuple()
            index.set_optimize(for_size=True)
            access.set_writer(self.new_pack._writer, index,
                              self.new_pack.access_tuple())
            add_callback = index.add_nodes
        else:
            indices = []
            for pack in self.packs:
                sub_index = getattr(pack, index_name)
                index_to_pack[sub_index] = pack.access_tuple()
                indices.append(sub_index)
            index = _mod_index.CombinedGraphIndex(indices)
            add_callback = None
        vf = GroupCompressVersionedFiles(
            _GCGraphIndex(index,
                          add_callback=add_callback,
                          parents=parents,
                          is_locked=self._pack_collection.repo.is_locked),
            access=access,
            delta=delta)
        return vf

    def _build_vfs(self, index_name, parents, delta):
        """Build the source and target VersionedFiles.

        :return: (source_vf, target_vf) - the read-only view over self.packs
            and the writable view over self.new_pack.
        """
        source_vf = self._build_vf(index_name, parents,
                                   delta, for_write=False)
        target_vf = self._build_vf(index_name, parents,
                                   delta, for_write=True)
        return source_vf, target_vf

    def _copy_stream(self, source_vf, target_vf, keys, message, vf_to_stream,
                     pb_offset):
        """Copy keys from source_vf into target_vf.

        :param message: Noun used in the trace and progress messages.
        :param vf_to_stream: Callable taking (source_vf, keys, message, pb)
            and returning the record stream to insert.
        :param pb_offset: Position reported to self.pb for this phase.
        """
        trace.mutter('repacking %d %s', len(keys), message)
        self.pb.update('repacking %s' % (message,), pb_offset)
        child_pb = ui.ui_factory.nested_progress_bar()
        try:
            stream = vf_to_stream(source_vf, keys, message, child_pb)
            # _insert_record_stream is iterated purely to drive the
            # insertion; the yielded values are not needed.
            for _ in target_vf._insert_record_stream(stream,
                                                     random_id=True,
                                                     reuse_blocks=False):
                pass
        finally:
            child_pb.finished()

    def _copy_revision_texts(self):
        """Copy revisions, defaulting revision_keys to every source key."""
        source_vf, target_vf = self._build_vfs('revision', True, False)
        if not self.revision_keys:
            # We are doing a full fetch, aka 'pack'
            self.revision_keys = source_vf.keys()
        self._copy_stream(source_vf, target_vf, self.revision_keys,
                          'revisions', self._get_progress_stream, 1)

    def _copy_inventory_texts(self):
        """Copy inventories, collecting chk root keys as a side effect."""
        source_vf, target_vf = self._build_vfs('inventory', True, True)
        self._copy_stream(source_vf, target_vf, self.revision_keys,
                          'inventories', self._get_filtered_inv_stream, 2)

    def _copy_chk_texts(self):
        """Copy the chk pages, stream by stream, into the new pack."""
        source_vf, target_vf = self._build_vfs('chk', False, False)
        # TODO: This is technically spurious... if it is a performance issue,
        #       remove it
        total_keys = source_vf.keys()
        trace.mutter('repacking chk: %d id_to_entry roots,'
                     ' %d p_id_map roots, %d total keys',
                     len(self._chk_id_roots), len(self._chk_p_id_roots),
                     len(total_keys))
        self.pb.update('repacking chk', 3)
        child_pb = ui.ui_factory.nested_progress_bar()
        try:
            for stream in self._get_chk_streams(source_vf, total_keys,
                                                pb=child_pb):
                for _ in target_vf._insert_record_stream(stream,
                                                         random_id=True,
                                                         reuse_blocks=False):
                    pass
        finally:
            child_pb.finished()

    def _copy_text_texts(self):
        """Copy every text key present in the source packs."""
        source_vf, target_vf = self._build_vfs('text', True, True)
        # XXX: We don't walk the chk map to determine referenced (file_id,
        #      revision_id) keys.  We don't do it yet because you really need
        #      to filter out the ones that are present in the parents of the
        #      rev just before the ones you are copying, otherwise the filter
        #      is grabbing too many keys...
        text_keys = source_vf.keys()
        self._copy_stream(source_vf, target_vf, text_keys,
                          'text', self._get_progress_stream, 4)

    def _copy_signature_texts(self):
        """Copy every signature present in the source packs."""
        source_vf, target_vf = self._build_vfs('signature', False, False)
        signature_keys = source_vf.keys()
        # NOTE(review): this method used to call
        # signature_keys.intersection(self.revision_keys) and throw the
        # result away, so no filtering ever took place.  The dead statement
        # has been dropped and the copy-everything behaviour kept.  Before
        # enabling a real filter, confirm it cannot discard signatures whose
        # revision is stored in a pack outside the group being combined.
        self._copy_stream(source_vf, target_vf, signature_keys,
                          'signatures', self._get_progress_stream, 5)

    def _create_pack_from_packs(self):
        """Write the new pack from self.packs.

        :return: The finished new pack, or None if self._use_pack rejected
            it (in which case the new pack is aborted).
        """
        self.pb.update('repacking', 0, 7)
        self.new_pack = self.open_pack()
        # Is this necessary for GC ?
        self.new_pack.set_write_cache_size(1024*1024)
        # Inventories must be copied before chk pages: copying inventories
        # is what populates the chk root key lists.
        self._copy_revision_texts()
        self._copy_inventory_texts()
        self._copy_chk_texts()
        self._copy_text_texts()
        self._copy_signature_texts()
        self.new_pack._check_references()
        if not self._use_pack(self.new_pack):
            self.new_pack.abort()
            return None
        self.pb.update('finishing repack', 6, 7)
        self.new_pack.finish()
        self._pack_collection.allocate(self.new_pack)
        return self.new_pack

469

470

471

class GCCHKReconcilePacker(GCCHKPacker):
    """Packer that rebuilds text parent pointers while it copies.

    ``bzr reconcile`` uses this packer so that the parents recorded for
    texts are regenerated rather than copied verbatim.
    """

    def __init__(self, *args, **kwargs):
        """Accept the same arguments as GCCHKPacker."""
        super(GCCHKReconcilePacker, self).__init__(*args, **kwargs)
        # Flipped to True as soon as anything differs from the source.
        self._data_changed = False
        # Ask the chk copy phase to record referenced text keys.
        self._gather_text_refs = True

    def _copy_inventory_texts(self):
        """Copy inventories and note whether the key sets disagree."""
        inv_source, inv_target = self._build_vfs('inventory', True, True)
        self._copy_stream(inv_source, inv_target, self.revision_keys,
                          'inventories', self._get_filtered_inv_stream, 2)
        if inv_source.keys() != self.revision_keys:
            self._data_changed = True

    def _copy_text_texts(self):
        """Work out the parents each text should have, then copy the texts.

        Every key in self._text_refs is streamed to the target; records
        whose recorded parents differ from the computed ones have their
        parents replaced on the way through.
        """
        source_vf, target_vf = self._build_vfs('text', True, True)
        trace.mutter('repacking %d texts', len(self._text_refs))
        self.pb.update("repacking texts", 4)
        # Phase 1: compute the parents every text key ought to have.
        repo = self._pack_collection.repo
        # Read the revisions back from the pack we have just written.
        written_revisions = self._build_vf('revision', True, False,
                                           for_write=True)
        revision_graph = written_revisions.get_parent_map(
            written_revisions.keys())
        # Reduce 1-tuple keys to bare revision ids.
        ancestors = {}
        for rev_key, parent_keys in revision_graph.iteritems():
            ancestors[rev_key[0]] = tuple([p[0] for p in parent_keys])
        del revision_graph
        # TODO: _generate_text_key_index should be much cheaper to generate from
        #       a chk repository, rather than the current implementation
        expected_parents = repo._generate_text_key_index(None, ancestors)
        recorded_parents = source_vf.get_parent_map(self._text_refs)
        # Phase 2: sort keys into unchanged / re-parented / unexpected.
        unchanged_keys = []
        reparented = {}
        unexpected_keys = []
        null_only = (_mod_revision.NULL_REVISION,)
        for text_key in self._text_refs:
            try:
                wanted = tuple(expected_parents[text_key])
            except KeyError:
                # Not in the computed index at all.
                unexpected_keys.append(text_key)
                self._data_changed = True
                continue
            if wanted == null_only:
                wanted = ()
            if wanted == recorded_parents[text_key]:
                unchanged_keys.append(text_key)
                continue
            # Only the parent graph needs changing; the text itself can be
            # copied as is because compression parents are not punned with
            # the parents list.
            self._data_changed = True
            reparented[text_key] = wanted
        # Release the large intermediate maps before the bulk copy.
        del expected_parents
        del recorded_parents
        # Phase 3: stream everything across, patching parents where needed.
        def _stream_with_fixed_parents():
            records = source_vf.get_record_stream(self._text_refs,
                                                  'groupcompress', False)
            for record in records:
                replacement = reparented.get(record.key)
                if replacement is not None:
                    record.parents = replacement
                yield record
        target_vf.insert_record_stream(_stream_with_fixed_parents())

    def _use_pack(self, new_pack):
        """Keep the new pack only if reconcile actually changed content."""
        inserted = new_pack.data_inserted()
        if not inserted:
            return inserted
        return self._data_changed

554

555

556

class GCRepositoryPackCollection(RepositoryPackCollection):
    """Pack collection that creates GC packs and repacks with GCCHKPacker."""

    pack_factory = GCPack
    resumed_pack_factory = ResumedGCPack

    def _already_packed(self):
        """Report whether the collection is already packed (never, for now)."""
        # GC repositories are always repacked at the moment.
        return False

    def _execute_pack_operations(self, pack_operations,
                                 _packer_class=GCCHKPacker,
                                 reload_func=None):
        """Run each pack operation, then retire the packs that were combined.

        :param pack_operations: A list of [revision_count, packs_to_combine].
            It is iterated twice.
        :param _packer_class: Accepted for signature compatibility only; a
            GCCHKPacker is always used, whatever is passed here.
        :param reload_func: Handed to the packer.
        :return: None.
        """
        # XXX: This duplicates RepositoryPackCollection's implementation
        # purely so that the packer class can be forced to GCCHKPacker.
        for _count, to_combine in pack_operations:
            # The setup logic may hand us operations with nothing to do.
            if len(to_combine) == 0:
                continue
            packer = GCCHKPacker(self, to_combine, '.autopack',
                                 reload_func=reload_func)
            try:
                packer.pack()
            except errors.RetryWithNewPacks:
                # The exception is about to leave this frame, and the packer
                # never registers its new_pack with this collection, so this
                # is the only place the half-written pack can be aborted.
                if packer.new_pack is not None:
                    packer.new_pack.abort()
                raise
            for old_pack in to_combine:
                self._remove_pack_from_memory(old_pack)
        # Publish the new packs and stop advertising the old ones.
        self._save_pack_names(clear_obsolete_packs=True)
        # Nothing references the old packs any more; move them aside.
        for _count, to_combine in pack_operations:
            self._obsolete_packs(to_combine)

601

602

603

class CHKInventoryRepository(KnitPackRepository):

604

"""subclass of KnitPackRepository that uses CHK based inventories."""

605

606

def __init__(self, _format, a_bzrdir, control_files, _commit_builder_class,
             _serializer):
    """Initialise as a KnitPackRepository, then swap in GC components.

    The base constructor runs first; afterwards the pack collection and
    all of the versioned-file stores are replaced with groupcompress
    equivalents.
    """
    KnitPackRepository.__init__(self, _format, a_bzrdir, control_files,
                                _commit_builder_class, _serializer)
    # Everything below overrides what the base constructor set up.
    index_transport = self._transport.clone('indices')
    upload_transport = self._transport.clone('upload')
    packs_transport = self._transport.clone('packs')
    self._pack_collection = GCRepositoryPackCollection(
        self, self._transport, index_transport,
        upload_transport, packs_transport,
        _format.index_builder_class, _format.index_class,
        use_chk_index=self._format.supports_chks)
    collection = self._pack_collection

    inv_index = collection.inventory_index
    self.inventories = GroupCompressVersionedFiles(
        _GCGraphIndex(inv_index.combined_index,
                      add_callback=inv_index.add_callback,
                      parents=True, is_locked=self.is_locked),
        access=inv_index.data_access)

    rev_index = collection.revision_index
    self.revisions = GroupCompressVersionedFiles(
        _GCGraphIndex(rev_index.combined_index,
                      add_callback=rev_index.add_callback,
                      parents=True, is_locked=self.is_locked,
                      track_external_parent_refs=True),
        access=rev_index.data_access,
        delta=False)

    sig_index = collection.signature_index
    self.signatures = GroupCompressVersionedFiles(
        _GCGraphIndex(sig_index.combined_index,
                      add_callback=sig_index.add_callback,
                      parents=False, is_locked=self.is_locked),
        access=sig_index.data_access,
        delta=False)

    text_index = collection.text_index
    self.texts = GroupCompressVersionedFiles(
        _GCGraphIndex(text_index.combined_index,
                      add_callback=text_index.add_callback,
                      parents=True, is_locked=self.is_locked),
        access=text_index.data_access)

    # CHK pages carry no ancestry of their own, hence parents=False.
    chk_index = collection.chk_index
    self.chk_bytes = GroupCompressVersionedFiles(
        _GCGraphIndex(chk_index.combined_index,
                      add_callback=chk_index.add_callback,
                      parents=False, is_locked=self.is_locked),
        access=chk_index.data_access)

    # Counts logical write locks on the repository object, as distinct
    # from the physical lock that is only held while the pack-names list
    # is being changed.  An alternative would be a decorator around the
    # control files object presenting logical locks as physical ones -
    # consider that design if this gets ugly.  RBC 20071011
    self._write_lock_count = 0
    self._transaction = None
    # Flags consulted by tests.
    self._reconcile_does_inventory_gc = True
    self._reconcile_fixes_text_parents = True
    self._reconcile_backsup_inventory = False

661

662

def _add_inventory_checked(self, revision_id, inv, parents):
    """Store inv, whose inputs have already been checked, as a CHK inventory.

    Subclasses may override this hook to store inventories differently.

    :seealso: add_inventory, for the contract.
    :return: Whatever self._inventory_add_lines returns.
    """
    fmt_serializer = self._format._serializer
    # Convert to the CHK form, writing its pages into self.chk_bytes.
    chk_inv = inventory.CHKInventory.from_inventory(
        self.chk_bytes, inv,
        maximum_size=fmt_serializer.maximum_size,
        search_key_name=fmt_serializer.search_key_name)
    return self._inventory_add_lines(revision_id, parents,
                                     chk_inv.to_lines(),
                                     check_content=False)

677

678

def add_inventory_by_delta(self, basis_revision_id, delta, new_revision_id,
                           parents, basis_inv=None, propagate_caches=False):
    """Add a new inventory described as a delta against a basis revision.

    :param basis_revision_id: The revision whose inventory the delta was
        computed against.
    :param delta: The inventory delta (see Inventory.apply_delta for
        details).
    :param new_revision_id: The revision id the new inventory belongs to.
    :param parents: Revision ids of the parents that new_revision_id is
        known to have and which are already in the repository.  Needed by
        repositories that use the inventory graph for revision graph
        access, and by those that pun ancestry with delta compression.
    :param basis_inv: The basis inventory when the caller already has it,
        otherwise None.
    :param propagate_caches: If True, caches of the basis inventory are
        copied to and updated for the result where possible.

    :returns: (validator, new_inv)
        The validator (a sha1 digest, though what is sha'd is repository
        format specific) of the serialized inventory, and the resulting
        inventory.
    :raises AssertionError: if the repository is not in a write group
        (not checked when the basis is the null revision, which is
        delegated to KnitPackRepository).
    """
    if basis_revision_id == _mod_revision.NULL_REVISION:
        # No basis to apply the delta to: let the base class handle it.
        return KnitPackRepository.add_inventory_by_delta(
            self, basis_revision_id, delta, new_revision_id, parents)
    if not self.is_in_write_group():
        raise AssertionError("%r not in write group" % (self,))
    _mod_revision.check_not_reserved_id(new_revision_id)
    tree = self.revision_tree(basis_revision_id)
    tree.lock_read()
    try:
        if basis_inv is None:
            basis_inv = tree.inventory
        new_inv = basis_inv.create_by_apply_delta(
            delta, new_revision_id, propagate_caches=propagate_caches)
        serialised = new_inv.to_lines()
        validator = self._inventory_add_lines(
            new_revision_id, parents, serialised, check_content=False)
        return validator, new_inv
    finally:
        tree.unlock()

721

722

def _iter_inventories(self, revision_ids):
    """Yield a CHKInventory for each revision id, in the order requested.

    All inventory texts are read before the first inventory is yielded.

    :raises errors.NoSuchRevision: if any requested inventory is absent.
    """
    wanted = [(rev_id,) for rev_id in revision_ids]
    fulltexts = {}
    for rec in self.inventories.get_record_stream(wanted, 'unordered', True):
        if rec.storage_kind == 'absent':
            raise errors.NoSuchRevision(self, rec.key)
        fulltexts[rec.key] = rec.get_bytes_as('fulltext')
    # The stream was unordered; walk the request list to restore order.
    for inv_key in wanted:
        yield inventory.CHKInventory.deserialise(
            self.chk_bytes, fulltexts[inv_key], inv_key)

734

735

def _iter_inventory_xmls(self, revision_ids):
    """Unsupported here: always raises NotImplementedError."""
    # There is no native 'xml' inventory in this format, so the method is
    # meaningless; raising catches callers that use it directly.
    raise NotImplementedError(self._iter_inventory_xmls)

739

740

def _find_present_inventory_ids(self, revision_ids):
    """Return the set of revision ids whose inventory key has a parent-map entry.

    Only keys returned by self.inventories.get_parent_map are included.
    """
    inv_keys = [(rev_id,) for rev_id in revision_ids]
    found = self.inventories.get_parent_map(inv_keys)
    # The revision id is the last element of each key tuple.
    return set(inv_key[-1] for inv_key in found)

745

746

def fileids_altered_by_revision_ids(self, revision_ids, _inv_weave=None):
    """Find the file ids and versions affected by revisions.

    :param revision_ids: an iterable containing revision ids.  It is
        iterated more than once.
    :param _inv_weave: Not used by this implementation.
    :return: a dictionary mapping altered file-ids to a set of
        revision_ids. Each altered file-id has the exact revision_ids that
        altered it listed explicitly.
    """
    include_root = self.supports_rich_root()
    decode_entry = inventory.CHKInventory._bytes_to_utf8name_key
    altered = {}
    pb = ui.ui_factory.nested_progress_bar()
    try:
        parent_ids = self._find_parent_ids_of_revisions(revision_ids)
        parent_invs_present = self._find_present_inventory_ids(parent_ids)
        # Root keys of parent inventories are "uninteresting": anything
        # reachable from them was not introduced by revision_ids.
        old_roots = set()
        new_roots = set()
        to_read = set(parent_invs_present)
        to_read.update(revision_ids)
        for inv in self.iter_inventories(to_read):
            root_key = inv.id_to_entry.key()
            if inv.revision_id in parent_invs_present:
                old_roots.add(root_key)
            else:
                new_roots.add(root_key)

        interesting = chk_map.iter_interesting_nodes(
            self.chk_bytes, new_roots, old_roots, pb=pb)
        for _record, items in interesting:
            for _name, entry_bytes in items:
                name_utf8, file_id, revision_id = decode_entry(entry_bytes)
                # Without rich roots the entry with an empty name is skipped.
                if name_utf8 == '' and not include_root:
                    continue
                altered.setdefault(file_id, set()).add(revision_id)
    finally:
        pb.finished()
    return altered

789

790

def find_text_key_references(self):
    """Find the text key references within the repository.

    Every inventory named by self.all_revision_ids() is read and each of
    its entries is examined; progress is reported on a nested progress
    bar which is always finished before returning.

    :return: A dictionary mapping text keys ((fileid, revision_id) tuples)
        to whether they were referred to by the inventory of the
        revision_id that they contain. The inventory texts from all present
        revision ids are assessed to generate this report.
    """
    # XXX: Slow version but correct: rewrite as a series of delta
    # examinations/direct tree traversal. Note that that will require care
    # as a common node is reachable both from the inventory that added it,
    # and others afterwards.
    result = {}
    rich_roots = self.supports_rich_root()
    pb = ui.ui_factory.nested_progress_bar()
    try:
        all_revs = self.all_revision_ids()
        total = len(all_revs)
        for pos, inv in enumerate(self.iter_inventories(all_revs)):
            pb.update("Finding text references", pos, total)
            for _, entry in inv.iter_entries():
                # Without rich roots the root entry is not reported.
                if not rich_roots and entry.file_id == inv.root_id:
                    continue
                key = (entry.file_id, entry.revision)
                if entry.revision == inv.revision_id:
                    # Referenced by the inventory of its own revision.
                    result[key] = True
                else:
                    # Only record False if the key is new: a True stored
                    # by another inventory must not be overwritten.
                    result.setdefault(key, False)
        return result
    finally:
        pb.finished()

821

822

def _reconcile_pack(self, collection, packs, extension, revs, pb):
    """Run a GCCHKReconcilePacker and return the result of its pack().

    :param collection: forwarded to the GCCHKReconcilePacker constructor.
    :param packs: forwarded to the GCCHKReconcilePacker constructor.
    :param extension: forwarded to the GCCHKReconcilePacker constructor.
    :param revs: not used by this implementation.
    :param pb: passed to the packer's pack() call.
    """
    return GCCHKReconcilePacker(collection, packs, extension).pack(pb)

825

826

def _get_source(self, to_format):
    """Return a source for streaming from this repository.

    A GroupCHKStreamSource is returned only when the target format is of
    exactly the same class as this repository's format; any other target
    is delegated to the parent class implementation.
    """
    target = to_format
    if isinstance(target, remote.RemoteRepositoryFormat):
        # Attributes cannot be checked on the remote format directly with
        # the current code, so resolve it to the real format first.
        target._ensure_real()
        target = target._custom_format
    if target.__class__ is not self._format.__class__:
        return super(CHKInventoryRepository, self)._get_source(target)
    # Exactly the same format: required because things like the chk page
    # layout might differ otherwise.
    return GroupCHKStreamSource(self, target)

838

839

840

class GroupCHKStreamSource(KnitPackStreamSource):
    """Used when both the source and target repo are GroupCHK repos."""

    def __init__(self, from_repository, to_format):
        """Create a StreamSource streaming from from_repository."""
        super(GroupCHKStreamSource, self).__init__(from_repository, to_format)
        self._revision_keys = None
        self._text_keys = None
        self._text_fetch_order = 'groupcompress'
        # Root keys of the id_to_entry and parent_id_basename_to_file_id
        # maps. They are filled while the inventory stream is consumed and
        # set back to None once the matching chk stream has been consumed.
        self._chk_id_roots = None
        self._chk_p_id_roots = None

    def _get_inventory_stream(self, inventory_keys):
        """Get a stream of inventory texts.

        self._chk_id_roots and self._chk_p_id_roots are reset to empty
        lists immediately, but they are only populated lazily: each record
        adds its root keys as it is pulled from the returned stream, so the
        lists are complete once that stream has been fully consumed.

        :param inventory_keys: keys requested from the source repository's
            inventories.
        :return: an ('inventories', record_generator) tuple.
        :raises AssertionError: (while iterating) if an inventory has no
            parent_id_basename_to_file_id map.
        """
        self._chk_id_roots = []
        self._chk_p_id_roots = []

        def _filtered_inv_stream():
            # The sets give fast duplicate detection; the lists on self
            # keep the root keys in first-seen order.
            id_roots_set = set()
            p_id_roots_set = set()
            source_vf = self.from_repository.inventories
            stream = source_vf.get_record_stream(inventory_keys,
                                                 'groupcompress', True)
            for record in stream:
                inv_bytes = record.get_bytes_as('fulltext')
                chk_inv = inventory.CHKInventory.deserialise(
                    None, inv_bytes, record.key)
                key = chk_inv.id_to_entry.key()
                if key not in id_roots_set:
                    self._chk_id_roots.append(key)
                    id_roots_set.add(key)
                p_id_map = chk_inv.parent_id_basename_to_file_id
                if p_id_map is None:
                    raise AssertionError('Parent id -> file_id map not set')
                key = p_id_map.key()
                if key not in p_id_roots_set:
                    p_id_roots_set.add(key)
                    self._chk_p_id_roots.append(key)
                yield record
            # We have finished processing all of the inventory records, we
            # don't need these sets anymore
            id_roots_set.clear()
            p_id_roots_set.clear()

        return ('inventories', _filtered_inv_stream())

    def _get_filtered_chk_streams(self, excluded_revision_ids):
        """Yield the two 'chk_bytes' substreams for the collected roots.

        The first substream walks the id_to_entry maps rooted at
        self._chk_id_roots and, as a side effect of being consumed, adds a
        (file_id, revision_id) key to self._text_keys for every item seen.
        The second walks the parent_id_basename_to_file_id maps rooted at
        self._chk_p_id_roots. Each substream resets its root list on self
        to None once exhausted.

        :param excluded_revision_ids: iterable of revision ids; the root
            keys of those whose inventories are present are passed to
            chk_map.iter_interesting_nodes as uninteresting. The argument
            itself is not modified.
        :return: a generator of ('chk_bytes', record_generator) tuples.
        """
        self._text_keys = set()
        # Work on a private copy so that dropping NULL_REVISION does not
        # mutate the collection owned by the caller.
        excluded_revision_ids = set(excluded_revision_ids)
        excluded_revision_ids.discard(_mod_revision.NULL_REVISION)
        uninteresting_root_keys = set()
        uninteresting_pid_root_keys = set()
        if excluded_revision_ids:
            # filter out any excluded revisions whose inventories are not
            # actually present
            # TODO: Update Repository.iter_inventories() to add
            #       ignore_missing=True
            present_ids = self.from_repository._find_present_inventory_ids(
                excluded_revision_ids)
            for inv in self.from_repository.iter_inventories(present_ids):
                uninteresting_root_keys.add(inv.id_to_entry.key())
                uninteresting_pid_root_keys.add(
                    inv.parent_id_basename_to_file_id.key())
        bytes_to_info = inventory.CHKInventory._bytes_to_utf8name_key
        chk_bytes = self.from_repository.chk_bytes

        def _filter_id_to_entry():
            for record, items in chk_map.iter_interesting_nodes(
                    chk_bytes, self._chk_id_roots, uninteresting_root_keys):
                for _name, value_bytes in items:
                    # Note: we don't care about name_utf8, because we are
                    # always rich-root = True
                    _, file_id, revision_id = bytes_to_info(value_bytes)
                    self._text_keys.add((file_id, revision_id))
                if record is not None:
                    yield record
            # Consumed
            self._chk_id_roots = None
        yield 'chk_bytes', _filter_id_to_entry()

        def _get_parent_id_basename_to_file_id_pages():
            for record, items in chk_map.iter_interesting_nodes(
                    chk_bytes, self._chk_p_id_roots,
                    uninteresting_pid_root_keys):
                if record is not None:
                    yield record
            # Consumed
            self._chk_p_id_roots = None
        yield 'chk_bytes', _get_parent_id_basename_to_file_id_pages()

    def get_stream(self, search):
        """Yield the substreams needed to transfer the searched revisions.

        The order is: whatever self._fetch_revision_texts() yields, the
        inventory stream, the two filtered chk streams, and finally the
        result of self._get_text_stream().

        :param search: object whose get_keys() gives the revision ids.
        """
        revision_ids = search.get_keys()
        for stream_info in self._fetch_revision_texts(revision_ids):
            yield stream_info
        self._revision_keys = [(rev_id,) for rev_id in revision_ids]
        yield self._get_inventory_stream(self._revision_keys)
        # TODO: The keys to exclude might be part of the search recipe
        # For now, exclude all parents that are at the edge of ancestry, for
        # which we have inventories
        from_repo = self.from_repository
        parent_ids = from_repo._find_parent_ids_of_revisions(revision_ids)
        for stream_info in self._get_filtered_chk_streams(parent_ids):
            yield stream_info
        # NOTE(review): presumably relies on self._text_keys having been
        # filled by the chk streams above - confirm in _get_text_stream.
        yield self._get_text_stream()

    def get_stream_for_missing_keys(self, missing_keys):
        """Yield substreams that supply the given missing inventory keys.

        :param missing_keys: iterable of keys whose first element must be
            'inventories'; the remainder of each key is the inventory key.
        :raises AssertionError: (while iterating) if a key is not an
            inventory key, or if root keys collected by get_stream() have
            not been consumed yet.
        """
        # missing keys can only occur when we are byte copying and not
        # translating (because translation means we don't send
        # unreconstructable deltas ever).
        missing_inventory_keys = set()
        for key in missing_keys:
            if key[0] != 'inventories':
                raise AssertionError('The only missing keys we should'
                    ' be filling in are inventory keys, not %s'
                    % (key[0],))
            missing_inventory_keys.add(key[1:])
        if self._chk_id_roots or self._chk_p_id_roots:
            raise AssertionError('Cannot call get_stream_for_missing_keys'
                ' until all of get_stream() has been consumed.')
        # Yield the inventory stream, so we can find the chk stream
        yield self._get_inventory_stream(missing_inventory_keys)
        # We use the empty set for excluded_revision_ids, to make it clear
        # that we want to transmit all referenced chk pages.
        for stream_info in self._get_filtered_chk_streams(set()):
            yield stream_info

966

967

968

class RepositoryFormatCHK1(RepositoryFormatPack):
    """A hashed CHK+group compress pack repository."""

    # Classes and serializer used by repositories of this format.
    repository_class = CHKInventoryRepository
    _commit_builder_class = PackRootCommitBuilder
    _serializer = chk_serializer.chk_serializer_255_bigpage
    # What index classes to use
    index_builder_class = BTreeBuilder
    index_class = BTreeGraphIndex

    supports_external_lookups = True
    supports_chks = True
    # For right now, setting this to True gives us InterModel1And2 rather
    # than InterDifferingSerializer
    # NOTE(review): presumably this remark is about rich_root_data - confirm.
    rich_root_data = True
    _commit_inv_deltas = True

    # Note: We cannot unpack a delta that references a text we haven't
    # seen yet. There are 2 options, work in fulltexts, or require
    # topological sorting. Using fulltexts is more optimal for local
    # operations, because the source can be smart about extracting
    # multiple in-a-row (and sharing strings). Topological is better
    # for remote, because we access less data.
    _fetch_order = 'unordered'
    _fetch_uses_deltas = False # essentially ignored by the groupcompress code.
    fast_deltas = True

    def _get_matching_bzrdir(self):
        """Getter for _matchingbzrdir: make a 'development6-rich-root' bzrdir."""
        registry = bzrdir.format_registry
        return registry.make_bzrdir('development6-rich-root')

    def _ignore_setting_bzrdir(self, format):
        """Setter for _matchingbzrdir: the assigned value is discarded."""

    _matchingbzrdir = property(fget=_get_matching_bzrdir,
                               fset=_ignore_setting_bzrdir)

    def get_format_string(self):
        """See RepositoryFormat.get_format_string()."""
        format_name = (
            'Bazaar development format - group compression and chk inventory')
        requirement = ' (needs bzr.dev from 1.14)\n'
        return format_name + requirement

    def get_format_description(self):
        """See RepositoryFormat.get_format_description()."""
        summary = "Development repository format - rich roots, group compression"
        return summary + " and chk inventories"

    def check_conversion_target(self, target_format):
        """Refuse conversion to formats lacking rich roots or nested trees.

        :param target_format: the format being converted to.
        :raises errors.BadConversionTarget: if target_format.rich_root_data
            is false, or if target_format has no true
            supports_tree_reference attribute.
        """
        if not target_format.rich_root_data:
            raise errors.BadConversionTarget(
                'Does not support rich root data.', target_format)
        # NOTE(review): nested-tree support is demanded of the target
        # without consulting this format's own setting - confirm intended.
        if getattr(target_format, 'supports_tree_reference', False):
            return
        raise errors.BadConversionTarget(
            'Does not support nested trees', target_format)

1018

1019

Older »