~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/knit.py

Committer: Martin Pool
Date: 2006-03-21 12:26:54 UTC
mto: This revision was merged to the branch mainline in revision 1621.
Revision ID: mbp@sourcefrog.net-20060321122654-514047ed65795a17

New developer commands 'weave-list' and 'weave-join'.

files added:
NEWS.developers

build-api

bzrlib/tests/test_doc_generate.py

bzrlib/util/configobj/validate.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

notes

files removed:
COPYING.txt

bzr.ico

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/api.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_knit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/cache_utf8.py

bzrlib/cmd_version_info.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/dirstate.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/help_topics.py

bzrlib/hooks.py

bzrlib/ignores.py

bzrlib/inspect_for_copy.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/mutabletree.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/revisiontree.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/strace.py

bzrlib/tag.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HttpServer.py

bzrlib/tests/TransportUtil.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/commands

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_pack.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_info.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_uncommit.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/remote.py

bzrlib/transport/ssh.py

bzrlib/treebuilder.py

bzrlib/tuned_gzip.py

bzrlib/urlutils.py

bzrlib/util/bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/workingtree_4.py

bzrlib/xml6.py

bzrlib/xml7.py

doc/README.1st

doc/bazaar-vcs.org.kid

doc/centralized_workflow.txt

doc/configuration.txt

doc/default.css

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/bundle-creation.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/initial-push-pull.txt

doc/developers/merge-scaling.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/profiling.txt

doc/developers/revert.txt

doc/developers/scratch.txt

doc/developers/status.txt

doc/developers/uncommit.txt

doc/http_smart_server.txt

doc/index.txt

doc/plugins.txt

doc/server.txt

doc/setting_up_email.txt

doc/shared_repository_layouts.txt

doc/specifying_revisions.txt

doc/using_aliases.txt

doc/version_info.txt

man1

profile_imports.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/doc_generate/autodoc_rstx.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

files renamed:
doc/developers/HACKING => HACKING

bzrlib/deprecated_graph.py => bzrlib/graph.py

bzrlib/tests/blackbox/test_annotate.py => bzrlib/tests/test_annotate.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py => bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_commands.py => bzrlib/tests/test_command.py

bzrlib/tests/test_deprecated_graph.py => bzrlib/tests/test_graph.py

bzrlib/tests/repository_implementations/test_revision.py => bzrlib/tests/test_revprops.py

bzrlib/tests/blackbox/test_uncommit.py => bzrlib/tests/test_uncommit.py

bzrlib/win32utils.py => bzrlib/win32console.py

doc/tutorial.txt => tutorial.txt

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/elementtree/ElementTree.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

contrib/bash/bzr.simple

contrib/newinventory.py

generate_docs.py

setup.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/knit.py

# Written by Martin Pool.

# Modified by Johan Rydberg <jrydberg@gnu.org>

# Modified by Robert Collins <robert.collins@canonical.com>

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

from copy import copy

from cStringIO import StringIO

import difflib

import gzip

from itertools import izip, chain

import operator

import os

import sys

import warnings

import bzrlib

from bzrlib import (

cache_utf8,

errors,

osutils,

patiencediff,

progress,

ui,

)

from bzrlib.errors import (

FileExists,

NoSuchFile,

KnitError,

InvalidRevisionId,

KnitCorrupt,

KnitHeaderError,

RevisionNotPresent,

RevisionAlreadyPresent,

)

from bzrlib.tuned_gzip import GzipFile

import bzrlib.errors as errors

from bzrlib.errors import FileExists, NoSuchFile, KnitError, \

InvalidRevisionId, KnitCorrupt, KnitHeaderError, \

RevisionNotPresent, RevisionAlreadyPresent

from bzrlib.trace import mutter

from bzrlib.osutils import (

contains_whitespace,

contains_linebreaks,

sha_strings,

)

from bzrlib.symbol_versioning import DEPRECATED_PARAMETER, deprecated_passed

from bzrlib.osutils import contains_whitespace, contains_linebreaks, \

sha_strings

from bzrlib.versionedfile import VersionedFile, InterVersionedFile

from bzrlib.tsort import topo_sort

100

import bzrlib.ui

101

import bzrlib.weave

102

from bzrlib.versionedfile import VersionedFile, InterVersionedFile

103

104

105

# TODO: Split out code specific to this format into an associated object.

107

# TODO: Can we put in some kind of value to check that the index and data

108

# files belong together?

109

110

# TODO: accommodate binaries, perhaps by storing a byte count

# TODO: accomodate binaries, perhaps by storing a byte count

111

112

# TODO: function to check whole file

113

127

108

128

109

def annotate_iter(self):

129

110

"""Yield tuples of (origin, text) for each content line."""

130

return iter(self._lines)

111

for origin, text in self._lines:

112

yield origin, text

131

113

132

114

def annotate(self):

133

115

"""Return a list of (origin, text) tuples."""

135

117

136

118

def line_delta_iter(self, new_lines):

137

119

"""Generate line-based delta from this content to new_lines."""

138

new_texts = new_lines.text()

139

old_texts = self.text()

140

s = KnitSequenceMatcher(None, old_texts, new_texts)

141

for tag, i1, i2, j1, j2 in s.get_opcodes():

142

if tag == 'equal':

120

new_texts = [text for origin, text in new_lines._lines]

121

old_texts = [text for origin, text in self._lines]

122

s = SequenceMatcher(None, old_texts, new_texts)

123

for op in s.get_opcodes():

124

if op[0] == 'equal':

143

125

continue

144

# ofrom, oto, length, data

145

yield i1, i2, j2 - j1, new_lines._lines[j1:j2]

126

# ofrom oto length data

127

yield (op[1], op[2], op[4]-op[3], new_lines._lines[op[3]:op[4]])

146

128

147

129

def line_delta(self, new_lines):

148

130

return list(self.line_delta_iter(new_lines))

150

132

def text(self):

151

133

return [text for origin, text in self._lines]

152

134

153

def copy(self):

154

return KnitContent(self._lines[:])

155

156

135

157

136

class _KnitFactory(object):

158

137

"""Base factory for creating content objects."""

159

138

160

def make(self, lines, version_id):

139

def make(self, lines, version):

161

140

num_lines = len(lines)

162

return KnitContent(zip([version_id] * num_lines, lines))

141

return KnitContent(zip([version] * num_lines, lines))

163

142

164

143

165

144

class KnitAnnotateFactory(_KnitFactory):

167

146

168

147

annotated = True

169

148

170

def parse_fulltext(self, content, version_id):

149

def parse_fulltext(self, content, version):

171

150

"""Convert fulltext to internal representation

172

151

173

152

fulltext content is of the format

175

154

internal representation is of the format:

176

155

(revid, plaintext)

177

156

"""

178

# TODO: jam 20070209 The tests expect this to be returned as tuples,

179

# but the code itself doesn't really depend on that.

180

# Figure out a way to not require the overhead of turning the

181

# list back into tuples.

182

lines = [tuple(line.split(' ', 1)) for line in content]

157

lines = []

158

for line in content:

159

origin, text = line.split(' ', 1)

160

lines.append((origin.decode('utf-8'), text))

183

161

return KnitContent(lines)

184

162

185

163

def parse_line_delta_iter(self, lines):

186

return iter(self.parse_line_delta(lines))

187

188

def parse_line_delta(self, lines, version_id):

189

164

"""Convert a line based delta into internal representation.

190

165

191

166

line delta is in the form of:

192

167

intstart intend intcount

193

168

1..count lines:

194

169

revid(utf8) newline\n

195

internal representation is

170

internal represnetation is

196

171

(start, end, count, [1..count tuples (revid, newline)])

197

172

"""

198

result = []

199

lines = iter(lines)

200

next = lines.next

201

202

cache = {}

203

def cache_and_return(line):

204

origin, text = line.split(' ', 1)

205

return cache.setdefault(origin, origin), text

206

207

# walk through the lines parsing.

208

for header in lines:

209

start, end, count = [int(n) for n in header.split(',')]

210

contents = [tuple(next().split(' ', 1)) for i in xrange(count)]

211

result.append((start, end, count, contents))

212

return result

213

214

def get_fulltext_content(self, lines):

215

"""Extract just the content lines from a fulltext."""

216

return (line.split(' ', 1)[1] for line in lines)

217

218

def get_linedelta_content(self, lines):

219

"""Extract just the content from a line delta.

220

221

This doesn't return all of the extra information stored in a delta.

222

Only the actual content lines.

223

"""

224

lines = iter(lines)

225

next = lines.next

226

for header in lines:

227

header = header.split(',')

228

count = int(header[2])

229

for i in xrange(count):

230

origin, text = next().split(' ', 1)

231

yield text

173

while lines:

174

header = lines.pop(0)

175

start, end, c = [int(n) for n in header.split(',')]

176

contents = []

177

for i in range(c):

178

origin, text = lines.pop(0).split(' ', 1)

179

contents.append((origin.decode('utf-8'), text))

180

yield start, end, c, contents

181

182

def parse_line_delta(self, lines, version):

183

return list(self.parse_line_delta_iter(lines))

232

184

233

185

def lower_fulltext(self, content):

234

186

"""convert a fulltext content record into a serializable form.

235

187

236

188

see parse_fulltext which this inverts.

237

189

"""

238

# TODO: jam 20070209 We only do the caching thing to make sure that

239

# the origin is a valid utf-8 line, eventually we could remove it

240

return ['%s %s' % (o, t) for o, t in content._lines]

190

return ['%s %s' % (o.encode('utf-8'), t) for o, t in content._lines]

241

191

242

192

def lower_line_delta(self, delta):

243

193

"""convert a delta into a serializable form.

244

194

245

See parse_line_delta which this inverts.

195

See parse_line_delta_iter which this inverts.

246

196

"""

247

# TODO: jam 20070209 We only do the caching thing to make sure that

248

# the origin is a valid utf-8 line, eventually we could remove it

249

197

out = []

250

198

for start, end, c, lines in delta:

251

199

out.append('%d,%d,%d\n' % (start, end, c))

252

out.extend(origin + ' ' + text

253

for origin, text in lines)

200

for origin, text in lines:

201

out.append('%s %s' % (origin.encode('utf-8'), text))

254

202

return out

255

203

256

204

259

207

260

208

annotated = False

261

209

262

def parse_fulltext(self, content, version_id):

210

def parse_fulltext(self, content, version):

263

211

"""This parses an unannotated fulltext.

264

212

265

213

Note that this is not a noop - the internal representation

266

214

has (versionid, line) - it's just a constant versionid.

267

215

"""

268

return self.make(content, version_id)

216

return self.make(content, version)

269

217

270

def parse_line_delta_iter(self, lines, version_id):

271

cur = 0

272

num_lines = len(lines)

273

while cur < num_lines:

274

header = lines[cur]

275

cur += 1

218

def parse_line_delta_iter(self, lines, version):

219

while lines:

220

header = lines.pop(0)

276

221

start, end, c = [int(n) for n in header.split(',')]

277

yield start, end, c, zip([version_id] * c, lines[cur:cur+c])

278

cur += c

279

280

def parse_line_delta(self, lines, version_id):

281

return list(self.parse_line_delta_iter(lines, version_id))

282

283

def get_fulltext_content(self, lines):

284

"""Extract just the content lines from a fulltext."""

285

return iter(lines)

286

287

def get_linedelta_content(self, lines):

288

"""Extract just the content from a line delta.

289

290

This doesn't return all of the extra information stored in a delta.

291

Only the actual content lines.

292

"""

293

lines = iter(lines)

294

next = lines.next

295

for header in lines:

296

header = header.split(',')

297

count = int(header[2])

298

for i in xrange(count):

299

yield next()

300

222

yield start, end, c, zip([version] * c, lines[:c])

223

del lines[:c]

224

225

def parse_line_delta(self, lines, version):

226

return list(self.parse_line_delta_iter(lines, version))

227

301

228

def lower_fulltext(self, content):

302

229

return content.text()

303

230

330

257

stored and retrieved.

331

258

"""

332

259

333

def __init__(self, relpath, transport, file_mode=None, access_mode=None,

334

factory=None, basis_knit=DEPRECATED_PARAMETER, delta=True,

335

create=False, create_parent_dir=False, delay_create=False,

336

dir_mode=None):

260

def __init__(self, relpath, transport, file_mode=None, access_mode=None, factory=None,

261

basis_knit=None, delta=True, create=False):

337

262

"""Construct a knit at location specified by relpath.

338

263

339

264

:param create: If not True, only open an existing knit.

340

:param create_parent_dir: If True, create the parent directory if

341

creating the file fails. (This is used for stores with

342

hash-prefixes that may not exist yet)

343

:param delay_create: The calling code is aware that the knit won't

344

actually be created until the first data is stored.

345

265

"""

346

if deprecated_passed(basis_knit):

347

warnings.warn("KnitVersionedFile.__(): The basis_knit parameter is"

348

" deprecated as of bzr 0.9.",

349

DeprecationWarning, stacklevel=2)

350

266

if access_mode is None:

351

267

access_mode = 'w'

352

268

super(KnitVersionedFile, self).__init__(access_mode)

353

269

assert access_mode in ('r', 'w'), "invalid mode specified %r" % access_mode

270

assert not basis_knit or isinstance(basis_knit, KnitVersionedFile), \

271

type(basis_knit)

272

354

273

self.transport = transport

355

274

self.filename = relpath

275

self.basis_knit = basis_knit

356

276

self.factory = factory or KnitAnnotateFactory()

357

277

self.writable = (access_mode == 'w')

358

278

self.delta = delta

359

279

360

self._max_delta_chain = 200

361

362

280

self._index = _KnitIndex(transport, relpath + INDEX_SUFFIX,

363

access_mode, create=create, file_mode=file_mode,

364

create_parent_dir=create_parent_dir, delay_create=delay_create,

365

dir_mode=dir_mode)

281

access_mode, create=create)

366

282

self._data = _KnitData(transport, relpath + DATA_SUFFIX,

367

access_mode, create=create and not len(self), file_mode=file_mode,

368

create_parent_dir=create_parent_dir, delay_create=delay_create,

369

dir_mode=dir_mode)

370

371

def __repr__(self):
    """Show the class name and the transport's absolute path of the knit."""
    location = self.transport.abspath(self.filename)
    return '%s(%s)' % (self.__class__.__name__, location)

374

375

def _check_should_delta(self, first_parents):
    """Decide whether a new text should be stored as a delta.

    Starting from first_parents, the first parent of each version is
    followed for at most _max_delta_chain steps. The sizes the index
    reports for the delta records passed on the way are added up until
    a fulltext record is reached.

    :param first_parents: Parents of the text about to be added; only
        the first entry is followed.
    :return: True if we should create a new delta: a fulltext was
        reached within the limit and its size is greater than the
        combined size of the deltas leading to it. False if we should
        use a full text, which includes the case where no fulltext was
        found within the limit.
    """
    chain_size = 0
    parents = first_parents
    steps_left = self._max_delta_chain
    while steps_left > 0:
        steps_left -= 1
        ancestor = parents[0]
        method = self._index.get_method(ancestor)
        _pos, size = self._index.get_position(ancestor)
        if method == 'fulltext':
            # Deltas are only worthwhile while they stay smaller than
            # the fulltext they are built on.
            return size > chain_size
        chain_size += size
        parents = self._index.get_parents(ancestor)
    # We couldn't find a fulltext, so we must create a new one
    return False

283

access_mode, create=not len(self.versions()))

403

284

404

285

def _add_delta(self, version_id, parents, delta_parent, sha1, noeol, delta):

405

286

"""See VersionedFile._add_delta()."""

438

319

# To speed the extract of texts the delta chain is limited

439

320

# to a fixed number of deltas. This should minimize both

440

321

# I/O and the time spent applying deltas.

441

# The window was changed to a maximum of 200 deltas, but also added

442

# was a check that the total compressed size of the deltas is

443

# smaller than the compressed size of the fulltext.

444

if not self._check_should_delta([delta_parent]):

445

# We don't want a delta here, just do a normal insertion.

322

count = 0

323

delta_parents = [delta_parent]

324

while count < 25:

325

parent = delta_parents[0]

326

method = self._index.get_method(parent)

327

if method == 'fulltext':

328

break

329

delta_parents = self._index.get_parents(parent)

330

count = count + 1

331

if method == 'line-delta':

332

# did not find a fulltext in the delta limit.

333

# just do a normal insertion.

446

334

return super(KnitVersionedFile, self)._add_delta(version_id,

447

335

parents,

448

336

delta_parent,

456

344

where, size = self._data.add_record(version_id, digest, store_lines)

457

345

self._index.add_version(version_id, options, where, size, parents)

458

346

459

def _add_raw_records(self, records, data):
    """Add all the records 'records' with data pre-joined in 'data'.

    The data is written with a single add_raw_record call, then one
    index entry per record is handed to the index in a single
    add_versions call. When the data file has caching switched on, each
    record's slice of data is also stored in its cache.

    :param records: A list of tuples(version_id, options, parents, size).
    :param data: The data for the records. When it is written, the records
        are adjusted to have pos pointing into data by the sum of
        the preceding records sizes.
    """
    # write all the data
    start = self._data.add_raw_record(data)
    entries = []
    consumed = 0
    for version_id, options, parents, size in records:
        end = consumed + size
        entries.append((version_id, options, start + consumed, size,
                        parents))
        if self._data._do_cache:
            self._data._cache[version_id] = data[consumed:end]
        consumed = end
    self._index.add_versions(entries)

478

479

def enable_cache(self):
    """Start caching data for this knit.

    Delegates to enable_cache() on the knit's data file object.
    """
    data_file = self._data
    data_file.enable_cache()

482

483

347

def clear_cache(self):
    """Clear the data cache only.

    Delegates to clear_cache() on the knit's data file object.
    """
    data_file = self._data
    data_file.clear_cache()

488

352

"""See VersionedFile.copy_to()."""

489

353

# copy the current index to a temp index to avoid racing with local

490

354

# writes

491

transport.put_file_non_atomic(name + INDEX_SUFFIX + '.tmp',

492

self.transport.get(self._index._filename))

355

transport.put(name + INDEX_SUFFIX + '.tmp', self.transport.get(self._index._filename))

493

356

# copy the data file

494

f = self._data._open_file()

495

try:

496

transport.put_file(name + DATA_SUFFIX, f)

497

finally:

498

f.close()

499

# move the copied index into place

500

transport.move(name + INDEX_SUFFIX + '.tmp', name + INDEX_SUFFIX)

357

transport.put(name + DATA_SUFFIX, self._data._open_file())

358

# rename the copied index into place

359

transport.rename(name + INDEX_SUFFIX + '.tmp', name + INDEX_SUFFIX)

501

360

502

361

def create_empty(self, name, transport, mode=None):

503

return KnitVersionedFile(name, transport, factory=self.factory,

504

delta=self.delta, create=True)

362

return KnitVersionedFile(name, transport, factory=self.factory, delta=self.delta, create=True)

505

363

506

def _fix_parents(self, version_id, new_parents):

364

def _fix_parents(self, version, new_parents):

507

365

"""Fix the parents list for version.

508

366

509

367

This is done by appending a new version to the index

511

369

the parents list must be a superset of the current

512

370

list.

513

371

"""

514

current_values = self._index._cache[version_id]

372

current_values = self._index._cache[version]

515

373

assert set(current_values[4]).difference(set(new_parents)) == set()

516

self._index.add_version(version_id,

374

self._index.add_version(version,

517

375

current_values[1],

518

376

current_values[2],

519

377

current_values[3],

521

379

522

380

def get_delta(self, version_id):

523

381

"""Get a delta for constructing version from some other version."""

524

version_id = osutils.safe_revision_id(version_id)

525

self.check_not_reserved_id(version_id)

526

382

if not self.has_version(version_id):

527

383

raise RevisionNotPresent(version_id, self.filename)

528

384

533

389

parent = None

534

390

data_pos, data_size = self._index.get_position(version_id)

535

391

data, sha1 = self._data.read_records(((version_id, data_pos, data_size),))[version_id]

392

version_idx = self._index.lookup(version_id)

536

393

noeol = 'no-eol' in self._index.get_options(version_id)

537

394

if 'fulltext' == self._index.get_method(version_id):

538

new_content = self.factory.parse_fulltext(data, version_id)

395

new_content = self.factory.parse_fulltext(data, version_idx)

539

396

if parent is not None:

540

397

reference_content = self._get_content(parent)

541

398

old_texts = reference_content.text()

542

399

else:

543

400

old_texts = []

544

401

new_texts = new_content.text()

545

delta_seq = KnitSequenceMatcher(None, old_texts, new_texts)

402

delta_seq = SequenceMatcher(None, old_texts, new_texts)

546

403

return parent, sha1, noeol, self._make_line_delta(delta_seq, new_content)

547

404

else:

548

delta = self.factory.parse_line_delta(data, version_id)

405

delta = self.factory.parse_line_delta(data, version_idx)

549

406

return parent, sha1, noeol, delta

550

407

551

408

def get_graph_with_ghosts(self):

553

410

graph_items = self._index.get_graph()

554

411

return dict(graph_items)

555

412

556

def get_sha1(self, version_id):
    """See VersionedFile.get_sha1().

    The digest is taken from the record map entry for version_id, after
    the id has been passed through osutils.safe_revision_id.
    """
    safe_id = osutils.safe_revision_id(version_id)
    records = self._get_record_map([safe_id])
    _method, _content, digest, _build_parent = records[safe_id]
    return digest

562

563

413

@staticmethod

564

414

def get_suffixes():

565

415

"""See VersionedFile.get_suffixes()."""

567

417

568

418

def has_ghost(self, version_id):

569

419

"""True if there is a ghost reference in the file to version_id."""

570

version_id = osutils.safe_revision_id(version_id)

571

420

# maybe we have it

572

421

if self.has_version(version_id):

573

422

return False

586

435

587

436

def has_version(self, version_id):
    """See VersionedFile.has_version.

    The id is passed through osutils.safe_revision_id before the index
    is asked whether it holds that version.
    """
    safe_id = osutils.safe_revision_id(version_id)
    return self._index.has_version(safe_id)

591

439

592

440

__contains__ = has_version

600

448

delta_seq = None

601

449

for parent_id in parents:

602

450

merge_content = self._get_content(parent_id, parent_texts)

603

seq = patiencediff.PatienceSequenceMatcher(

604

None, merge_content.text(), content.text())

451

seq = SequenceMatcher(None, merge_content.text(), content.text())

605

452

if delta_seq is None:

606

453

# setup a delta seq to reuse.

607

454

delta_seq = seq

618

465

reference_content = self._get_content(parents[0], parent_texts)

619

466

new_texts = content.text()

620

467

old_texts = reference_content.text()

621

delta_seq = patiencediff.PatienceSequenceMatcher(

622

None, old_texts, new_texts)

468

delta_seq = SequenceMatcher(None, old_texts, new_texts)

623

469

return self._make_line_delta(delta_seq, content)

624

470

625

471

def _make_line_delta(self, delta_seq, new_content):

631

477

diff_hunks.append((op[1], op[2], op[4]-op[3], new_content._lines[op[3]:op[4]]))

632

478

return diff_hunks

633

479

634

def _get_components_positions(self, version_ids):

635

"""Produce a map of position data for the components of versions.

636

637

This data is intended to be used for retrieving the knit records.

638

639

A dict of version_id to (method, data_pos, data_size, next) is

640

returned.

641

method is the way referenced data should be applied.

642

data_pos is the position of the data in the knit.

643

data_size is the size of the data in the knit.

644

next is the build-parent of the version, or None for fulltexts.

480

def _get_components(self, version_id):

481

"""Return a list of (version_id, method, data) tuples that

482

makes up version specified by version_id of the knit.

483

484

The components should be applied in the order of the returned

485

list.

486

487

The basis knit will be used to the largest extent possible

488

since it is assumed that accesses to it is faster.

645

489

"""

646

component_data = {}

647

for version_id in version_ids:

648

cursor = version_id

649

650

while cursor is not None and cursor not in component_data:

651

method = self._index.get_method(cursor)

652

if method == 'fulltext':

653

next = None

654

else:

655

next = self.get_parents(cursor)[0]

656

data_pos, data_size = self._index.get_position(cursor)

657

component_data[cursor] = (method, data_pos, data_size, next)

658

cursor = next

659

return component_data

660

490

# needed_revisions holds a list of (method, version_id) of

491

# versions that is needed to be fetched to construct the final

492

# version of the file.

493

494

# basis_revisions is a list of versions that needs to be

495

# fetched but exists in the basis knit.

496

497

basis = self.basis_knit

498

needed_versions = []

499

basis_versions = []

500

cursor = version_id

501

502

while 1:

503

picked_knit = self

504

if basis and basis._index.has_version(cursor):

505

picked_knit = basis

506

basis_versions.append(cursor)

507

method = picked_knit._index.get_method(cursor)

508

needed_versions.append((method, cursor))

509

if method == 'fulltext':

510

break

511

cursor = picked_knit.get_parents(cursor)[0]

512

513

components = {}

514

if basis_versions:

515

records = []

516

for comp_id in basis_versions:

517

data_pos, data_size = basis._index.get_data_position(comp_id)

518

records.append((piece_id, data_pos, data_size))

519

components.update(basis._data.read_records(records))

520

521

records = []

522

for comp_id in [vid for method, vid in needed_versions

523

if vid not in basis_versions]:

524

data_pos, data_size = self._index.get_position(comp_id)

525

records.append((comp_id, data_pos, data_size))

526

components.update(self._data.read_records(records))

527

528

# get_data_records returns a mapping with the version id as

529

# index and the value as data. The order the components need

530

# to be applied is held by needed_versions (reversed).

531

out = []

532

for method, comp_id in reversed(needed_versions):

533

out.append((comp_id, method, components[comp_id]))

534

535

return out

536

661

537

def _get_content(self, version_id, parent_texts={}):

662

538

"""Returns a content object that makes up the specified

663

539

version."""

668

544

if cached_version is not None:

669

545

return cached_version

670

546

671

text_map, contents_map = self._get_content_maps([version_id])

672

return contents_map[version_id]

547

if self.basis_knit and version_id in self.basis_knit:

548

return self.basis_knit._get_content(version_id)

549

550

content = None

551

components = self._get_components(version_id)

552

for component_id, method, (data, digest) in components:

553

version_idx = self._index.lookup(component_id)

554

if method == 'fulltext':

555

assert content is None

556

content = self.factory.parse_fulltext(data, version_idx)

557

elif method == 'line-delta':

558

delta = self.factory.parse_line_delta(data, version_idx)

559

content._lines = self._apply_delta(content._lines, delta)

560

561

if 'no-eol' in self._index.get_options(version_id):

562

line = content._lines[-1][1].rstrip('\n')

563

content._lines[-1] = (content._lines[-1][0], line)

564

565

if sha_strings(content.text()) != digest:

566

import pdb;pdb.set_trace()

567

raise KnitCorrupt(self.filename, 'sha-1 does not match %s' % version_id)

568

569

return content

673

570

674

571

def _check_versions_present(self, version_ids):

675

572

"""Check that all specified versions are present."""

676

self._index.check_versions_present(version_ids)

573

version_ids = set(version_ids)

574

for r in list(version_ids):

575

if self._index.has_version(r):

576

version_ids.remove(r)

577

if version_ids:

578

raise RevisionNotPresent(list(version_ids)[0], self.filename)

677

579

678

580

def _add_lines_with_ghosts(self, version_id, parents, lines, parent_texts):

679

581

"""See VersionedFile.add_lines_with_ghosts()."""

691

593

assert self.writable, "knit is not opened for write"

692

594

### FIXME escape. RBC 20060228

693

595

if contains_whitespace(version_id):

694

raise InvalidRevisionId(version_id, self.filename)

695

self.check_not_reserved_id(version_id)

596

raise InvalidRevisionId(version_id)

696

597

if self.has_version(version_id):

697

598

raise RevisionAlreadyPresent(version_id, self.filename)

698

self._check_lines_not_unicode(lines)

699

self._check_lines_are_lines(lines)

599

600

if False or __debug__:

601

for l in lines:

602

assert '\n' not in l[:-1]

700

603

701

604

def _add(self, version_id, lines, parents, delta, parent_texts):

702

605

"""Add a set of lines on top of version specified by parents.

742

645

# To speed the extract of texts the delta chain is limited

743

646

# to a fixed number of deltas. This should minimize both

744

647

# I/O and the time spent applying deltas.

745

delta = self._check_should_delta(present_parents)

648

count = 0

649

delta_parents = present_parents

650

while count < 25:

651

parent = delta_parents[0]

652

method = self._index.get_method(parent)

653

if method == 'fulltext':

654

break

655

delta_parents = self._index.get_parents(parent)

656

count = count + 1

657

if method == 'line-delta':

658

delta = False

746

659

747

assert isinstance(version_id, str)

748

660

lines = self.factory.make(lines, version_id)

749

661

if delta or (self.factory.annotated and len(present_parents) > 0):

750

662

# Merge annotations from parent texts if so is needed.

767

679

768

680

def _clone_text(self, new_version_id, old_version_id, parents):

769

681

"""See VersionedFile.clone_text()."""

770

# FIXME RBC 20060228 make fast by only inserting an index with null

771

# delta.

682

# FIXME RBC 20060228 make fast by only inserting an index with null delta.

772

683

self.add_lines(new_version_id, parents, self.get_lines(old_version_id))

773

684

774

685

def get_lines(self, version_id):
    """See VersionedFile.get_lines().

    Asks get_line_list for this single version and returns its only
    entry.
    """
    line_lists = self.get_line_list([version_id])
    return line_lists[0]

777

778

def _get_record_map(self, version_ids):
    """Produce a dictionary of knit records.

    The position data of every component comes from
    _get_components_positions; the records themselves are then read
    from the data file with read_records_iter.

    The keys are version_ids, the values are tuples of (method, content,
    digest, next).
    method is the way the content should be applied.
    content is a KnitContent object.
    digest is the SHA1 digest of this version id after all steps are done
    next is the build-parent of the version, i.e. the leftmost ancestor.
    If the method is fulltext, next will be None.
    """
    positions = self._get_components_positions(version_ids)
    # Only the id, position and size are needed to read a record.
    wanted = []
    for component_id in positions:
        _method, data_pos, data_size, _parent = positions[component_id]
        wanted.append((component_id, data_pos, data_size))
    result = {}
    for component_id, content, digest in \
            self._data.read_records_iter(wanted):
        method, _pos, _size, build_parent = positions[component_id]
        result[component_id] = (method, content, digest, build_parent)
    return result

799

800

def get_text(self, version_id):
    """See VersionedFile.get_text

    Asks get_texts for this single version and returns its only entry.
    """
    texts = self.get_texts([version_id])
    return texts[0]

803

804

def get_texts(self, version_ids):
    """Return the text of each listed version as a single string.

    Each line list returned by get_line_list is joined, in the same
    order.
    """
    joined = []
    for line_list in self.get_line_list(version_ids):
        joined.append(''.join(line_list))
    return joined

806

807

def get_line_list(self, version_ids):
    """Return the texts of listed versions as a list of strings.

    Every id is first passed through osutils.safe_revision_id, then each
    one is checked with check_not_reserved_id before any text is built.

    :return: One entry per requested version, in the order requested,
        taken from the text map produced by _get_content_maps.
    """
    safe_ids = []
    for raw_id in version_ids:
        safe_ids.append(osutils.safe_revision_id(raw_id))
    for safe_id in safe_ids:
        self.check_not_reserved_id(safe_id)
    texts, _contents = self._get_content_maps(safe_ids)
    ordered = []
    for safe_id in safe_ids:
        ordered.append(texts[safe_id])
    return ordered

814

815

def _get_content_maps(self, version_ids):
    """Produce maps of text and KnitContents

    :param version_ids: The versions to build. RevisionNotPresent is
        raised for the first one the knit does not have.
    :return: (text_map, content_map) where text_map contains the texts for
        the requested versions and content_map contains the KnitContents.
        Both dicts take version_ids as their keys.
    :raises KnitCorrupt: If the sha-1 of a built text does not match the
        digest recorded for that version.
    """
    for wanted in version_ids:
        if self.has_version(wanted):
            continue
        raise RevisionNotPresent(wanted, self.filename)
    records = self._get_record_map(version_ids)

    texts = {}
    # Content built so far for every component, shared between requests.
    built = {}
    results = {}
    for wanted in version_ids:
        # Collect the build chain from the requested version back to its
        # fulltext, stopping early at a component that is already built.
        chain = []
        node = wanted
        while node is not None:
            method, data, digest, build_parent = records[node]
            chain.append((node, method, data, digest))
            if node in built:
                break
            node = build_parent

        # Apply the chain oldest first.
        content = None
        for component_id, method, data, digest in reversed(chain):
            if component_id in built:
                content = built[component_id]
                continue
            if method == 'fulltext':
                assert content is None
                content = self.factory.parse_fulltext(data, wanted)
            elif method == 'line-delta':
                delta = self.factory.parse_line_delta(data, wanted)
                # Copy first so the cached parent content stays intact.
                content = content.copy()
                content._lines = self._apply_delta(content._lines, delta)
            built[component_id] = content

        if 'no-eol' in self._index.get_options(wanted):
            # Strip the trailing newline on a copy, not on the content
            # object held in the shared map.
            content = content.copy()
            origin, last_line = content._lines[-1]
            content._lines[-1] = (origin, last_line.rstrip('\n'))
        results[wanted] = content

        # digest here is the digest from the last applied component.
        text = content.text()
        if sha_strings(text) != digest:
            raise KnitCorrupt(self.filename,
                              'sha-1 does not match %s' % wanted)

        texts[wanted] = text
    return texts, results

869

870

def iter_lines_added_or_present_in_versions(self, version_ids=None,

871

pb=None):

687

return self._get_content(version_id).text()

688

689

def iter_lines_added_or_present_in_versions(self, version_ids=None):

872

690

"""See VersionedFile.iter_lines_added_or_present_in_versions()."""

873

691

if version_ids is None:

874

692

version_ids = self.versions()

875

else:

876

version_ids = [osutils.safe_revision_id(v) for v in version_ids]

877

if pb is None:

878

pb = progress.DummyProgress()

879

# we don't care about inclusions, the caller cares.

693

# we dont care about inclusions, the caller cares.

880

694

# but we need to setup a list of records to visit.

881

695

# we need version_id, position, length

882

696

version_id_records = []

883

requested_versions = set(version_ids)

697

requested_versions = list(version_ids)

884

698

# filter for available versions

885

699

for version_id in requested_versions:

886

700

if not self.has_version(version_id):

887

701

raise RevisionNotPresent(version_id, self.filename)

888

702

# get a in-component-order queue:

703

version_ids = []

889

704

for version_id in self.versions():

890

705

if version_id in requested_versions:

706

version_ids.append(version_id)

891

707

data_pos, length = self._index.get_position(version_id)

892

708

version_id_records.append((version_id, data_pos, length))

893

709

710

pb = bzrlib.ui.ui_factory.nested_progress_bar()

711

count = 0

894

712

total = len(version_id_records)

895

for version_idx, (version_id, data, sha_value) in \

896

enumerate(self._data.read_records_iter(version_id_records)):

897

pb.update('Walking content.', version_idx, total)

898

method = self._index.get_method(version_id)

899

900

assert method in ('fulltext', 'line-delta')

901

if method == 'fulltext':

902

line_iterator = self.factory.get_fulltext_content(data)

903

else:

904

line_iterator = self.factory.get_linedelta_content(data)

905

for line in line_iterator:

906

yield line

907

908

pb.update('Walking content.', total, total)

713

try:

714

pb.update('Walking content.', count, total)

715

for version_id, data, sha_value in \

716

self._data.read_records_iter(version_id_records):

717

pb.update('Walking content.', count, total)

718

method = self._index.get_method(version_id)

719

version_idx = self._index.lookup(version_id)

720

assert method in ('fulltext', 'line-delta')

721

if method == 'fulltext':

722

content = self.factory.parse_fulltext(data, version_idx)

723

for line in content.text():

724

yield line

725

else:

726

delta = self.factory.parse_line_delta(data, version_idx)

727

for start, end, count, lines in delta:

728

for origin, line in lines:

729

yield line

730

count +=1

731

pb.update('Walking content.', total, total)

732

pb.finished()

733

except:

734

pb.update('Walking content.', total, total)

735

pb.finished()

736

raise

909

737

910

738

def num_versions(self):

911

739

"""See VersionedFile.num_versions()."""

915

743

916

744

def annotate_iter(self, version_id):
    """See VersionedFile.annotate_iter.

    Yields the (origin, text) pairs produced by annotate_iter() on the
    content object built for version_id.
    """
    safe_id = osutils.safe_revision_id(version_id)
    annotated = self._get_content(safe_id).annotate_iter()
    for origin, text in annotated:
        yield origin, text

922

749

923

750

def get_parents(self, version_id):

924

751

"""See VersionedFile.get_parents."""

925

# perf notes:

926

# optimism counts!

927

# 52554 calls in 1264 872 internal down from 3674

928

version_id = osutils.safe_revision_id(version_id)

929

try:

930

return self._index.get_parents(version_id)

931

except KeyError:

932

raise RevisionNotPresent(version_id, self.filename)

752

self._check_versions_present([version_id])

753

return list(self._index.get_parents(version_id))

933

754

934

755

def get_parents_with_ghosts(self, version_id):

935

756

"""See VersionedFile.get_parents."""

936

version_id = osutils.safe_revision_id(version_id)

937

try:

938

return self._index.get_parents_with_ghosts(version_id)

939

except KeyError:

940

raise RevisionNotPresent(version_id, self.filename)

757

self._check_versions_present([version_id])

758

return list(self._index.get_parents_with_ghosts(version_id))

941

759

942

def get_ancestry(self, versions, topo_sorted=True):

760

def get_ancestry(self, versions):

943

761

"""See VersionedFile.get_ancestry."""

944

762

if isinstance(versions, basestring):

945

763

versions = [versions]

946

764

if not versions:

947

765

return []

948

versions = [osutils.safe_revision_id(v) for v in versions]

949

return self._index.get_ancestry(versions, topo_sorted)

766

self._check_versions_present(versions)

767

return self._index.get_ancestry(versions)

950

768

951

769

def get_ancestry_with_ghosts(self, versions):

952

770

"""See VersionedFile.get_ancestry_with_ghosts."""

954

772

versions = [versions]

955

773

if not versions:

956

774

return []

957

versions = [osutils.safe_revision_id(v) for v in versions]

775

self._check_versions_present(versions)

958

776

return self._index.get_ancestry_with_ghosts(versions)

959

777

960

778

#@deprecated_method(zero_eight)

967

785

from bzrlib.weave import Weave

968

786

969

787

w = Weave(self.filename)

970

ancestry = set(self.get_ancestry(version_ids, topo_sorted=False))

788

ancestry = self.get_ancestry(version_ids)

971

789

sorted_graph = topo_sort(self._index.get_graph())

972

790

version_list = [vid for vid in sorted_graph if vid in ancestry]

973

791

978

796

for lineno, insert_id, dset, line in w.walk(version_ids):

979

797

yield lineno, insert_id, dset, line

980

798

981

def plan_merge(self, ver_a, ver_b):
    """See VersionedFile.plan_merge.

    Generator of (state, line) pairs comparing the annotated texts of
    ver_a and ver_b. Lines in a matching block are reported as
    'unchanged'. A line only in ver_a is 'killed-b' when the revision
    it is annotated with is in the ancestry of ver_b, otherwise
    'new-a'; a line only in ver_b is 'killed-a' when its revision is in
    the ancestry of ver_a, otherwise 'new-b'.
    """
    ver_a = osutils.safe_revision_id(ver_a)
    ver_b = osutils.safe_revision_id(ver_b)
    ancestors_b = set(self.get_ancestry(ver_b, topo_sorted=False))
    ancestors_a = set(self.get_ancestry(ver_a, topo_sorted=False))

    annotated_a = self.annotate(ver_a)
    annotated_b = self.annotate(ver_b)
    plain_a = [text for (origin, text) in annotated_a]
    plain_b = [text for (origin, text) in annotated_b]
    matcher = KnitSequenceMatcher(None, plain_a, plain_b)
    blocks = matcher.get_matching_blocks()
    a_cur = b_cur = 0
    for a_start, b_start, length in blocks:
        # process all mismatched sections
        # (last mismatched section is handled because blocks always
        # includes a 0-length last block)
        for revision, text in annotated_a[a_cur:a_start]:
            if revision in ancestors_b:
                yield 'killed-b', text
            else:
                yield 'new-a', text
        for revision, text in annotated_b[b_cur:b_start]:
            if revision in ancestors_a:
                yield 'killed-a', text
            else:
                yield 'new-b', text

        # and now the matched section
        a_cur = a_start + length
        b_cur = b_start + length
        matched = zip(plain_a[a_start:a_cur], plain_b[b_start:b_cur])
        for text_a, text_b in matched:
            assert text_a == text_b
            yield "unchanged", text_a

1021

1022

799

1023

800

class _KnitComponentFile(object):

1024

801

"""One of the files used to implement a knit database"""

1025

802

1026

def __init__(self, transport, filename, mode, file_mode=None,

1027

create_parent_dir=False, dir_mode=None):

803

def __init__(self, transport, filename, mode):

1028

804

self._transport = transport

1029

805

self._filename = filename

1030

806

self._mode = mode

1031

self._file_mode = file_mode

1032

self._dir_mode = dir_mode

1033

self._create_parent_dir = create_parent_dir

1034

self._need_to_create = False

1035

807

1036

def _full_path(self):
    """Return the full path to this file.

    This is the transport's base with the filename appended.
    """
    base = self._transport.base
    return base + self._filename

808

def write_header(self):

809

if self._transport.append(self._filename, StringIO(self.HEADER)):

810

raise KnitCorrupt(self._filename, 'misaligned after writing header')

1039

811

1040

812

def check_header(self, fp):

1041

line = fp.readline()

1042

if line == '':

1043

# An empty file can actually be treated as though the file doesn't

1044

# exist yet.

1045

raise errors.NoSuchFile(self._full_path())

813

line = fp.read(len(self.HEADER))

1046

814

if line != self.HEADER:

1047

raise KnitHeaderError(badline=line,

1048

filename=self._transport.abspath(self._filename))

815

raise KnitHeaderError(badline=line)

1049

816

1050

817

def commit(self):

1051

818

"""Commit is a nop."""

1076

843

this allows updates to correct version and parent information.

1077

844

Note that the two entries may share the delta, and that successive

1078

845

annotations and references MUST point to the first entry.

1079

1080

The index file on disc contains a header, followed by one line per knit

1081

record. The same revision can be present in an index file more than once.

1082

The first occurrence gets assigned a sequence number starting from 0.

1083

1084

The format of a single line is

1085

REVISION_ID FLAGS BYTE_OFFSET LENGTH( PARENT_ID|PARENT_SEQUENCE_ID)* :\n

1086

REVISION_ID is a utf8-encoded revision id

1087

FLAGS is a comma separated list of flags about the record. Values include

1088

no-eol, line-delta, fulltext.

1089

BYTE_OFFSET is the ascii representation of the byte offset in the data file

1090

that the compressed data starts at.

1091

LENGTH is the ascii representation of the length of the data file.

1092

PARENT_ID a utf-8 revision id prefixed by a '.' that is a parent of

1093

REVISION_ID.

1094

PARENT_SEQUENCE_ID the ascii representation of the sequence number of a

1095

revision id already in the knit that is a parent of REVISION_ID.

1096

The ' :' marker is the end of record marker.

1097

1098

partial writes:

1099

when a write is interrupted to the index file, it will result in a line

1100

that does not end in ' :'. If the ' :' is not present at the end of a line,

1101

or at the end of the file, then the record that is missing it will be

1102

ignored by the parser.

1103

1104

When writing new records to the index file, the data is preceded by '\n'

1105

to ensure that records always start on new lines even if the last write was

1106

interrupted. As a result it's normal for the last line in the index to be

1107

missing a trailing newline. One can be added with no harmful effects.

1108

846

"""

1109

847

1110

HEADER = "# bzr knit index 8\n"

848

HEADER = "# bzr knit index 7\n"

1111

849

1112

850

# speed of knit parsing went from 280 ms to 280 ms with slots addition.

1113

851

# __slots__ = ['_cache', '_history', '_transport', '_filename']

1114

852

1115

853

def _cache_version(self, version_id, options, pos, size, parents):

1116

854

"""Cache a version record in the history array and index cache.

1117

1118

This is inlined into _load_data for performance. KEEP IN SYNC.

855

856

This is inlined into __init__ for performance. KEEP IN SYNC.

1119

857

(It saves 60ms, 25% of the __init__ overhead on local 4000 record

1120

858

indexes).

1121

859

"""

1122

860

# only want the _history index to reference the 1st index entry

1123

861

# for version_id

1124

862

if version_id not in self._cache:

1125

index = len(self._history)

1126

863

self._history.append(version_id)

1127

else:

1128

index = self._cache[version_id][5]

1129

self._cache[version_id] = (version_id,

1130

options,

1131

pos,

1132

size,

1133

parents,

1134

index)

864

self._cache[version_id] = (version_id, options, pos, size, parents)

1135

865

1136

def __init__(self, transport, filename, mode, create=False, file_mode=None,

1137

create_parent_dir=False, delay_create=False, dir_mode=None):

1138

_KnitComponentFile.__init__(self, transport, filename, mode,

1139

file_mode=file_mode,

1140

create_parent_dir=create_parent_dir,

1141

dir_mode=dir_mode)

866

def __init__(self, transport, filename, mode, create=False):

867

_KnitComponentFile.__init__(self, transport, filename, mode)

1142

868

self._cache = {}

1143

869

# position in _history is the 'official' index for a revision

1144

870

# but the values may have come from a newer entry.

1145

# so - wc -l of a knit index is != the number of unique names

1146

# in the knit.

871

# so - wc -l of a knit index is != the number of uniqe names

872

# in the weave.

1147

873

self._history = []

874

pb = bzrlib.ui.ui_factory.nested_progress_bar()

1148

875

try:

1149

fp = self._transport.get(self._filename)

876

count = 0

877

total = 1

1150

878

try:

1151

# _load_data may raise NoSuchFile if the target knit is

1152

# completely empty.

1153

_load_data(self, fp)

1154

finally:

1155

fp.close()

1156

except NoSuchFile:

1157

if mode != 'w' or not create:

1158

raise

1159

elif delay_create:

1160

self._need_to_create = True

879

pb.update('read knit index', count, total)

880

fp = self._transport.get(self._filename)

881

self.check_header(fp)

882

# readlines reads the whole file at once:

883

# bad for transports like http, good for local disk

884

# we save 60 ms doing this one change (

885

# from calling readline each time to calling

886

# readlines once.

887

# probably what we want for nice behaviour on

888

# http is a incremental readlines that yields, or

889

# a check for local vs non local indexes,

890

for l in fp.readlines():

891

rec = l.split()

892

count += 1

893

total += 1

894

#pb.update('read knit index', count, total)

895

# See self._parse_parents

896

parents = []

897

for value in rec[4:]:

898

if '.' == value[0]:

899

# uncompressed reference

900

parents.append(value[1:])

901

else:

902

# this is 15/4000ms faster than isinstance,

903

# (in lsprof)

904

# this function is called thousands of times a

905

# second so small variations add up.

906

assert value.__class__ is str

907

parents.append(self._history[int(value)])

908

# end self._parse_parents

909

# self._cache_version(rec[0],

910

# rec[1].split(','),

911

# int(rec[2]),

912

# int(rec[3]),

913

# parents)

914

# --- self._cache_version

915

# only want the _history index to reference the 1st

916

# index entry for version_id

917

version_id = rec[0]

918

if version_id not in self._cache:

919

self._history.append(version_id)

920

self._cache[version_id] = (version_id,

921

rec[1].split(','),

922

int(rec[2]),

923

int(rec[3]),

924

parents)

925

# --- self._cache_version

926

except NoSuchFile, e:

927

if mode != 'w' or not create:

928

raise

929

self.write_header()

930

finally:

931

pb.update('read knit index', total, total)

932

pb.finished()

933

934

def _parse_parents(self, compressed_parents):

935

"""convert a list of string parent values into version ids.

936

937

ints are looked up in the index.

938

.FOO values are ghosts and converted in to FOO.

939

940

NOTE: the function is retained here for clarity, and for possible

941

use in partial index reads. However bulk processing now has

942

it inlined in __init__ for inner-loop optimisation.

943

"""

944

result = []

945

for value in compressed_parents:

946

if value[-1] == '.':

947

# uncompressed reference

948

result.append(value[1:])

1161

949

else:

1162

self._transport.put_bytes_non_atomic(

1163

self._filename, self.HEADER, mode=self._file_mode)

950

# this is 15/4000ms faster than isinstance,

951

# this function is called thousands of times a

952

# second so small variations add up.

953

assert value.__class__ is str

954

result.append(self._history[int(value)])

955

return result

1164

956

1165

957

def get_graph(self):

1166

return [(vid, idx[4]) for vid, idx in self._cache.iteritems()]

958

graph = []

959

for version_id, index in self._cache.iteritems():

960

graph.append((version_id, index[4]))

961

return graph

1167

962

1168

def get_ancestry(self, versions, topo_sorted=True):

963

def get_ancestry(self, versions):

1169

964

"""See VersionedFile.get_ancestry."""

1170

965

# get a graph of all the mentioned versions:

1171

966

graph = {}

1172

967

pending = set(versions)

1173

cache = self._cache

1174

while pending:

968

while len(pending):

1175

969

version = pending.pop()

970

parents = self._cache[version][4]

971

# got the parents ok

1176

972

# trim ghosts

1177

try:

1178

parents = [p for p in cache[version][4] if p in cache]

1179

except KeyError:

1180

raise RevisionNotPresent(version, self._filename)

1181

# if not completed and not a ghost

1182

pending.update([p for p in parents if p not in graph])

973

parents = [parent for parent in parents if parent in self._cache]

974

for parent in parents:

975

# if not completed and not a ghost

976

if parent not in graph:

977

pending.add(parent)

1183

978

graph[version] = parents

1184

if not topo_sorted:

1185

return graph.keys()

1186

979

return topo_sort(graph.items())

1187

980

1188

981

def get_ancestry_with_ghosts(self, versions):

1189

982

"""See VersionedFile.get_ancestry_with_ghosts."""

1190

983

# get a graph of all the mentioned versions:

1191

self.check_versions_present(versions)

1192

cache = self._cache

1193

984

graph = {}

1194

985

pending = set(versions)

1195

while pending:

986

while len(pending):

1196

987

version = pending.pop()

1197

988

try:

1198

parents = cache[version][4]

989

parents = self._cache[version][4]

1199

990

except KeyError:

1200

991

# ghost, fake it

1201

992

graph[version] = []

993

pass

1202

994

else:

1203

# if not completed

1204

pending.update([p for p in parents if p not in graph])

995

# got the parents ok

996

for parent in parents:

997

if parent not in graph:

998

pending.add(parent)

1205

999

graph[version] = parents

1206

1000

return topo_sort(graph.items())

1207

1001

1218

1012

1219

1013

def lookup(self, version_id):

1220

1014

assert version_id in self._cache

1221

return self._cache[version_id][5]

1015

return self._history.index(version_id)

1222

1016

1223

1017

def _version_list_to_index(self, versions):

1224

1018

result_list = []

1225

cache = self._cache

1226

1019

for version in versions:

1227

if version in cache:

1228

# -- inlined lookup() --

1229

result_list.append(str(cache[version][5]))

1230

# -- end lookup () --

1020

if version in self._cache:

1021

result_list.append(str(self._history.index(version)))

1231

1022

else:

1232

result_list.append('.' + version)

1023

result_list.append('.' + version.encode('utf-8'))

1233

1024

return ' '.join(result_list)

1234

1025

1235

1026

def add_version(self, version_id, options, pos, size, parents):

1236

1027

"""Add a version record to the index."""

1237

self.add_versions(((version_id, options, pos, size, parents),))

1238

1239

def add_versions(self, versions):

1240

"""Add multiple versions to the index.

1241

1242

:param versions: a list of tuples:

1243

(version_id, options, pos, size, parents).

1244

"""

1245

lines = []

1246

orig_history = self._history[:]

1247

orig_cache = self._cache.copy()

1248

1249

try:

1250

for version_id, options, pos, size, parents in versions:

1251

line = "\n%s %s %s %s %s :" % (version_id,

1252

','.join(options),

1253

pos,

1254

size,

1255

self._version_list_to_index(parents))

1256

assert isinstance(line, str), \

1257

'content must be utf-8 encoded: %r' % (line,)

1258

lines.append(line)

1259

self._cache_version(version_id, options, pos, size, parents)

1260

if not self._need_to_create:

1261

self._transport.append_bytes(self._filename, ''.join(lines))

1262

else:

1263

sio = StringIO()

1264

sio.write(self.HEADER)

1265

sio.writelines(lines)

1266

sio.seek(0)

1267

self._transport.put_file_non_atomic(self._filename, sio,

1268

create_parent_dir=self._create_parent_dir,

1269

mode=self._file_mode,

1270

dir_mode=self._dir_mode)

1271

self._need_to_create = False

1272

except:

1273

# If any problems happen, restore the original values and re-raise

1274

self._history = orig_history

1275

self._cache = orig_cache

1276

raise

1028

self._cache_version(version_id, options, pos, size, parents)

1029

1030

content = "%s %s %s %s %s\n" % (version_id.encode('utf-8'),

1031

','.join(options),

1032

pos,

1033

size,

1034

self._version_list_to_index(parents))

1035

assert isinstance(content, str), 'content must be utf-8 encoded'

1036

self._transport.append(self._filename, StringIO(content))

1277

1037

1278

1038

def has_version(self, version_id):

1279

1039

"""True if the version is in the index."""

1280

return version_id in self._cache

1040

return self._cache.has_key(version_id)

1281

1041

1282

1042

def get_position(self, version_id):

1283

1043

"""Return data position and size of specified version."""

1284

entry = self._cache[version_id]

1285

return entry[2], entry[3]

1044

return (self._cache[version_id][2], \

1045

self._cache[version_id][3])

1286

1046

1287

1047

def get_method(self, version_id):

1288

1048

"""Return compression method of specified version."""

1290

1050

if 'fulltext' in options:

1291

1051

return 'fulltext'

1292

1052

else:

1293

if 'line-delta' not in options:

1294

raise errors.KnitIndexUnknownMethod(self._full_path(), options)

1053

assert 'line-delta' in options

1295

1054

return 'line-delta'

1296

1055

1297

1056

def get_options(self, version_id):

1303

1062

if parent in self._cache]

1304

1063

1305

1064

def get_parents_with_ghosts(self, version_id):

1306

"""Return parents of specified version with ghosts."""

1065

"""Return parents of specified version wth ghosts."""

1307

1066

return self._cache[version_id][4]

1308

1067

1309

1068

def check_versions_present(self, version_ids):

1310

1069

"""Check that all specified versions are present."""

1311

cache = self._cache

1312

for version_id in version_ids:

1313

if version_id not in cache:

1314

raise RevisionNotPresent(version_id, self._filename)

1070

version_ids = set(version_ids)

1071

for version_id in list(version_ids):

1072

if version_id in self._cache:

1073

version_ids.remove(version_id)

1074

if version_ids:

1075

raise RevisionNotPresent(list(version_ids)[0], self.filename)

1315

1076

1316

1077

1317

1078

class _KnitData(_KnitComponentFile):

1318

1079

"""Contents of the knit data file"""

1319

1080

1320

def __init__(self, transport, filename, mode, create=False, file_mode=None,

1321

create_parent_dir=False, delay_create=False,

1322

dir_mode=None):

1323

_KnitComponentFile.__init__(self, transport, filename, mode,

1324

file_mode=file_mode,

1325

create_parent_dir=create_parent_dir,

1326

dir_mode=dir_mode)

1081

HEADER = "# bzr knit data 7\n"

1082

1083

def __init__(self, transport, filename, mode, create=False):

1084

_KnitComponentFile.__init__(self, transport, filename, mode)

1085

self._file = None

1327

1086

self._checked = False

1328

# TODO: jam 20060713 conceptually, this could spill to disk

1329

# if the cached size gets larger than a certain amount

1330

# but it complicates the model a bit, so for now just use

1331

# a simple dictionary

1332

self._cache = {}

1333

self._do_cache = False

1334

1087

if create:

1335

if delay_create:

1336

self._need_to_create = create

1337

else:

1338

self._transport.put_bytes_non_atomic(self._filename, '',

1339

mode=self._file_mode)

1340

1341

def enable_cache(self):

1342

"""Enable caching of reads."""

1343

self._do_cache = True

1088

self._transport.put(self._filename, StringIO(''))

1089

self._records = {}

1344

1090

1345

1091

def clear_cache(self):

1346

1092

"""Clear the record cache."""

1347

self._do_cache = False

1348

self._cache = {}

1093

self._records = {}

1349

1094

1350

1095

def _open_file(self):

1351

try:

1352

return self._transport.get(self._filename)

1353

except NoSuchFile:

1354

pass

1355

return None

1096

if self._file is None:

1097

try:

1098

self._file = self._transport.get(self._filename)

1099

except NoSuchFile:

1100

pass

1101

return self._file

1356

1102

1357

1103

def _record_to_data(self, version_id, digest, lines):

1358

1104

"""Convert version_id, digest, lines into a raw data block.

1361

1107

"""

1362

1108

sio = StringIO()

1363

1109

data_file = GzipFile(None, mode='wb', fileobj=sio)

1364

1365

assert isinstance(version_id, str)

1366

1110

data_file.writelines(chain(

1367

["version %s %d %s\n" % (version_id,

1111

["version %s %d %s\n" % (version_id.encode('utf-8'),

1368

1112

len(lines),

1369

1113

digest)],

1370

1114

lines,

1371

["end %s\n" % version_id]))

1115

["end %s\n\n" % version_id.encode('utf-8')]))

1372

1116

data_file.close()

1373

1117

length= sio.tell()

1374

1118

1376

1120

return length, sio

1377

1121

1378

1122

def add_raw_record(self, raw_data):

1379

"""Append a prepared record to the data file.

1380

1381

:return: the offset in the data file raw_data was written.

1382

"""

1123

"""Append a prepared record to the data file."""

1383

1124

assert isinstance(raw_data, str), 'data must be plain bytes'

1384

if not self._need_to_create:

1385

return self._transport.append_bytes(self._filename, raw_data)

1386

else:

1387

self._transport.put_bytes_non_atomic(self._filename, raw_data,

1388

create_parent_dir=self._create_parent_dir,

1389

mode=self._file_mode,

1390

dir_mode=self._dir_mode)

1391

self._need_to_create = False

1392

return 0

1125

start_pos = self._transport.append(self._filename, StringIO(raw_data))

1126

return start_pos, len(raw_data)

1393

1127

1394

1128

def add_record(self, version_id, digest, lines):

1395

1129

"""Write new text record to disk. Returns the position in the

1396

1130

file where it was written."""

1397

1131

size, sio = self._record_to_data(version_id, digest, lines)

1132

# cache

1133

self._records[version_id] = (digest, lines)

1398

1134

# write to disk

1399

if not self._need_to_create:

1400

start_pos = self._transport.append_file(self._filename, sio)

1401

else:

1402

self._transport.put_file_non_atomic(self._filename, sio,

1403

create_parent_dir=self._create_parent_dir,

1404

mode=self._file_mode,

1405

dir_mode=self._dir_mode)

1406

self._need_to_create = False

1407

start_pos = 0

1408

if self._do_cache:

1409

self._cache[version_id] = sio.getvalue()

1135

start_pos = self._transport.append(self._filename, sio)

1410

1136

return start_pos, size

1411

1137

1412

1138

def _parse_record_header(self, version_id, raw_data):

1416

1142

as (stream, header_record)

1417

1143

"""

1418

1144

df = GzipFile(mode='rb', fileobj=StringIO(raw_data))

1419

try:

1420

rec = self._check_header(version_id, df.readline())

1421

except Exception, e:

1422

raise KnitCorrupt(self._filename,

1423

"While reading {%s} got %s(%s)"

1424

% (version_id, e.__class__.__name__, str(e)))

1145

rec = df.readline().split()

1146

if len(rec) != 4:

1147

raise KnitCorrupt(self._filename, 'unexpected number of elements in record header')

1148

if rec[1].decode('utf-8')!= version_id:

1149

raise KnitCorrupt(self._filename,

1150

'unexpected version, wanted %r, got %r' % (

1151

version_id, rec[1]))

1425

1152

return df, rec

1426

1153

1427

def _check_header(self, version_id, line):

1428

rec = line.split()

1429

if len(rec) != 4:

1430

raise KnitCorrupt(self._filename,

1431

'unexpected number of elements in record header')

1432

if rec[1] != version_id:

1433

raise KnitCorrupt(self._filename,

1434

'unexpected version, wanted %r, got %r'

1435

% (version_id, rec[1]))

1436

return rec

1437

1438

1154

def _parse_record(self, version_id, data):

1439

# profiling notes:

1440

# 4168 calls in 2880 217 internal

1441

# 4168 calls to _parse_record_header in 2121

1442

# 4168 calls to readlines in 330

1443

df = GzipFile(mode='rb', fileobj=StringIO(data))

1444

1445

try:

1446

record_contents = df.readlines()

1447

except Exception, e:

1448

raise KnitCorrupt(self._filename,

1449

"While reading {%s} got %s(%s)"

1450

% (version_id, e.__class__.__name__, str(e)))

1451

header = record_contents.pop(0)

1452

rec = self._check_header(version_id, header)

1453

1454

last_line = record_contents.pop()

1455

if len(record_contents) != int(rec[2]):

1456

raise KnitCorrupt(self._filename,

1457

'incorrect number of lines %s != %s'

1458

' for version {%s}'

1459

% (len(record_contents), int(rec[2]),

1460

version_id))

1461

if last_line != 'end %s\n' % rec[1]:

1462

raise KnitCorrupt(self._filename,

1463

'unexpected version end line %r, wanted %r'

1464

% (last_line, version_id))

1155

df, rec = self._parse_record_header(version_id, data)

1156

lines = int(rec[2])

1157

record_contents = self._read_record_contents(df, lines)

1158

l = df.readline()

1159

if l.decode('utf-8') != 'end %s\n' % version_id:

1160

raise KnitCorrupt(self._filename, 'unexpected version end line %r, wanted %r'

1161

% (l, version_id))

1465

1162

df.close()

1466

1163

return record_contents, rec[3]

1467

1164

1165

def _read_record_contents(self, df, record_lines):

1166

"""Read and return n lines from datafile."""

1167

r = []

1168

for i in range(record_lines):

1169

r.append(df.readline())

1170

return r

1171

1468

1172

def read_records_iter_raw(self, records):

1469

1173

"""Read text records from data file and yield raw data.

1470

1174

1471

1175

This unpacks enough of the text record to validate the id is

1472

1176

as expected but that's all.

1177

1178

It will actively recompress currently cached records on the

1179

basis that that is cheaper than I/O activity.

1473

1180

"""

1181

needed_records = []

1182

for version_id, pos, size in records:

1183

if version_id not in self._records:

1184

needed_records.append((version_id, pos, size))

1185

1474

1186

# setup an iterator of the external records:

1475

1187

# uses readv so nice and fast we hope.

1476

if len(records):

1188

if len(needed_records):

1477

1189

# grab the disk data needed.

1478

if self._cache:

1479

# Don't check _cache if it is empty

1480

needed_offsets = [(pos, size) for version_id, pos, size

1481

in records

1482

if version_id not in self._cache]

1483

else:

1484

needed_offsets = [(pos, size) for version_id, pos, size

1485

in records]

1486

1487

raw_records = self._transport.readv(self._filename, needed_offsets)

1190

raw_records = self._transport.readv(self._filename,

1191

[(pos, size) for version_id, pos, size in needed_records])

1488

1192

1489

1193

for version_id, pos, size in records:

1490

if version_id in self._cache:

1491

# This data has already been validated

1492

data = self._cache[version_id]

1194

if version_id in self._records:

1195

# compress a new version

1196

size, sio = self._record_to_data(version_id,

1197

self._records[version_id][0],

1198

self._records[version_id][1])

1199

yield version_id, sio.getvalue()

1493

1200

else:

1494

1201

pos, data = raw_records.next()

1495

if self._do_cache:

1496

self._cache[version_id] = data

1497

1498

1202

# validate the header

1499

1203

df, rec = self._parse_record_header(version_id, data)

1500

1204

df.close()

1501

yield version_id, data

1205

yield version_id, data

1206

1502

1207

1503

1208

def read_records_iter(self, records):

1504

1209

"""Read text records from data file and yield result.

1505

1210

1506

The result will be returned in whatever is the fastest to read.

1507

Not by the order requested. Also, multiple requests for the same

1508

record will only yield 1 response.

1509

:param records: A list of (version_id, pos, len) entries

1510

:return: Yields (version_id, contents, digest) in the order

1511

read, not the order requested

1211

Each passed record is a tuple of (version_id, pos, len) and

1212

will be read in the given order. Yields (version_id,

1213

contents, digest).

1512

1214

"""

1513

if not records:

1514

return

1515

1516

if self._cache:

1517

# Skip records we have already seen

1518

yielded_records = set()

1519

needed_records = set()

1520

for record in records:

1521

if record[0] in self._cache:

1522

if record[0] in yielded_records:

1523

continue

1524

yielded_records.add(record[0])

1525

data = self._cache[record[0]]

1526

content, digest = self._parse_record(record[0], data)

1527

yield (record[0], content, digest)

1528

else:

1529

needed_records.add(record)

1530

needed_records = sorted(needed_records, key=operator.itemgetter(1))

1531

else:

1532

needed_records = sorted(set(records), key=operator.itemgetter(1))

1533

1534

if not needed_records:

1535

return

1536

1537

# The transport optimizes the fetching as well

1538

# (ie, reads continuous ranges.)

1539

readv_response = self._transport.readv(self._filename,

1540

[(pos, size) for version_id, pos, size in needed_records])

1541

1542

for (version_id, pos, size), (pos, data) in \

1543

izip(iter(needed_records), readv_response):

1544

content, digest = self._parse_record(version_id, data)

1545

if self._do_cache:

1546

self._cache[version_id] = data

1547

yield version_id, content, digest

1215

1216

needed_records = []

1217

for version_id, pos, size in records:

1218

if version_id not in self._records:

1219

needed_records.append((version_id, pos, size))

1220

1221

if len(needed_records):

1222

# We take it that the transport optimizes the fetching as good

1223

# as possible (ie, reads continous ranges.)

1224

response = self._transport.readv(self._filename,

1225

[(pos, size) for version_id, pos, size in needed_records])

1226

1227

for (record_id, pos, size), (pos, data) in izip(iter(needed_records), response):

1228

content, digest = self._parse_record(record_id, data)

1229

self._records[record_id] = (digest, content)

1230

1231

for version_id, pos, size in records:

1232

yield version_id, copy(self._records[version_id][1]), copy(self._records[version_id][0])

1548

1233

1549

1234

def read_records(self, records):

1550

1235

"""Read records into a dictionary."""

1551

1236

components = {}

1552

for record_id, content, digest in \

1553

self.read_records_iter(records):

1237

for record_id, content, digest in self.read_records_iter(records):

1554

1238

components[record_id] = (content, digest)

1555

1239

return components

1556

1240

1558

1242

class InterKnit(InterVersionedFile):

1559

1243

"""Optimised code paths for knit to knit operations."""

1560

1244

1561

_matching_file_from_factory = KnitVersionedFile

1562

_matching_file_to_factory = KnitVersionedFile

1245

_matching_file_factory = KnitVersionedFile

1563

1246

1564

1247

@staticmethod

1565

1248

def is_compatible(source, target):

1575

1258

assert isinstance(self.source, KnitVersionedFile)

1576

1259

assert isinstance(self.target, KnitVersionedFile)

1577

1260

1578

version_ids = self._get_source_version_ids(version_ids, ignore_missing)

1261

if version_ids is None:

1262

version_ids = self.source.versions()

1263

else:

1264

if not ignore_missing:

1265

self.source._check_versions_present(version_ids)

1266

else:

1267

version_ids = set(self.source.versions()).intersection(

1268

set(version_ids))

1579

1269

1580

1270

if not version_ids:

1581

1271

return 0

1582

1272

1583

pb = ui.ui_factory.nested_progress_bar()

1273

pb = bzrlib.ui.ui_factory.nested_progress_bar()

1584

1274

try:

1585

1275

version_ids = list(version_ids)

1586

1276

if None in version_ids:

1612

1302

needed_versions.update(new_parents.difference(this_versions))

1613

1303

mismatched_versions.add(version)

1614

1304

1615

if not needed_versions and not mismatched_versions:

1305

if not needed_versions and not cross_check_versions:

1616

1306

return 0

1617

1307

full_list = topo_sort(self.source.get_graph())

1618

1308

1631

1321

# if source has the parent, we must :

1632

1322

# * already have it or

1633

1323

# * have it scheduled already

1634

# otherwise we don't care

1324

# otherwise we dont care

1635

1325

assert (self.target.has_version(parent) or

1636

1326

parent in copy_set or

1637

1327

not self.source.has_version(parent))

1643

1333

# data suck the join:

1644

1334

count = 0

1645

1335

total = len(version_list)

1646

raw_datum = []

1647

raw_records = []

1336

# we want the raw gzip for bulk copying, but the record validated

1337

# just enough to be sure its the right one.

1338

# TODO: consider writev or write combining to reduce

1339

# death of a thousand cuts feeling.

1648

1340

for (version_id, raw_data), \

1649

1341

(version_id2, options, parents) in \

1650

1342

izip(self.source._data.read_records_iter_raw(copy_queue_records),

1652

1344

assert version_id == version_id2, 'logic error, inconsistent results'

1653

1345

count = count + 1

1654

1346

pb.update("Joining knit", count, total)

1655

raw_records.append((version_id, options, parents, len(raw_data)))

1656

raw_datum.append(raw_data)

1657

self.target._add_raw_records(raw_records, ''.join(raw_datum))

1347

pos, size = self.target._data.add_raw_record(raw_data)

1348

self.target._index.add_version(version_id, options, pos, size, parents)

1658

1349

1659

1350

for version in mismatched_versions:

1660

1351

# FIXME RBC 20060309 is this needed?

1672

1363

InterVersionedFile.register_optimiser(InterKnit)

1673

1364

1674

1365

1675

class WeaveToKnit(InterVersionedFile):

1676

"""Optimised code paths for weave to knit operations."""

1677

1678

_matching_file_from_factory = bzrlib.weave.WeaveFile

1679

_matching_file_to_factory = KnitVersionedFile

1680

1681

@staticmethod

1682

def is_compatible(source, target):

1683

"""Be compatible with weaves to knits."""

1684

try:

1685

return (isinstance(source, bzrlib.weave.Weave) and

1686

isinstance(target, KnitVersionedFile))

1687

except AttributeError:

1688

return False

1689

1690

def join(self, pb=None, msg=None, version_ids=None, ignore_missing=False):

1691

"""See InterVersionedFile.join."""

1692

assert isinstance(self.source, bzrlib.weave.Weave)

1693

assert isinstance(self.target, KnitVersionedFile)

1694

1695

version_ids = self._get_source_version_ids(version_ids, ignore_missing)

1696

1697

if not version_ids:

1698

return 0

1699

1700

pb = ui.ui_factory.nested_progress_bar()

1701

try:

1702

version_ids = list(version_ids)

1703

1704

self.source_ancestry = set(self.source.get_ancestry(version_ids))

1705

this_versions = set(self.target._index.get_versions())

1706

needed_versions = self.source_ancestry - this_versions

1707

cross_check_versions = self.source_ancestry.intersection(this_versions)

1708

mismatched_versions = set()

1709

for version in cross_check_versions:

1710

# scan to include needed parents.

1711

n1 = set(self.target.get_parents_with_ghosts(version))

1712

n2 = set(self.source.get_parents(version))

1713

# if all of n2's parents are in n1, then it's fine.

1714

if n2.difference(n1):

1715

# FIXME TEST this check for cycles being introduced works

1716

# the logic is we have a cycle if in our graph we are an

1717

# ancestor of any of the n2 revisions.

1718

for parent in n2:

1719

if parent in n1:

1720

# safe

1721

continue

1722

else:

1723

parent_ancestors = self.source.get_ancestry(parent)

1724

if version in parent_ancestors:

1725

raise errors.GraphCycleError([parent, version])

1726

# ensure this parent will be available later.

1727

new_parents = n2.difference(n1)

1728

needed_versions.update(new_parents.difference(this_versions))

1729

mismatched_versions.add(version)

1730

1731

if not needed_versions and not mismatched_versions:

1732

return 0

1733

full_list = topo_sort(self.source.get_graph())

1734

1735

version_list = [i for i in full_list if (not self.target.has_version(i)

1736

and i in needed_versions)]

1737

1738

# do the join:

1739

count = 0

1740

total = len(version_list)

1741

for version_id in version_list:

1742

pb.update("Converting to knit", count, total)

1743

parents = self.source.get_parents(version_id)

1744

# check that it will be a consistent copy:

1745

for parent in parents:

1746

# if source has the parent, we must already have it

1747

assert (self.target.has_version(parent))

1748

self.target.add_lines(

1749

version_id, parents, self.source.get_lines(version_id))

1750

count = count + 1

1751

1752

for version in mismatched_versions:

1753

# FIXME RBC 20060309 is this needed?

1754

n1 = set(self.target.get_parents_with_ghosts(version))

1755

n2 = set(self.source.get_parents(version))

1756

# write a combined record to our history preserving the current

1757

# parents as first in the list

1758

new_parents = self.target.get_parents_with_ghosts(version) + list(n2.difference(n1))

1759

self.target.fix_parents(version, new_parents)

1760

return count

1761

finally:

1762

pb.finished()

1763

1764

1765

InterVersionedFile.register_optimiser(WeaveToKnit)

1766

1767

1768

class KnitSequenceMatcher(difflib.SequenceMatcher):

1366

# make GzipFile faster:

1367

import zlib

1368

class GzipFile(gzip.GzipFile):

1369

"""Knit tuned version of GzipFile.

1370

1371

This is based on the following lsprof stats:

1372

python 2.4 stock GzipFile write:

1373

58971 0 5644.3090 2721.4730 gzip:193(write)

1374

+58971 0 1159.5530 1159.5530 +<built-in method compress>

1375

+176913 0 987.0320 987.0320 +<len>

1376

+58971 0 423.1450 423.1450 +<zlib.crc32>

1377

+58971 0 353.1060 353.1060 +<method 'write' of 'cStringIO.

1378

StringO' objects>

1379

tuned GzipFile write:

1380

58971 0 4477.2590 2103.1120 bzrlib.knit:1250(write)

1381

+58971 0 1297.7620 1297.7620 +<built-in method compress>

1382

+58971 0 406.2160 406.2160 +<zlib.crc32>

1383

+58971 0 341.9020 341.9020 +<method 'write' of 'cStringIO.

1384

StringO' objects>

1385

+58971 0 328.2670 328.2670 +<len>

1386

1387

1388

Yes, its only 1.6 seconds, but they add up.

1389

"""

1390

1391

def write(self, data):

1392

if self.mode != gzip.WRITE:

1393

import errno

1394

raise IOError(errno.EBADF, "write() on read-only GzipFile object")

1395

1396

if self.fileobj is None:

1397

raise ValueError, "write() on closed GzipFile object"

1398

data_len = len(data)

1399

if data_len > 0:

1400

self.size = self.size + data_len

1401

self.crc = zlib.crc32(data, self.crc)

1402

self.fileobj.write( self.compress.compress(data) )

1403

self.offset += data_len

1404

1405

def writelines(self, lines):

1406

# profiling indicated a significant overhead

1407

# calling write for each line.

1408

# this batch call is a lot faster :).

1409

# (4 seconds to 1 seconds for the sample upgrades I was testing).

1410

self.write(''.join(lines))

1411

1412

1413

class SequenceMatcher(difflib.SequenceMatcher):

1769

1414

"""Knit tuned sequence matcher.

1770

1415

1771

1416

This is based on profiling of difflib which indicated some improvements

1842

1487

j2lenget = j2len.get

1843

1488

newj2len = {}

1844

1489

1845

# changing b2j.get(a[i], nothing) to a try:KeyError pair produced the

1490

# changing b2j.get(a[i], nothing) to a try:Keyerror pair produced the

1846

1491

# following improvement

1847

1492

# 704 0 4650.5320 2620.7410 bzrlib.knit:1336(find_longest_match)

1848

1493

# +326674 0 1655.1210 1655.1210 +<method 'get' of 'dict' objects>

1898

1543

1899

1544

return besti, bestj, bestsize

1900

1545

1901

1902

try:

1903

from bzrlib._knit_load_data_c import _load_data_c as _load_data

1904

except ImportError:

1905

from bzrlib._knit_load_data_py import _load_data_py as _load_data

Older »