~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/fetch.py

Committer: Robey Pointer
Date: 2006-09-08 18:46:29 UTC
mto: This revision was merged to the branch mainline in revision 1996.
Revision ID: robey@lag.net-20060908184629-e3fc4c61ca21508c

pychecker is on crack; go back to using 'is None'.

files added:
BRANCH.TODO

COPYING.txt

bzr.ico

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/decorators.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/ignores.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/sign_my_commits.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned

bzrlib/symbol_versioning.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/transform.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/readonly.py

bzrlib/transport/ssh.py

bzrlib/tuned_gzip.py

bzrlib/urlutils.py

bzrlib/version.py

bzrlib/versionedfile.py

bzrlib/weave_commands.py

doc/README.1st

doc/configuration.txt

doc/default.css

doc/index.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/using_aliases.txt

generate_docs.py

profile_imports.py

tools/__init__.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/rst2html.py

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/ostools.py

tools/win32/start_bzr.bat

files removed:
bzrlib/clone.py

bzrlib/merge_core.py

bzrlib/tests/test_reweave.py

bzrlib/util/configobj/validate.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

files renamed:
bzrlib/changeset.py => bzrlib/bundle/__init__.py

bzrlib/store/weave.py => bzrlib/store/versioned/__init__.py

bzrlib/tests/test_annotate.py => bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/test_revision_info.py => bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/test_status.py => bzrlib/tests/blackbox/test_status.py

bzrlib/tests/test_uncommit.py => bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/test_branch.py => bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/test_parent.py => bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/test_revprops.py => bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/test_sftp.py => bzrlib/tests/test_sftp_transport.py

bzrlib/transport/http.py => bzrlib/transport/http/__init__.py

bzrlib/xml.py => bzrlib/xml_serializer.py

tutorial.txt => doc/tutorial.txt

bzr_man.py => tools/doc_generate/autodoc_man.py

files modified:
.bzrignore

HACKING

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_store.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/newinventory.py

contrib/pwk

setup.py *

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/fetch.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

from copy import copy

import os

from cStringIO import StringIO

import bzrlib

import bzrlib.errors as errors

from bzrlib.errors import (InstallFailed, NoSuchRevision, WeaveError,

MissingText)

from bzrlib.trace import mutter, note, warning

from bzrlib.branch import Branch

from bzrlib.progress import ProgressBar

from bzrlib.xml5 import serializer_v5

from bzrlib.osutils import sha_string, split_lines

"""Copying of history from one branch to another.

add a revision to the store until everything it refers to is also

stored, so that if a revision is present we can totally recreate it.

However, we can't know what files are included in a revision until we

read its inventory. Therefore, we first pull the XML and hold it in

memory until we've updated all of the files referenced.

read its inventory. So we query the inventory store of the source for

the ids we need, and then pull those ids and finally actually join

the inventories.

"""

import bzrlib

import bzrlib.errors as errors

from bzrlib.errors import (InstallFailed,

)

from bzrlib.trace import mutter

from bzrlib.progress import ProgressPhase

from bzrlib.revision import NULL_REVISION

from bzrlib.symbol_versioning import (deprecated_function,

deprecated_method,

zero_eight,

)

# TODO: Avoid repeatedly opening weaves so many times.

# XXX: This doesn't handle ghost (not present in branch) revisions at

# and add in all file versions

@deprecated_function(zero_eight)

def greedy_fetch(to_branch, from_branch, revision=None, pb=None):

"""Legacy API, please see branch.fetch(from_branch, last_revision, pb)."""

f = Fetcher(to_branch, from_branch, revision, pb)

return f.count_copied, f.failed_revisions

class Fetcher(object):

"""Pull revisions and texts from one branch to another.

This doesn't update the destination's history; that can be done

separately if desired.

revision_limit

If set, pull only up to this revision_id.

After running:

last_revision -- if last_revision

is given it will be that, otherwise the last revision of

from_branch

fetch = greedy_fetch

class RepoFetcher(object):

"""Pull revisions and texts from one repository to another.

last_revision

if set, try to limit to the data this revision references.

after running:

count_copied -- number of revisions copied

count_weaves -- number of file weaves copied

This should not be used directory, its essential a object to encapsulate

the logic in InterRepository.fetch().

"""

def __init__(self, to_branch, from_branch, last_revision=None, pb=None):

if to_branch == from_branch:

raise Exception("can't fetch from a branch to itself")

self.to_branch = to_branch

self.to_weaves = to_branch.weave_store

self.to_control = to_branch.control_weaves

self.from_branch = from_branch

self.from_weaves = from_branch.weave_store

self.from_control = from_branch.control_weaves

def __init__(self, to_repository, from_repository, last_revision=None, pb=None):

# result variables.

self.failed_revisions = []

100

self.count_copied = 0

if to_repository.control_files._transport.base == from_repository.control_files._transport.base:

# check that last_revision is in 'from' and then return a no-operation.

if last_revision not in (None, NULL_REVISION):

from_repository.get_revision(last_revision)

return

self.to_repository = to_repository

self.from_repository = from_repository

# must not mutate self._last_revision as its potentially a shared instance

self._last_revision = last_revision

if pb is None:

100

self.pb = bzrlib.ui.ui_factory.nested_progress_bar()

101

self.nested_pb = self.pb

102

else:

103

self.pb = pb

104

self.nested_pb = None

105

self.from_repository.lock_read()

106

try:

107

self.to_repository.lock_write()

108

try:

109

self.__fetch()

110

finally:

111

if self.nested_pb is not None:

112

self.nested_pb.finished()

113

self.to_repository.unlock()

114

finally:

115

self.from_repository.unlock()

116

117

def __fetch(self):

118

"""Primary worker function.

119

120

This initialises all the needed variables, and then fetches the

121

requested revisions, finally clearing the progress bar.

122

"""

123

self.to_weaves = self.to_repository.weave_store

124

self.to_control = self.to_repository.control_weaves

125

self.from_weaves = self.from_repository.weave_store

126

self.from_control = self.from_repository.control_weaves

101

127

self.count_total = 0

102

self.count_weaves = 0

103

self.copied_file_ids = set()

104

128

self.file_ids_names = {}

105

if pb is None:

106

self.pb = bzrlib.ui.ui_factory.progress_bar()

107

else:

108

self.pb = pb

109

self.from_branch.lock_read()

129

pp = ProgressPhase('Fetch phase', 4, self.pb)

110

130

try:

111

self._fetch_revisions(last_revision)

131

pp.next_phase()

132

revs = self._revids_to_fetch()

133

# something to do ?

134

if revs:

135

pp.next_phase()

136

self._fetch_weave_texts(revs)

137

pp.next_phase()

138

self._fetch_inventory_weave(revs)

139

pp.next_phase()

140

self._fetch_revision_texts(revs)

141

self.count_copied += len(revs)

112

142

finally:

113

self.from_branch.unlock()

114

143

self.pb.clear()

115

144

116

def _fetch_revisions(self, last_revision):

117

self.last_revision = self._find_last_revision(last_revision)

118

mutter('fetch up to rev {%s}', self.last_revision)

119

if (self.last_revision is not None and

120

self.to_branch.has_revision(self.last_revision)):

121

return

122

try:

123

revs_to_fetch = self._compare_ancestries()

124

except WeaveError:

125

raise InstallFailed([self.last_revision])

126

self._copy_revisions(revs_to_fetch)

127

self.new_ancestry = revs_to_fetch

128

129

def _find_last_revision(self, last_revision):

130

"""Find the limiting source revision.

131

132

Every ancestor of that revision will be merged across.

133

134

Returns the revision_id, or returns None if there's no history

135

in the source branch."""

136

if last_revision:

137

return last_revision

138

self.pb.update('get source history')

139

from_history = self.from_branch.revision_history()

140

self.pb.update('get destination history')

141

if from_history:

142

return from_history[-1]

143

else:

144

return None # no history in the source branch

145

def _revids_to_fetch(self):

146

mutter('fetch up to rev {%s}', self._last_revision)

147

if self._last_revision is NULL_REVISION:

148

# explicit limit of no revisions needed

149

return None

150

if (self._last_revision is not None and

151

self.to_repository.has_revision(self._last_revision)):

152

return None

145

153

146

147

def _compare_ancestries(self):

148

"""Get a list of revisions that must be copied.

149

150

That is, every revision that's in the ancestry of the source

151

branch and not in the destination branch."""

152

self.pb.update('get source ancestry')

153

self.from_ancestry = self.from_branch.get_ancestry(self.last_revision)

154

155

dest_last_rev = self.to_branch.last_revision()

156

self.pb.update('get destination ancestry')

157

if dest_last_rev:

158

dest_ancestry = self.to_branch.get_ancestry(dest_last_rev)

159

else:

160

dest_ancestry = []

161

ss = set(dest_ancestry)

162

to_fetch = []

163

for rev_id in self.from_ancestry:

164

if rev_id not in ss:

165

to_fetch.append(rev_id)

166

mutter('need to get revision {%s}', rev_id)

167

mutter('need to get %d revisions in total', len(to_fetch))

168

self.count_total = len(to_fetch)

169

return to_fetch

170

171

def _copy_revisions(self, revs_to_fetch):

172

i = 0

173

for rev_id in revs_to_fetch:

174

i += 1

175

if rev_id is None:

176

continue

177

if self.to_branch.has_revision(rev_id):

178

continue

179

self.pb.update('copy revision', i, self.count_total)

180

self._copy_one_revision(rev_id)

181

self.count_copied += 1

182

183

184

def _copy_one_revision(self, rev_id):

185

"""Copy revision and everything referenced by it."""

186

mutter('copying revision {%s}', rev_id)

187

rev_xml = self.from_branch.get_revision_xml(rev_id)

188

inv_xml = self.from_branch.get_inventory_xml(rev_id)

189

rev = serializer_v5.read_revision_from_string(rev_xml)

190

inv = serializer_v5.read_inventory_from_string(inv_xml)

191

assert rev.revision_id == rev_id

192

assert rev.inventory_sha1 == sha_string(inv_xml)

193

mutter(' commiter %s, %d parents',

194

rev.committer,

195

len(rev.parent_ids))

196

self._copy_new_texts(rev_id, inv)

197

parents = rev.parent_ids

198

new_parents = copy(parents)

199

for parent in parents:

200

if not self.to_branch.has_revision(parent):

201

new_parents.pop(new_parents.index(parent))

202

self._copy_inventory(rev_id, inv_xml, new_parents)

203

self.to_branch.revision_store.add(StringIO(rev_xml), rev_id)

204

mutter('copied revision %s', rev_id)

205

206

def _copy_inventory(self, rev_id, inv_xml, parent_ids):

207

self.to_control.add_text('inventory', rev_id,

208

split_lines(inv_xml), parent_ids,

209

self.to_branch.get_transaction())

210

211

def _copy_new_texts(self, rev_id, inv):

212

"""Copy any new texts occuring in this revision."""

213

# TODO: Rather than writing out weaves every time, hold them

214

# in memory until everything's done? But this way is nicer

215

# if it's interrupted.

216

for path, ie in inv.iter_entries():

217

self._copy_one_weave(rev_id, ie.file_id, ie.revision)

218

219

def _copy_one_weave(self, rev_id, file_id, text_revision):

220

"""Copy one file weave, esuring the result contains text_revision."""

221

# check if the revision is already there

222

if file_id in self.file_ids_names.keys( ) and \

223

text_revision in self.file_ids_names[file_id]:

224

return

225

to_weave = self.to_weaves.get_weave_or_empty(file_id,

226

self.to_branch.get_transaction())

227

if not file_id in self.file_ids_names.keys( ):

228

self.file_ids_names[file_id] = to_weave.names( )

229

if text_revision in to_weave:

230

return

231

from_weave = self.from_weaves.get_weave(file_id,

232

self.from_branch.get_transaction())

233

if text_revision not in from_weave:

234

raise MissingText(self.from_branch, text_revision, file_id)

235

mutter('copy file {%s} modified in {%s}', file_id, rev_id)

236

237

if to_weave.numversions() > 0:

238

# destination has contents, must merge

154

try:

155

return self.to_repository.missing_revision_ids(self.from_repository,

156

self._last_revision)

157

except errors.NoSuchRevision:

158

raise InstallFailed([self._last_revision])

159

160

def _fetch_weave_texts(self, revs):

161

texts_pb = bzrlib.ui.ui_factory.nested_progress_bar()

162

try:

163

# fileids_altered_by_revision_ids requires reading the inventory

164

# weave, we will need to read the inventory weave again when

165

# all this is done, so enable caching for that specific weave

166

inv_w = self.from_repository.get_inventory_weave()

167

inv_w.enable_cache()

168

file_ids = self.from_repository.fileids_altered_by_revision_ids(revs)

169

count = 0

170

num_file_ids = len(file_ids)

171

for file_id, required_versions in file_ids.items():

172

texts_pb.update("fetch texts", count, num_file_ids)

173

count +=1

174

to_weave = self.to_weaves.get_weave_or_empty(file_id,

175

self.to_repository.get_transaction())

176

from_weave = self.from_weaves.get_weave(file_id,

177

self.from_repository.get_transaction())

178

# we fetch all the texts, because texts do

179

# not reference anything, and its cheap enough

180

to_weave.join(from_weave, version_ids=required_versions)

181

# we don't need *all* of this data anymore, but we dont know

182

# what we do. This cache clearing will result in a new read

183

# of the knit data when we do the checkout, but probably we

184

# want to emit the needed data on the fly rather than at the

185

# end anyhow.

186

# the from weave should know not to cache data being joined,

187

# but its ok to ask it to clear.

188

from_weave.clear_cache()

189

to_weave.clear_cache()

190

finally:

191

texts_pb.finished()

192

193

def _fetch_inventory_weave(self, revs):

194

pb = bzrlib.ui.ui_factory.nested_progress_bar()

195

try:

196

pb.update("fetch inventory", 0, 2)

197

to_weave = self.to_control.get_weave('inventory',

198

self.to_repository.get_transaction())

199

200

child_pb = bzrlib.ui.ui_factory.nested_progress_bar()

239

201

try:

240

to_weave.join(from_weave)

241

except errors.WeaveParentMismatch:

242

to_weave.reweave(from_weave)

243

else:

244

# destination is empty, just replace it

245

to_weave = from_weave.copy( )

246

self.to_weaves.put_weave(file_id, to_weave,

247

self.to_branch.get_transaction())

248

self.count_weaves += 1

249

self.copied_file_ids.add(file_id)

250

self.file_ids_names[file_id] = to_weave.names()

251

mutter('copied file {%s}', file_id)

252

253

254

fetch = Fetcher

202

# just merge, this is optimisable and its means we don't

203

# copy unreferenced data such as not-needed inventories.

204

pb.update("fetch inventory", 1, 3)

205

from_weave = self.from_repository.get_inventory_weave()

206

pb.update("fetch inventory", 2, 3)

207

# we fetch only the referenced inventories because we do not

208

# know for unselected inventories whether all their required

209

# texts are present in the other repository - it could be

210

# corrupt.

211

to_weave.join(from_weave, pb=child_pb, msg='merge inventory',

212

version_ids=revs)

213

from_weave.clear_cache()

214

finally:

215

child_pb.finished()

216

finally:

217

pb.finished()

218

219

220

class GenericRepoFetcher(RepoFetcher):

221

"""This is a generic repo to repo fetcher.

222

223

This makes minimal assumptions about repo layout and contents.

224

It triggers a reconciliation after fetching to ensure integrity.

225

"""

226

227

def _fetch_revision_texts(self, revs):

228

"""Fetch revision object texts"""

229

rev_pb = bzrlib.ui.ui_factory.nested_progress_bar()

230

try:

231

to_txn = self.to_transaction = self.to_repository.get_transaction()

232

count = 0

233

total = len(revs)

234

to_store = self.to_repository._revision_store

235

for rev in revs:

236

pb = bzrlib.ui.ui_factory.nested_progress_bar()

237

try:

238

pb.update('copying revisions', count, total)

239

try:

240

sig_text = self.from_repository.get_signature_text(rev)

241

to_store.add_revision_signature_text(rev, sig_text, to_txn)

242

except errors.NoSuchRevision:

243

# not signed.

244

pass

245

to_store.add_revision(self.from_repository.get_revision(rev),

246

to_txn)

247

count += 1

248

finally:

249

pb.finished()

250

# fixup inventory if needed:

251

# this is expensive because we have no inverse index to current ghosts.

252

# but on local disk its a few seconds and sftp push is already insane.

253

# so we just-do-it.

254

# FIXME: repository should inform if this is needed.

255

self.to_repository.reconcile()

256

finally:

257

rev_pb.finished()

258

259

260

class KnitRepoFetcher(RepoFetcher):

261

"""This is a knit format repository specific fetcher.

262

263

This differs from the GenericRepoFetcher by not doing a

264

reconciliation after copying, and using knit joining to

265

copy revision texts.

266

"""

267

268

def _fetch_revision_texts(self, revs):

269

# may need to be a InterRevisionStore call here.

270

from_transaction = self.from_repository.get_transaction()

271

to_transaction = self.to_repository.get_transaction()

272

to_sf = self.to_repository._revision_store.get_signature_file(

273

to_transaction)

274

from_sf = self.from_repository._revision_store.get_signature_file(

275

from_transaction)

276

to_sf.join(from_sf, version_ids=revs, ignore_missing=True)

277

to_rf = self.to_repository._revision_store.get_revision_file(

278

to_transaction)

279

from_rf = self.from_repository._revision_store.get_revision_file(

280

from_transaction)

281

to_rf.join(from_rf, version_ids=revs)

282

283

284

class Fetcher(object):

285

"""Backwards compatibility glue for branch.fetch()."""

286

287

@deprecated_method(zero_eight)

288

def __init__(self, to_branch, from_branch, last_revision=None, pb=None):

289

"""Please see branch.fetch()."""

290

to_branch.fetch(from_branch, last_revision, pb)

Older »