~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/fetch.py

Committer: Canonical.com Patch Queue Manager
Date: 2007-12-20 16:16:34 UTC
mfrom: (3123.5.18 hardlinks)
Revision ID: pqm@pqm.ubuntu.com-20071220161634-2kcjb650o21ydko4

Accelerate build_tree using similar workingtrees (abentley)

files added:
bzrlib/plugins/multiparent.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_escaped_store.py

bzrlib/xml6.py

index.txt

tools/win32/survey.txt

files removed:
bzrlib/_btree_serializer_c.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_walkdirs_win32.h

bzrlib/_walkdirs_win32.pyx

bzrlib/btree_index.py

bzrlib/chunk_writer.py

bzrlib/directory_service.py

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/push.py

bzrlib/rules.py

bzrlib/smart/message.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_stacking.py

bzrlib/tests/file_utils.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/per_repository_reference

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_add_inventory.py

bzrlib/tests/per_repository_reference/test_add_revision.py

bzrlib/tests/per_repository_reference/test_add_signature_text.py

bzrlib/tests/per_repository_reference/test_all_revision_ids.py

bzrlib/tests/per_repository_reference/test_break_lock.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/repository_implementations/test_add_fallback_repository.py

bzrlib/tests/repository_implementations/test_get_parent_map.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_chunk_writer.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_iter_search_rules.py

bzrlib/transport/nosmart.py

bzrlib/xml5.py

bzrlib/xml6.py

contrib/bash/bzrbashprompt.sh

contrib/bzr_access

doc/developers/development-repo.txt

doc/developers/integration.txt

doc/developers/inventory.txt

doc/developers/lca-merge.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/tortoise-strategy.txt

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide/testing.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/zen.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

tools/package_mf.py

tools/win32/run_script.py

files renamed:
bzrlib/plugins/launchpad/lp_directory.py => bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/test_lp_directory.py => bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/tests/http_utils.py => bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/http_server.py => bzrlib/tests/HttpServer.py

bzrlib/tests/test_revisionspec.py => bzrlib/tests/test_revisionnamespaces.py

bzrlib/xml8.py => bzrlib/xml5.py

doc/en/user-guide/part2_intro.txt => doc/en/user-guide/best_practice_intro.txt

files modified:
.bzrignore

Makefile

NEWS

README

bzrlib/__init__.py

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_py.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/fetch.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/conflicts.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/hooks.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/ftp_server.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_info.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml_serializer.py

doc/default.css

doc/developers/HACKING.txt

doc/developers/authentication-ring.txt

doc/developers/index.txt

doc/developers/network-protocol.txt

doc/developers/repository.txt

doc/en/mini-tutorial/index.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/version_info.txt

doc/index.txt

setup.py

tools/doc_generate/autodoc_rstx.py

tools/rst2html.py

tools/win32/bzr.iss.cog

Show diffs side-by-side

added added

removed removed

bzrlib/fetch.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

stored, so that if a revision is present we can totally recreate it.

However, we can't know what files are included in a revision until we

read its inventory. So we query the inventory store of the source for

the ids we need, and then pull those ids and then return to the inventories.

the ids we need, and then pull those ids and finally actually join

the inventories.

"""

import operator

import bzrlib

import bzrlib.errors as errors

from bzrlib.errors import InstallFailed

from bzrlib.errors import (InstallFailed,

)

from bzrlib.progress import ProgressPhase

from bzrlib.revision import is_null, NULL_REVISION

from bzrlib.symbol_versioning import (deprecated_function,

deprecated_method,

)

from bzrlib.tsort import topo_sort

from bzrlib.trace import mutter

import bzrlib.ui

from bzrlib.versionedfile import filter_absent, FulltextContentFactory

from bzrlib.lazy_import import lazy_import

# TODO: Avoid repeatedly opening weaves so many times.

This should not be used directly; it's essentially an object to encapsulate

the logic in InterRepository.fetch().

"""

def __init__(self, to_repository, from_repository, last_revision=None, pb=None,

find_ghosts=True):

"""Create a repo fetcher.

:param find_ghosts: If True search the entire history for ghosts.

"""

def __init__(self, to_repository, from_repository, last_revision=None, pb=None):

# result variables.

self.failed_revisions = []

self.count_copied = 0

self.from_repository = from_repository

# must not mutate self._last_revision as it's potentially a shared instance

self._last_revision = last_revision

self.find_ghosts = find_ghosts

if pb is None:

self.pb = bzrlib.ui.ui_factory.nested_progress_bar()

100

self.nested_pb = self.pb

114

107

else:

115

108

self.to_repository.commit_write_group()

116

109

finally:

117

try:

118

if self.nested_pb is not None:

119

self.nested_pb.finished()

120

finally:

121

self.to_repository.unlock()

110

if self.nested_pb is not None:

111

self.nested_pb.finished()

112

self.to_repository.unlock()

122

113

finally:

123

114

self.from_repository.unlock()

124

115

128

119

This initialises all the needed variables, and then fetches the

129

120

requested revisions, finally clearing the progress bar.

130

121

"""

122

self.to_weaves = self.to_repository.weave_store

123

self.from_weaves = self.from_repository.weave_store

131

124

self.count_total = 0

132

125

self.file_ids_names = {}

133

126

pp = ProgressPhase('Transferring', 4, self.pb)

134

127

try:

135

128

pp.next_phase()

136

search = self._revids_to_fetch()

137

if search is None:

129

revs = self._revids_to_fetch()

130

if revs is None:

138

131

return

139

if getattr(self, '_fetch_everything_for_search', None) is not None:

140

self._fetch_everything_for_search(search, pp)

141

else:

142

# backward compatibility

143

self._fetch_everything_for_revisions(search.get_keys, pp)

132

self._fetch_everything_for_revisions(revs, pp)

144

133

finally:

145

134

self.pb.clear()

146

135

147

def _fetch_everything_for_search(self, search, pp):

136

def _fetch_everything_for_revisions(self, revs, pp):

148

137

"""Fetch all data for the given set of revisions."""

149

138

# The first phase is "file". We pass the progress bar for it directly

150

139

# into item_keys_introduced_by, which has more information about how

157

146

phase = 'file'

158

147

pb = bzrlib.ui.ui_factory.nested_progress_bar()

159

148

try:

160

revs = search.get_keys()

161

graph = self.from_repository.get_graph()

162

revs = list(graph.iter_topo_order(revs))

163

data_to_fetch = self.from_repository.item_keys_introduced_by(revs,

164

pb)

165

text_keys = []

149

data_to_fetch = self.from_repository.item_keys_introduced_by(revs, pb)

166

150

for knit_kind, file_id, revisions in data_to_fetch:

167

151

if knit_kind != phase:

168

152

phase = knit_kind

171

155

pp.next_phase()

172

156

pb = bzrlib.ui.ui_factory.nested_progress_bar()

173

157

if knit_kind == "file":

174

# Accumulate file texts

175

text_keys.extend([(file_id, revision) for revision in

176

revisions])

158

self._fetch_weave_text(file_id, revisions)

177

159

elif knit_kind == "inventory":

178

# Now copy the file texts.

179

to_texts = self.to_repository.texts

180

from_texts = self.from_repository.texts

181

to_texts.insert_record_stream(from_texts.get_record_stream(

182

text_keys, self.to_repository._fetch_order,

183

not self.to_repository._fetch_uses_deltas))

184

# Cause an error if a text occurs after we have done the

185

# copy.

186

text_keys = None

187

# Before we process the inventory we generate the root

188

# texts (if necessary) so that the inventories references

189

# will be valid.

160

# XXX:

161

# Once we've processed all the files, then we generate the root

162

# texts (if necessary), then we process the inventory. It's a

163

# bit distasteful to have knit_kind == "inventory" mean this,

164

# perhaps it should happen on the first non-"file" knit, in case

165

# it's not always inventory?

190

166

self._generate_root_texts(revs)

191

# NB: This currently reopens the inventory weave in source;

192

# using a single stream interface instead would avoid this.

193

167

self._fetch_inventory_weave(revs, pb)

194

168

elif knit_kind == "signatures":

195

169

# Nothing to do here; this will be taken care of when

199

173

self._fetch_revision_texts(revs, pb)

200

174

else:

201

175

raise AssertionError("Unknown knit kind %r" % knit_kind)

202

if self.to_repository._fetch_reconcile:

203

self.to_repository.reconcile()

204

176

finally:

205

177

if pb is not None:

206

178

pb.finished()

219

191

if (self._last_revision is not None and

220

192

self.to_repository.has_revision(self._last_revision)):

221

193

return None

194

222

195

try:

223

return self.to_repository.search_missing_revision_ids(

224

self.from_repository, self._last_revision,

225

find_ghosts=self.find_ghosts)

226

except errors.NoSuchRevision, e:

196

# XXX: this gets the full graph on both sides, and will make sure

197

# that ghosts are filled whether or not you care about them.

198

return self.to_repository.missing_revision_ids(self.from_repository,

199

self._last_revision)

200

except errors.NoSuchRevision:

227

201

raise InstallFailed([self._last_revision])

228

202

203

def _fetch_weave_text(self, file_id, required_versions):

204

to_weave = self.to_weaves.get_weave_or_empty(file_id,

205

self.to_repository.get_transaction())

206

from_weave = self.from_weaves.get_weave(file_id,

207

self.from_repository.get_transaction())

208

# we fetch all the texts, because texts do

209

# not reference anything, and its cheap enough

210

to_weave.join(from_weave, version_ids=required_versions)

211

# we don't need *all* of this data anymore, but we dont know

212

# what we do. This cache clearing will result in a new read

213

# of the knit data when we do the checkout, but probably we

214

# want to emit the needed data on the fly rather than at the

215

# end anyhow.

216

# the from weave should know not to cache data being joined,

217

# but its ok to ask it to clear.

218

from_weave.clear_cache()

219

to_weave.clear_cache()

220

229

221

def _fetch_inventory_weave(self, revs, pb):

230

222

pb.update("fetch inventory", 0, 2)

231

to_weave = self.to_repository.inventories

223

to_weave = self.to_repository.get_inventory_weave()

232

224

child_pb = bzrlib.ui.ui_factory.nested_progress_bar()

233

225

try:

234

226

# just merge, this is optimisable and it means we don't

235

227

# copy unreferenced data such as not-needed inventories.

236

228

pb.update("fetch inventory", 1, 3)

237

from_weave = self.from_repository.inventories

229

from_weave = self.from_repository.get_inventory_weave()

238

230

pb.update("fetch inventory", 2, 3)

239

231

# we fetch only the referenced inventories because we do not

240

232

# know for unselected inventories whether all their required

241

233

# texts are present in the other repository - it could be

242

234

# corrupt.

243

to_weave.insert_record_stream(from_weave.get_record_stream(

244

[(rev_id,) for rev_id in revs],

245

self.to_repository._fetch_order,

246

not self.to_repository._fetch_uses_deltas))

235

to_weave.join(from_weave, pb=child_pb, msg='merge inventory',

236

version_ids=revs)

237

from_weave.clear_cache()

247

238

finally:

248

239

child_pb.finished()

249

240

250

def _fetch_revision_texts(self, revs, pb):

251

# may need to be a InterRevisionStore call here.

252

to_sf = self.to_repository.signatures

253

from_sf = self.from_repository.signatures

254

# A missing signature is just skipped.

255

to_sf.insert_record_stream(filter_absent(from_sf.get_record_stream(

256

[(rev_id,) for rev_id in revs],

257

self.to_repository._fetch_order,

258

not self.to_repository._fetch_uses_deltas)))

259

self._fetch_just_revision_texts(revs)

260

261

def _fetch_just_revision_texts(self, version_ids):

262

to_rf = self.to_repository.revisions

263

from_rf = self.from_repository.revisions

264

to_rf.insert_record_stream(from_rf.get_record_stream(

265

[(rev_id,) for rev_id in version_ids],

266

self.to_repository._fetch_order,

267

not self.to_repository._fetch_uses_deltas))

268

269

241

def _generate_root_texts(self, revs):

270

242

"""This will be called by __fetch between fetching weave texts and

271

243

fetching the inventory weave.

276

248

pass

277

249

278

250

251

class GenericRepoFetcher(RepoFetcher):

252

"""This is a generic repo to repo fetcher.

253

254

This makes minimal assumptions about repo layout and contents.

255

It triggers a reconciliation after fetching to ensure integrity.

256

"""

257

258

def _fetch_revision_texts(self, revs, pb):

259

"""Fetch revision object texts"""

260

to_txn = self.to_transaction = self.to_repository.get_transaction()

261

count = 0

262

total = len(revs)

263

to_store = self.to_repository._revision_store

264

for rev in revs:

265

pb.update('copying revisions', count, total)

266

try:

267

sig_text = self.from_repository.get_signature_text(rev)

268

to_store.add_revision_signature_text(rev, sig_text, to_txn)

269

except errors.NoSuchRevision:

270

# not signed.

271

pass

272

to_store.add_revision(self.from_repository.get_revision(rev),

273

to_txn)

274

count += 1

275

# fixup inventory if needed:

276

# this is expensive because we have no inverse index to current ghosts.

277

# but on local disk its a few seconds and sftp push is already insane.

278

# so we just-do-it.

279

# FIXME: repository should inform if this is needed.

280

self.to_repository.reconcile()

281

282

283

class KnitRepoFetcher(RepoFetcher):

284

"""This is a knit format repository specific fetcher.

285

286

This differs from the GenericRepoFetcher by not doing a

287

reconciliation after copying, and using knit joining to

288

copy revision texts.

289

"""

290

291

def _fetch_revision_texts(self, revs, pb):

292

# may need to be a InterRevisionStore call here.

293

from_transaction = self.from_repository.get_transaction()

294

to_transaction = self.to_repository.get_transaction()

295

to_sf = self.to_repository._revision_store.get_signature_file(

296

to_transaction)

297

from_sf = self.from_repository._revision_store.get_signature_file(

298

from_transaction)

299

to_sf.join(from_sf, version_ids=revs, ignore_missing=True)

300

to_rf = self.to_repository._revision_store.get_revision_file(

301

to_transaction)

302

from_rf = self.from_repository._revision_store.get_revision_file(

303

from_transaction)

304

to_rf.join(from_rf, version_ids=revs)

305

306

279

307

class Inter1and2Helper(object):

280

308

"""Helper for operations that convert data from model 1 and 2

281

309

301

329

302

330

:param revs: A list of revision ids

303

331

"""

304

# In case that revs is not a list.

305

revs = list(revs)

306

332

while revs:

307

333

for tree in self.source.revision_trees(revs[:100]):

308

334

if tree.inventory.revision_id is None:

310

336

yield tree

311

337

revs = revs[100:]

312

338

313

def _find_root_ids(self, revs, parent_map, graph):

314

revision_root = {}

315

planned_versions = {}

316

for tree in self.iter_rev_trees(revs):

317

revision_id = tree.inventory.root.revision

318

root_id = tree.get_root_id()

319

planned_versions.setdefault(root_id, []).append(revision_id)

320

revision_root[revision_id] = root_id

321

# Find out which parents we don't already know root ids for

322

parents = set()

323

for revision_parents in parent_map.itervalues():

324

parents.update(revision_parents)

325

parents.difference_update(revision_root.keys() + [NULL_REVISION])

326

# Limit to revisions present in the versionedfile

327

parents = graph.get_parent_map(parents).keys()

328

for tree in self.iter_rev_trees(parents):

329

root_id = tree.get_root_id()

330

revision_root[tree.get_revision_id()] = root_id

331

return revision_root, planned_versions

332

333

339

def generate_root_texts(self, revs):

334

340

"""Generate VersionedFiles for all root ids.

335

341

336

342

:param revs: the revisions to include

337

343

"""

338

to_texts = self.target.texts

339

graph = self.source.get_graph()

340

parent_map = graph.get_parent_map(revs)

341

rev_order = topo_sort(parent_map)

342

rev_id_to_root_id, root_id_to_rev_ids = self._find_root_ids(

343

revs, parent_map, graph)

344

root_id_order = [(rev_id_to_root_id[rev_id], rev_id) for rev_id in

345

rev_order]

346

# Guaranteed stable, this groups all the file id operations together

347

# retaining topological order within the revisions of a file id.

348

# File id splits and joins would invalidate this, but they don't exist

349

# yet, and are unlikely to in non-rich-root environments anyway.

350

root_id_order.sort(key=operator.itemgetter(0))

351

# Create a record stream containing the roots to create.

352

def yield_roots():

353

for key in root_id_order:

354

root_id, rev_id = key

355

rev_parents = parent_map[rev_id]

356

# We drop revision parents with different file-ids, because

357

# that represents a rename of the root to a different location

358

# - its not actually a parent for us. (We could look for that

359

# file id in the revision tree at considerably more expense,

360

# but for now this is sufficient (and reconcile will catch and

361

# correct this anyway).

362

# When a parent revision is a ghost, we guess that its root id

363

# was unchanged (rather than trimming it from the parent list).

364

parent_keys = tuple((root_id, parent) for parent in rev_parents

365

if parent != NULL_REVISION and

366

rev_id_to_root_id.get(parent, root_id) == root_id)

367

yield FulltextContentFactory(key, parent_keys, None, '')

368

to_texts.insert_record_stream(yield_roots())

344

inventory_weave = self.source.get_inventory_weave()

345

parent_texts = {}

346

versionedfile = {}

347

to_store = self.target.weave_store

348

for tree in self.iter_rev_trees(revs):

349

revision_id = tree.inventory.root.revision

350

root_id = tree.get_root_id()

351

parents = inventory_weave.get_parents(revision_id)

352

if root_id not in versionedfile:

353

versionedfile[root_id] = to_store.get_weave_or_empty(root_id,

354

self.target.get_transaction())

355

_, _, parent_texts[root_id] = versionedfile[root_id].add_lines(

356

revision_id, parents, [], parent_texts)

369

357

370

358

def regenerate_inventory(self, revs):

371

359

"""Generate a new inventory versionedfile in target, converting data.

374

362

stored in the target (reserializing it in a different format).

375

363

:param revs: The revisions to include

376

364

"""

365

inventory_weave = self.source.get_inventory_weave()

377

366

for tree in self.iter_rev_trees(revs):

378

parents = tree.get_parent_ids()

367

parents = inventory_weave.get_parents(tree.get_revision_id())

379

368

self.target.add_inventory(tree.get_revision_id(), tree.inventory,

380

369

parents)

381

370

382

def fetch_revisions(self, revision_ids):

383

for revision in self.source.get_revisions(revision_ids):

384

self.target.add_revision(revision.revision_id, revision)

385

386

387

class Model1toKnit2Fetcher(RepoFetcher):

371

372

class Model1toKnit2Fetcher(GenericRepoFetcher):

388

373

"""Fetch from a Model1 repository into a Knit2 repository

389

374

"""

390

def __init__(self, to_repository, from_repository, last_revision=None,

391

pb=None, find_ghosts=True):

375

def __init__(self, to_repository, from_repository, last_revision=None,

376

pb=None):

392

377

self.helper = Inter1and2Helper(from_repository, to_repository)

393

RepoFetcher.__init__(self, to_repository, from_repository,

394

last_revision, pb, find_ghosts)

378

GenericRepoFetcher.__init__(self, to_repository, from_repository,

379

last_revision, pb)

395

380

396

381

def _generate_root_texts(self, revs):

397

382

self.helper.generate_root_texts(revs)

398

383

399

384

def _fetch_inventory_weave(self, revs, pb):

400

385

self.helper.regenerate_inventory(revs)

401

402

def _fetch_revision_texts(self, revs, pb):

403

"""Fetch revision object texts"""

404

count = 0

405

total = len(revs)

406

for rev in revs:

407

pb.update('copying revisions', count, total)

408

try:

409

sig_text = self.from_repository.get_signature_text(rev)

410

self.to_repository.add_signature_text(rev, sig_text)

411

except errors.NoSuchRevision:

412

# not signed.

413

pass

414

self._copy_revision(rev)

415

count += 1

416

417

def _copy_revision(self, rev):

418

self.helper.fetch_revisions([rev])

419

420

421

class Knit1to2Fetcher(RepoFetcher):

386

387

388

class Knit1to2Fetcher(KnitRepoFetcher):

422

389

"""Fetch from a Knit1 repository into a Knit2 repository"""

423

390

424

def __init__(self, to_repository, from_repository, last_revision=None,

425

pb=None, find_ghosts=True):

391

def __init__(self, to_repository, from_repository, last_revision=None,

392

pb=None):

426

393

self.helper = Inter1and2Helper(from_repository, to_repository)

427

RepoFetcher.__init__(self, to_repository, from_repository,

428

last_revision, pb, find_ghosts)

394

KnitRepoFetcher.__init__(self, to_repository, from_repository,

395

last_revision, pb)

429

396

430

397

def _generate_root_texts(self, revs):

431

398

self.helper.generate_root_texts(revs)

433

400

def _fetch_inventory_weave(self, revs, pb):

434

401

self.helper.regenerate_inventory(revs)

435

402

436

def _fetch_just_revision_texts(self, version_ids):

437

self.helper.fetch_revisions(version_ids)

403

404

class RemoteToOtherFetcher(GenericRepoFetcher):

405

406

def _fetch_everything_for_revisions(self, revs, pp):

407

data_stream = self.from_repository.get_data_stream(revs)

408

self.to_repository.insert_data_stream(data_stream)

409

410

Older »