~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/repofmt/pack_repo.py

Committer: Jelmer Vernooij
Date: 2009-02-23 20:55:58 UTC
mfrom: (4034 +trunk)
mto: This revision was merged to the branch mainline in revision 4053.
Revision ID: jelmer@samba.org-20090223205558-1cx2k4w1zgs8r5qa

Merge bzr.dev.

files added:
bzrlib/help_topics/en/log-formats.txt

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/workingtree_implementations/test_views.py

bzrlib/views.py

tools/prepare_for_latex.py

tools/rst2pdf.py

files modified:
.bzrignore

Makefile

NEWS

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_patiencediff_py.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_pack.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/btree_index.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/fetch.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/hooks.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_deprecated_graph.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_store.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/bencode.py

bzrlib/util/configobj/configobj.py

bzrlib/util/simplemapi.py

bzrlib/util/tests/test_bencode.py

bzrlib/version_info_formats/__init__.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/developers/HACKING.txt

doc/developers/index.txt

doc/developers/ppa.txt

doc/developers/releasing.txt

setup.py

tools/packaging/build-packages.sh

tools/packaging/update-changelogs.sh

tools/packaging/update-packaging-branches.sh

tools/win32/build_release.py

tools/win32/bzr.iss.cog

Show diffs side-by-side

added added

removed removed

bzrlib/repofmt/pack_repo.py

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

import re

import sys

from bzrlib.lazy_import import lazy_import

class PackCommitBuilder(CommitBuilder):

"""A subclass of CommitBuilder to add texts with pack semantics.

Specifically this uses one knit object rather than one knit object per

added text, reducing memory and object pressure.

"""

101

102

103

class PackRootCommitBuilder(RootCommitBuilder):

103

104

"""A subclass of RootCommitBuilder to add texts with pack semantics.

104

105

106

Specifically this uses one knit object rather than one knit object per

106

107

added text, reducing memory and object pressure.

107

108

"""

127

128

ExistingPack and NewPack are used.

128

129

"""

129

130

131

# A map of index 'type' to the file extension and position in the

132

# index_sizes array.

133

index_definitions = {

134

'revision': ('.rix', 0),

135

'inventory': ('.iix', 1),

136

'text': ('.tix', 2),

137

'signature': ('.six', 3),

138

}

139

130

140

def __init__(self, revision_index, inventory_index, text_index,

131

141

signature_index):

132

142

"""Create a pack instance.

151

161

"""Return a tuple (transport, name) for the pack content."""

152

162

return self.pack_transport, self.file_name()

153

163

164

def _check_references(self):

165

"""Make sure our external references are present.

166

167

Packs are allowed to have deltas whose base is not in the pack, but it

168

must be present somewhere in this collection. It is not allowed to

169

have deltas based on a fallback repository.

170

(See <https://bugs.launchpad.net/bzr/+bug/288751>)

171

"""

172

missing_items = {}

173

for (index_name, external_refs, index) in [

174

('texts',

175

self._get_external_refs(self.text_index),

176

self._pack_collection.text_index.combined_index),

177

('inventories',

178

self._get_external_refs(self.inventory_index),

179

self._pack_collection.inventory_index.combined_index),

180

181

missing = external_refs.difference(

182

k for (idx, k, v, r) in

183

index.iter_entries(external_refs))

184

if missing:

185

missing_items[index_name] = sorted(list(missing))

186

if missing_items:

187

from pprint import pformat

188

raise errors.BzrCheckError(

189

"Newly created pack file %r has delta references to "

190

"items not in its repository:\n%s"

191

% (self, pformat(missing_items)))

192

154

193

def file_name(self):

155

194

"""Get the file name for the pack on disk."""

156

195

return self.name + '.pack'

158

197

def get_revision_count(self):

159

198

return self.revision_index.key_count()

160

199

200

def index_name(self, index_type, name):

201

"""Get the disk name of an index type for pack name 'name'."""

202

return name + Pack.index_definitions[index_type][0]

203

204

def index_offset(self, index_type):

205

"""Get the position in a index_size array for a given index type."""

206

return Pack.index_definitions[index_type][1]

207

161

208

def inventory_index_name(self, name):

162

209

"""The inv index is the name + .iix."""

163

210

return self.index_name('inventory', name)

174

221

"""The text index is the name + .tix."""

175

222

return self.index_name('text', name)

176

223

224

def _replace_index_with_readonly(self, index_type):

225

setattr(self, index_type + '_index',

226

self.index_class(self.index_transport,

227

self.index_name(index_type, self.name),

228

self.index_sizes[self.index_offset(index_type)]))

229

177

230

178

231

class ExistingPack(Pack):

179

232

"""An in memory proxy for an existing .pack and its disk indices."""

200

253

return not self.__eq__(other)

201

254

202

255

def __repr__(self):

203

return "<bzrlib.repofmt.pack_repo.Pack object at 0x%x, %s, %s" % (

204

id(self), self.pack_transport, self.name)

256

return "<%s.%s object at 0x%x, %s, %s" % (

257

self.__class__.__module__, self.__class__.__name__, id(self),

258

self.pack_transport, self.name)

259

260

261

class ResumedPack(ExistingPack):

262

263

def __init__(self, name, revision_index, inventory_index, text_index,

264

signature_index, upload_transport, pack_transport, index_transport,

265

pack_collection):

266

"""Create a ResumedPack object."""

267

ExistingPack.__init__(self, pack_transport, name, revision_index,

268

inventory_index, text_index, signature_index)

269

self.upload_transport = upload_transport

270

self.index_transport = index_transport

271

self.index_sizes = [None, None, None, None]

272

indices = [

273

('revision', revision_index),

274

('inventory', inventory_index),

275

('text', text_index),

276

('signature', signature_index),

277

]

278

for index_type, index in indices:

279

offset = self.index_offset(index_type)

280

self.index_sizes[offset] = index._size

281

self.index_class = pack_collection._index_class

282

self._pack_collection = pack_collection

283

self._state = 'resumed'

284

# XXX: perhaps check that the .pack file exists?

285

286

def access_tuple(self):

287

if self._state == 'finished':

288

return Pack.access_tuple(self)

289

elif self._state == 'resumed':

290

return self.upload_transport, self.file_name()

291

else:

292

raise AssertionError(self._state)

293

294

def abort(self):

295

self.upload_transport.delete(self.file_name())

296

indices = [self.revision_index, self.inventory_index, self.text_index,

297

self.signature_index]

298

for index in indices:

299

index._transport.delete(index._name)

300

301

def finish(self):

302

self._check_references()

303

new_name = '../packs/' + self.file_name()

304

self.upload_transport.rename(self.file_name(), new_name)

305

for index_type in ['revision', 'inventory', 'text', 'signature']:

306

old_name = self.index_name(index_type, self.name)

307

new_name = '../indices/' + old_name

308

self.upload_transport.rename(old_name, new_name)

309

self._replace_index_with_readonly(index_type)

310

self._state = 'finished'

311

312

def _get_external_refs(self, index):

313

return index.external_references(1)

205

314

206

315

207

316

class NewPack(Pack):

208

317

"""An in memory proxy for a pack which is being created."""

209

318

210

# A map of index 'type' to the file extension and position in the

211

# index_sizes array.

212

index_definitions = {

213

'revision': ('.rix', 0),

214

'inventory': ('.iix', 1),

215

'text': ('.tix', 2),

216

'signature': ('.six', 3),

217

}

218

219

319

def __init__(self, pack_collection, upload_suffix='', file_mode=None):

220

320

"""Create a NewPack instance.

221

321

274

374

mutter('%s: create_pack: pack stream open: %s%s t+%6.3fs',

275

375

time.ctime(), self.upload_transport.base, self.random_name,

276

376

time.time() - self.start_time)

277

# A list of byte sequences to be written to the new pack, and the

278

# aggregate size of them. Stored as a list rather than separate

377

# A list of byte sequences to be written to the new pack, and the

378

# aggregate size of them. Stored as a list rather than separate

279

379

# variables so that the _write_data closure below can update them.

280

380

self._buffer = [[], 0]

281

# create a callable for adding data

381

# create a callable for adding data

282

382

283

383

# robertc says- this is a closure rather than a method on the object

284

384

# so that the variables are locals, and faster than accessing object

318

418

else:

319

419

raise AssertionError(self._state)

320

420

321

def _check_references(self):

322

"""Make sure our external references are present.

323

324

Packs are allowed to have deltas whose base is not in the pack, but it

325

must be present somewhere in this collection. It is not allowed to

326

have deltas based on a fallback repository.

327

(See <https://bugs.launchpad.net/bzr/+bug/288751>)

328

"""

329

missing_items = {}

330

for (index_name, external_refs, index) in [

331

('texts',

332

self.text_index._external_references(),

333

self._pack_collection.text_index.combined_index),

334

('inventories',

335

self.inventory_index._external_references(),

336

self._pack_collection.inventory_index.combined_index),

337

338

missing = external_refs.difference(

339

k for (idx, k, v, r) in

340

index.iter_entries(external_refs))

341

if missing:

342

missing_items[index_name] = sorted(list(missing))

343

if missing_items:

344

from pprint import pformat

345

raise errors.BzrCheckError(

346

"Newly created pack file %r has delta references to "

347

"items not in its repository:\n%s"

348

% (self, pformat(missing_items)))

349

350

421

def data_inserted(self):

351

422

"""True if data has been added to this pack."""

352

423

return bool(self.get_revision_count() or

354

425

self.text_index.key_count() or

355

426

self.signature_index.key_count())

356

427

357

def finish(self):

428

def finish(self, suspend=False):

358

429

"""Finish the new pack.

359

430

360

431

This:

369

440

if self._buffer[1]:

370

441

self._write_data('', flush=True)

371

442

self.name = self._hash.hexdigest()

372

self._check_references()

443

if not suspend:

444

self._check_references()

373

445

# write indices

374

446

# XXX: It'd be better to write them all to temporary names, then

375

447

# rename them all into place, so that the window when only some are

376

448

# visible is smaller. On the other hand none will be seen until

377

449

# they're in the names list.

378

450

self.index_sizes = [None, None, None, None]

379

self._write_index('revision', self.revision_index, 'revision')

380

self._write_index('inventory', self.inventory_index, 'inventory')

381

self._write_index('text', self.text_index, 'file texts')

451

self._write_index('revision', self.revision_index, 'revision', suspend)

452

self._write_index('inventory', self.inventory_index, 'inventory',

453

suspend)

454

self._write_index('text', self.text_index, 'file texts', suspend)

382

455

self._write_index('signature', self.signature_index,

383

'revision signatures')

456

'revision signatures', suspend)

384

457

self.write_stream.close()

385

458

# Note that this will clobber an existing pack with the same name,

386

459

# without checking for hash collisions. While this is undesirable this

393

466

# - try for HASH.pack

394

467

# - try for temporary-name

395

468

# - refresh the pack-list to see if the pack is now absent

396

self.upload_transport.rename(self.random_name,

397

'../packs/' + self.name + '.pack')

469

new_name = self.name + '.pack'

470

if not suspend:

471

new_name = '../packs/' + new_name

472

self.upload_transport.rename(self.random_name, new_name)

398

473

self._state = 'finished'

399

474

if 'pack' in debug.debug_flags:

400

475

# XXX: size might be interesting?

401

mutter('%s: create_pack: pack renamed into place: %s%s->%s%s t+%6.3fs',

476

mutter('%s: create_pack: pack finished: %s%s->%s t+%6.3fs',

402

477

time.ctime(), self.upload_transport.base, self.random_name,

403

self.pack_transport, self.name,

404

time.time() - self.start_time)

478

new_name, time.time() - self.start_time)

405

479

406

480

def flush(self):

407

481

"""Flush any current data."""

411

485

self._hash.update(bytes)

412

486

self._buffer[:] = [[], 0]

413

487

414

def index_name(self, index_type, name):

415

"""Get the disk name of an index type for pack name 'name'."""

416

return name + NewPack.index_definitions[index_type][0]

417

418

def index_offset(self, index_type):

419

"""Get the position in a index_size array for a given index type."""

420

return NewPack.index_definitions[index_type][1]

421

422

def _replace_index_with_readonly(self, index_type):

423

setattr(self, index_type + '_index',

424

self.index_class(self.index_transport,

425

self.index_name(index_type, self.name),

426

self.index_sizes[self.index_offset(index_type)]))

488

def _get_external_refs(self, index):

489

return index._external_references()

427

490

428

491

def set_write_cache_size(self, size):

429

492

self._cache_limit = size

430

493

431

def _write_index(self, index_type, index, label):

494

def _write_index(self, index_type, index, label, suspend=False):

432

495

"""Write out an index.

433

496

434

497

:param index_type: The type of index to write - e.g. 'revision'.

436

499

:param label: What label to give the index e.g. 'revision'.

437

500

"""

438

501

index_name = self.index_name(index_type, self.name)

439

self.index_sizes[self.index_offset(index_type)] = \

440

self.index_transport.put_file(index_name, index.finish(),

441

mode=self._file_mode)

502

if suspend:

503

transport = self.upload_transport

504

else:

505

transport = self.index_transport

506

self.index_sizes[self.index_offset(index_type)] = transport.put_file(

507

index_name, index.finish(), mode=self._file_mode)

442

508

if 'pack' in debug.debug_flags:

443

509

# XXX: size might be interesting?

444

510

mutter('%s: create_pack: wrote %s index: %s%s t+%6.3fs',

445

511

time.ctime(), label, self.upload_transport.base,

446

512

self.random_name, time.time() - self.start_time)

447

# Replace the writable index on this object with a readonly,

513

# Replace the writable index on this object with a readonly,

448

514

# presently unloaded index. We should alter

449

515

# the index layer to make its finish() error if add_node is

450

516

# subsequently used. RBC

459

525

such as 'revision index'.

460

526

461

527

A CombinedIndex provides an index on a single key space built up

462

from several on-disk indices. The AggregateIndex builds on this

528

from several on-disk indices. The AggregateIndex builds on this

463

529

to provide a knit access layer, and allows having up to one writable

464

530

index within the collection.

465

531

"""

505

571

506

572

Future searches on the aggregate index will search this new index

507

573

before all previously inserted indices.

508

574

509

575

:param index: An Index for the pack.

510

576

:param pack: A Pack instance.

511

577

"""

519

585

520

586

There can be at most one writable index at any time. Any

521

587

modifications made to the knit are put into this index.

522

588

523

589

:param index: An index from the pack parameter.

524

590

:param pack: A Pack instance.

525

591

"""

542

608

543

609

def remove_index(self, index, pack):

544

610

"""Remove index from the indices used to answer queries.

545

611

546

612

:param index: An index from the pack parameter.

547

613

:param pack: A Pack instance.

548

614

"""

623

689

This does little more than a bulk copy of data. One key difference

624

690

is that data with the same item key across multiple packs is elided

625

691

from the output. The new pack is written into the current pack store

626

along with its indices, and the name added to the pack names. The

692

along with its indices, and the name added to the pack names. The

627

693

source packs are not altered and are not required to be in the current

628

694

pack collection.

629

695

848

914

nodes = sorted(nodes)

849

915

# how to map this into knit.py - or knit.py into this?

850

916

# we don't want the typical knit logic, we want grouping by pack

851

# at this point - perhaps a helper library for the following code

917

# at this point - perhaps a helper library for the following code

852

918

# duplication points?

853

919

request_groups = {}

854

920

for index, key, value in nodes:

954

1020

955

1021

def _least_readv_node_readv(self, nodes):

956

1022

"""Generate request groups for nodes using the least readv's.

957

1023

958

1024

:param nodes: An iterable of graph index nodes.

959

1025

:return: Total node count and an iterator of the data needed to perform

960

1026

readvs to obtain the data for nodes. Each item yielded by the

1071

1137

1072

1138

class ReconcilePacker(Packer):

1073

1139

"""A packer which regenerates indices etc as it copies.

1074

1140

1075

1141

This is used by ``bzr reconcile`` to cause parent text pointers to be

1076

1142

regenerated.

1077

1143

"""

1100

1166

# 1) generate the ideal index

1101

1167

repo = self._pack_collection.repo

1102

1168

ancestors = dict([(key[0], tuple(ref[0] for ref in refs[0])) for

1103

_1, key, _2, refs in

1169

_1, key, _2, refs in

1104

1170

self.new_pack.revision_index.iter_all_entries()])

1105

1171

ideal_index = repo._generate_text_key_index(self._text_refs, ancestors)

1106

1172

# 2) generate a text_nodes list that contains all the deltas that can

1112

1178

text_index_map, text_nodes = self._get_text_nodes()

1113

1179

for node in text_nodes:

1114

1180

# 0 - index

1115

# 1 - key

1181

# 1 - key

1116

1182

# 2 - value

1117

1183

# 3 - refs

1118

1184

try:

1213

1279

1214

1280

class RepositoryPackCollection(object):

1215

1281

"""Management of packs within a repository.

1216

1282

1217

1283

:ivar _names: map of {pack_name: (index_size,)}

1218

1284

"""

1219

1285

1221

1287

pack_transport, index_builder_class, index_class):

1222

1288

"""Create a new RepositoryPackCollection.

1223

1289

1224

:param transport: Addresses the repository base directory

1290

:param transport: Addresses the repository base directory

1225

1291

(typically .bzr/repository/).

1226

1292

:param index_transport: Addresses the directory containing indices.

1227

1293

:param upload_transport: Addresses the directory into which packs are written

1250

1316

self.inventory_index = AggregateIndex(self.reload_pack_names)

1251

1317

self.text_index = AggregateIndex(self.reload_pack_names)

1252

1318

self.signature_index = AggregateIndex(self.reload_pack_names)

1319

# resumed packs

1320

self._resumed_packs = []

1253

1321

1254

1322

def add_pack_to_memory(self, pack):

1255

1323

"""Make a Pack object available to the repository to satisfy queries.

1256

1324

1257

1325

:param pack: A Pack object.

1258

1326

"""

1259

1327

if pack.name in self._packs_by_name:

1260

raise AssertionError()

1328

raise AssertionError(

1329

'pack %s already in _packs_by_name' % (pack.name,))

1261

1330

self.packs.append(pack)

1262

1331

self._packs_by_name[pack.name] = pack

1263

1332

self.revision_index.add_index(pack.revision_index, pack)

1264

1333

self.inventory_index.add_index(pack.inventory_index, pack)

1265

1334

self.text_index.add_index(pack.text_index, pack)

1266

1335

self.signature_index.add_index(pack.signature_index, pack)

1267

1336

1268

1337

def all_packs(self):

1269

1338

"""Return a list of all the Pack objects this repository has.

1270

1339

1279

1348

1280

1349

def autopack(self):

1281

1350

"""Pack the pack collection incrementally.

1282

1351

1283

1352

This will not attempt global reorganisation or recompression,

1284

1353

rather it will just ensure that the total number of packs does

1285

1354

not grow without bound. It uses the _max_pack_count method to

1322

1391

# group their data with the relevant commit, and that may

1323

1392

# involve rewriting ancient history - which autopack tries to

1324

1393

# avoid. Alternatively we could not group the data but treat

1325

# each of these as having a single revision, and thus add

1394

# each of these as having a single revision, and thus add

1326

1395

# one revision for each to the total revision count, to get

1327

1396

# a matching distribution.

1328

1397

continue

1375

1444

1376

1445

def lock_names(self):

1377

1446

"""Acquire the mutex around the pack-names index.

1378

1447

1379

1448

This cannot be used in the middle of a read-only transaction on the

1380

1449

repository.

1381

1450

"""

1493

1562

self.add_pack_to_memory(result)

1494

1563

return result

1495

1564

1565

def _resume_pack(self, name):

1566

"""Get a suspended Pack object by name.

1567

1568

:param name: The name of the pack - e.g. '123456'

1569

:return: A Pack object.

1570

"""

1571

if not re.match('[a-f0-9]{32}', name):

1572

# Tokens should be md5sums of the suspended pack file, i.e. 32 hex

1573

# digits.

1574

raise errors.UnresumableWriteGroup(

1575

self.repo, [name], 'Malformed write group token')

1576

try:

1577

rev_index = self._make_index(name, '.rix', resume=True)

1578

inv_index = self._make_index(name, '.iix', resume=True)

1579

txt_index = self._make_index(name, '.tix', resume=True)

1580

sig_index = self._make_index(name, '.six', resume=True)

1581

result = ResumedPack(name, rev_index, inv_index, txt_index,

1582

sig_index, self._upload_transport, self._pack_transport,

1583

self._index_transport, self)

1584

except errors.NoSuchFile, e:

1585

raise errors.UnresumableWriteGroup(self.repo, [name], str(e))

1586

self.add_pack_to_memory(result)

1587

self._resumed_packs.append(result)

1588

return result

1589

1496

1590

def allocate(self, a_new_pack):

1497

1591

"""Allocate name in the list of packs.

1498

1592

1508

1602

1509

1603

def _iter_disk_pack_index(self):

1510

1604

"""Iterate over the contents of the pack-names index.

1511

1605

1512

1606

This is used when loading the list from disk, and before writing to

1513

1607

detect updates from others during our write operation.

1514

1608

:return: An iterator of the index contents.

1516

1610

return self._index_class(self.transport, 'pack-names', None

1517

1611

).iter_all_entries()

1518

1612

1519

def _make_index(self, name, suffix):

1613

def _make_index(self, name, suffix, resume=False):

1520

1614

size_offset = self._suffix_offsets[suffix]

1521

1615

index_name = name + suffix

1522

index_size = self._names[name][size_offset]

1523

return self._index_class(

1524

self._index_transport, index_name, index_size)

1616

if resume:

1617

transport = self._upload_transport

1618

index_size = transport.stat(index_name).st_size

1619

else:

1620

transport = self._index_transport

1621

index_size = self._names[name][size_offset]

1622

return self._index_class(transport, index_name, index_size)

1525

1623

1526

1624

def _max_pack_count(self, total_revisions):

1527

1625

"""Return the maximum number of packs to use for total revisions.

1528

1626

1529

1627

:param total_revisions: The total number of revisions in the

1530

1628

repository.

1531

1629

"""

1586

1684

1587

1685

def _remove_pack_from_memory(self, pack):

1588

1686

"""Remove pack from the packs accessed by this repository.

1589

1687

1590

1688

Only affects memory state, until self._save_pack_names() is invoked.

1591

1689

"""

1592

1690

self._names.pop(pack.name)

1717

1815

try:

1718

1816

builder = self._index_builder_class()

1719

1817

disk_nodes, deleted_nodes, new_nodes = self._diff_pack_names()

1720

# TODO: handle same-name, index-size-changes here -

1818

# TODO: handle same-name, index-size-changes here -

1721

1819

# e.g. use the value from disk, not ours, *unless* we're the one

1722

1820

# changing it.

1723

1821

for key, value in disk_nodes:

1802

1900

# case. -- mbp 20081113

1803

1901

self._remove_pack_indices(self._new_pack)

1804

1902

self._new_pack = None

1903

for resumed_pack in self._resumed_packs:

1904

try:

1905

resumed_pack.abort()

1906

finally:

1907

# See comment in previous finally block.

1908

try:

1909

self._remove_pack_indices(resumed_pack)

1910

except KeyError:

1911

pass

1912

del self._resumed_packs[:]

1805

1913

self.repo._text_knit = None

1806

1914

1915

def _remove_resumed_pack_indices(self):

1916

for resumed_pack in self._resumed_packs:

1917

self._remove_pack_indices(resumed_pack)

1918

del self._resumed_packs[:]

1919

1807

1920

def _commit_write_group(self):

1921

all_missing = set()

1922

for prefix, versioned_file in (

1923

('revisions', self.repo.revisions),

1924

('inventories', self.repo.inventories),

1925

('texts', self.repo.texts),

1926

('signatures', self.repo.signatures),

1927

1928

missing = versioned_file.get_missing_compression_parent_keys()

1929

all_missing.update([(prefix,) + key for key in missing])

1930

if all_missing:

1931

raise errors.BzrCheckError(

1932

"Repository %s has missing compression parent(s) %r "

1933

% (self.repo, sorted(all_missing)))

1808

1934

self._remove_pack_indices(self._new_pack)

1935

should_autopack = False

1809

1936

if self._new_pack.data_inserted():

1810

1937

# get all the data to disk and ready to use

1811

1938

self._new_pack.finish()

1812

1939

self.allocate(self._new_pack)

1813

1940

self._new_pack = None

1941

should_autopack = True

1942

else:

1943

self._new_pack.abort()

1944

self._new_pack = None

1945

for resumed_pack in self._resumed_packs:

1946

# XXX: this is a pretty ugly way to turn the resumed pack into a

1947

# properly committed pack.

1948

self._names[resumed_pack.name] = None

1949

self._remove_pack_from_memory(resumed_pack)

1950

resumed_pack.finish()

1951

self.allocate(resumed_pack)

1952

should_autopack = True

1953

del self._resumed_packs[:]

1954

if should_autopack:

1814

1955

if not self.autopack():

1815

1956

# when autopack takes no steps, the names list is still

1816

1957

# unsaved.

1817

1958

self._save_pack_names()

1959

self.repo._text_knit = None

1960

1961

def _suspend_write_group(self):

1962

tokens = [pack.name for pack in self._resumed_packs]

1963

self._remove_pack_indices(self._new_pack)

1964

if self._new_pack.data_inserted():

1965

# get all the data to disk and ready to use

1966

self._new_pack.finish(suspend=True)

1967

tokens.append(self._new_pack.name)

1968

self._new_pack = None

1818

1969

else:

1819

1970

self._new_pack.abort()

1820

1971

self._new_pack = None

1972

self._remove_resumed_pack_indices()

1821

1973

self.repo._text_knit = None

1974

return tokens

1975

1976

def _resume_write_group(self, tokens):

1977

for token in tokens:

1978

self._resume_pack(token)

1822

1979

1823

1980

1824

1981

class KnitPackRepository(KnitRepository):

1825

1982

"""Repository with knit objects stored inside pack containers.

1826

1983

1827

1984

The layering for a KnitPackRepository is:

1828

1985

1829

1986

Graph | HPSS | Repository public layer |

1843

2000

pack file. The GraphIndex layer works in N-tuples and is unaware of any

1844

2001

semantic value.

1845

2002

===================================================

1846

2003

1847

2004

"""

1848

2005

1849

2006

def __init__(self, _format, a_bzrdir, control_files, _commit_builder_class,

1882

2039

data_access=self._pack_collection.text_index.data_access,

1883

2040

max_delta_chain=200)

1884

2041

# True when the repository object is 'write locked' (as opposed to the

1885

# physical lock only taken out around changes to the pack-names list.)

2042

# physical lock only taken out around changes to the pack-names list.)

1886

2043

# Another way to represent this would be a decorator around the control

1887

2044

# files object that presents logical locks as physical ones - if this

1888

2045

# gets ugly consider that alternative design. RBC 20071011

1973

2130

def _commit_write_group(self):

1974

2131

return self._pack_collection._commit_write_group()

1975

2132

2133

def suspend_write_group(self):

2134

# XXX check self._write_group is self.get_transaction()?

2135

tokens = self._pack_collection._suspend_write_group()

2136

self._write_group = None

2137

return tokens

2138

2139

def _resume_write_group(self, tokens):
    """Start a write group and re-attach previously suspended packs to it.

    :param tokens: The write group tokens (suspended pack names) to
        resume; they are handed to the pack collection unchanged.
    :raises UnresumableWriteGroup: propagated from the pack collection
        when any token cannot be resumed.
    """
    self._start_write_group()
    try:
        self._pack_collection._resume_write_group(tokens)
    except errors.UnresumableWriteGroup:
        # Do not leave the freshly started write group dangling when a
        # token cannot be resumed: abort it, then report the failure.
        # NOTE(review): relies on this repository's _abort_write_group
        # hook, which is defined outside the excerpt shown here.
        self._abort_write_group()
        raise

2142

1976

2143

def get_transaction(self):

1977

2144

if self._write_lock_count:

1978

2145

return self._transaction

2097

2264

builder = self.index_builder_class()

2098

2265

files = [('pack-names', builder.finish())]

2099

2266

utf8_files = [('format', self.get_format_string())]

2100

2267

2101

2268

self._upload_blank_content(a_bzrdir, dirs, files, utf8_files, shared)

2102

2269

return self.open(a_bzrdir=a_bzrdir, _found=True)

2103

2270

2104

2271

def open(self, a_bzrdir, _found=False, _override_transport=None):

2105

2272

"""See RepositoryFormat.open().

2106

2273

2107

2274

:param _override_transport: INTERNAL USE ONLY. Allows opening the

2108

2275

repository at a slightly different url

2109

2276

than normal. I.e. during 'upgrade'.

2195

2362

if not getattr(target_format, 'supports_tree_reference', False):

2196

2363

raise errors.BadConversionTarget(

2197

2364

'Does not support nested trees', target_format)

2198

2365

2199

2366

def get_format_string(self):

2200

2367

"""See RepositoryFormat.get_format_string()."""

2201

2368

return "Bazaar pack repository format 1 with subtree support (needs bzr 0.92)\n"

2541

2708

if not getattr(target_format, 'supports_tree_reference', False):

2542

2709

raise errors.BadConversionTarget(

2543

2710

'Does not support nested trees', target_format)

2544

2711

2545

2712

def get_format_string(self):

2546

2713

"""See RepositoryFormat.get_format_string()."""

2547

2714

return ("Bazaar development format 2 with subtree support "

Older »