~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/knit.py

Committer: John Arbash Meinel
Date: 2006-08-14 16:07:29 UTC
mfrom: (1907.2.2 bzr.dev)
mto: (1946.2.6 reduce-knit-churn)
mto: This revision was merged to the branch mainline in revision 1918.
Revision ID: john@arbash-meinel.com-20060814160729-a87d9e3104eea2a2

[merge] Hermann Kraus: updates to Bundle exceptions

files added:
bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

files removed:
bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bundle/serializer/v09.py

bzrlib/cache_utf8.py

bzrlib/cmd_version_info.py

bzrlib/inspect_for_copy.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/memorytree.py

bzrlib/mutabletree.py

bzrlib/registry.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/transport/smart.py

bzrlib/transport/ssh.py

bzrlib/treebuilder.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/xml6.py

doc/centralized_workflow.txt

doc/server.txt

doc/version_info.txt

tools/rst2html.py

tools/win32/info.txt

files renamed:
bzrlib/tests/repository_implementations/test_revision.py => bzrlib/tests/repository_implementations/test_revprops.py

files modified:
.bzrignore

BRANCH.TODO

HACKING

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

contrib/newinventory.py

doc/default.css

doc/index.txt

doc/tutorial.txt

profile_imports.py

setup.py *

tools/doc_generate/autodoc_man.py

tools/http_client.py

tools/win32/bzr.iss.cog

Show diffs side-by-side

added added

removed removed

bzrlib/knit.py

# Written by Martin Pool.

# Modified by Johan Rydberg <jrydberg@gnu.org>

# Modified by Robert Collins <robert.collins@canonical.com>

import warnings

import bzrlib

from bzrlib import (

cache_utf8,

errors,

progress,

)

import bzrlib.errors as errors

from bzrlib.errors import FileExists, NoSuchFile, KnitError, \

InvalidRevisionId, KnitCorrupt, KnitHeaderError, \

RevisionNotPresent, RevisionAlreadyPresent

from bzrlib.trace import mutter

from bzrlib.osutils import contains_whitespace, contains_linebreaks, \

sha_strings

from bzrlib.versionedfile import VersionedFile, InterVersionedFile

from bzrlib.symbol_versioning import DEPRECATED_PARAMETER, deprecated_passed

from bzrlib.tsort import topo_sort

import bzrlib.weave

from bzrlib.versionedfile import VersionedFile, InterVersionedFile

import bzrlib.patiencediff

# TODO: Split out code specific to this format into an associated object.

167

162

internal representation is of the format:

168

163

(revid, plaintext)

169

164

"""

170

decode_utf8 = cache_utf8.decode

171

165

lines = []

172

166

for line in content:

173

167

origin, text = line.split(' ', 1)

174

lines.append((decode_utf8(origin), text))

168

lines.append((origin.decode('utf-8'), text))

175

169

return KnitContent(lines)

176

170

177

171

def parse_line_delta_iter(self, lines):

188

182

internal representation is

189

183

(start, end, count, [1..count tuples (revid, newline)])

190

184

"""

191

decode_utf8 = cache_utf8.decode

192

185

result = []

193

186

lines = iter(lines)

194

187

next = lines.next

200

193

while remaining:

201

194

origin, text = next().split(' ', 1)

202

195

remaining -= 1

203

contents.append((decode_utf8(origin), text))

196

contents.append((origin.decode('utf-8'), text))

204

197

result.append((start, end, count, contents))

205

198

return result

206

199

209

202

210

203

see parse_fulltext which this inverts.

211

204

"""

212

encode_utf8 = cache_utf8.encode

213

return ['%s %s' % (encode_utf8(o), t) for o, t in content._lines]

205

return ['%s %s' % (o.encode('utf-8'), t) for o, t in content._lines]

214

206

215

207

def lower_line_delta(self, delta):

216

208

"""convert a delta into a serializable form.

217

209

218

210

See parse_line_delta which this inverts.

219

211

"""

220

encode_utf8 = cache_utf8.encode

221

212

out = []

222

213

for start, end, c, lines in delta:

223

214

out.append('%d,%d,%d\n' % (start, end, c))

224

out.extend(encode_utf8(origin) + ' ' + text

225

for origin, text in lines)

215

for origin, text in lines:

216

out.append('%s %s' % (origin.encode('utf-8'), text))

226

217

return out

227

218

228

219

281

272

stored and retrieved.

282

273

"""

283

274

284

def __init__(self, relpath, transport, file_mode=None, access_mode=None,

275

def __init__(self, relpath, transport, file_mode=None, access_mode=None,

285

276

factory=None, basis_knit=DEPRECATED_PARAMETER, delta=True,

286

create=False, create_parent_dir=False, delay_create=False,

287

dir_mode=None):

277

create=False):

288

278

"""Construct a knit at location specified by relpath.

289

279

290

280

:param create: If not True, only open an existing knit.

291

:param create_parent_dir: If True, create the parent directory if

292

creating the file fails. (This is used for stores with

293

hash-prefixes that may not exist yet)

294

:param delay_create: The calling code is aware that the knit won't

295

actually be created until the first data is stored.

296

281

"""

297

282

if deprecated_passed(basis_knit):

298

283

warnings.warn("KnitVersionedFile.__(): The basis_knit parameter is"

309

294

self.delta = delta

310

295

311

296

self._index = _KnitIndex(transport, relpath + INDEX_SUFFIX,

312

access_mode, create=create, file_mode=file_mode,

313

create_parent_dir=create_parent_dir, delay_create=delay_create,

314

dir_mode=dir_mode)

297

access_mode, create=create, file_mode=file_mode)

315

298

self._data = _KnitData(transport, relpath + DATA_SUFFIX,

316

access_mode, create=create and not len(self), file_mode=file_mode,

317

create_parent_dir=create_parent_dir, delay_create=delay_create,

318

dir_mode=dir_mode)

299

access_mode, create=create and not len(self), file_mode=file_mode)

319

300

320

301

def __repr__(self):

321

302

return '%s(%s)' % (self.__class__.__name__,

415

396

"""See VersionedFile.copy_to()."""

416

397

# copy the current index to a temp index to avoid racing with local

417

398

# writes

418

transport.put_file_non_atomic(name + INDEX_SUFFIX + '.tmp',

419

self.transport.get(self._index._filename))

399

transport.put(name + INDEX_SUFFIX + '.tmp', self.transport.get(self._index._filename),)

420

400

# copy the data file

421

401

f = self._data._open_file()

422

402

try:

423

transport.put_file(name + DATA_SUFFIX, f)

403

transport.put(name + DATA_SUFFIX, f)

424

404

finally:

425

405

f.close()

426

406

# move the copied index into place

427

407

transport.move(name + INDEX_SUFFIX + '.tmp', name + INDEX_SUFFIX)

428

408

429

409

def create_empty(self, name, transport, mode=None):

430

return KnitVersionedFile(name, transport, factory=self.factory,

431

delta=self.delta, create=True)

410

return KnitVersionedFile(name, transport, factory=self.factory, delta=self.delta, create=True)

432

411

433

412

def _fix_parents(self, version, new_parents):

434

413

"""Fix the parents list for version.

523

502

delta_seq = None

524

503

for parent_id in parents:

525

504

merge_content = self._get_content(parent_id, parent_texts)

526

seq = bzrlib.patiencediff.PatienceSequenceMatcher(

527

None, merge_content.text(), content.text())

505

seq = KnitSequenceMatcher(None, merge_content.text(), content.text())

528

506

if delta_seq is None:

529

507

# setup a delta seq to reuse.

530

508

delta_seq = seq

541

519

reference_content = self._get_content(parents[0], parent_texts)

542

520

new_texts = content.text()

543

521

old_texts = reference_content.text()

544

delta_seq = bzrlib.patiencediff.PatienceSequenceMatcher(

545

None, old_texts, new_texts)

522

delta_seq = KnitSequenceMatcher(None, old_texts, new_texts)

546

523

return self._make_line_delta(delta_seq, content)

547

524

548

525

def _make_line_delta(self, delta_seq, new_content):

802

779

text_map[version_id] = text

803

780

return text_map, final_content

804

781

805

def iter_lines_added_or_present_in_versions(self, version_ids=None,

806

pb=None):

782

def iter_lines_added_or_present_in_versions(self, version_ids=None):

807

783

"""See VersionedFile.iter_lines_added_or_present_in_versions()."""

808

784

if version_ids is None:

809

785

version_ids = self.versions()

810

if pb is None:

811

pb = progress.DummyProgress()

812

786

# we don't care about inclusions, the caller cares.

813

787

# but we need to setup a list of records to visit.

814

788

# we need version_id, position, length

826

800

data_pos, length = self._index.get_position(version_id)

827

801

version_id_records.append((version_id, data_pos, length))

828

802

803

pb = bzrlib.ui.ui_factory.nested_progress_bar()

829

804

count = 0

830

805

total = len(version_id_records)

831

pb.update('Walking content.', count, total)

832

for version_id, data, sha_value in \

833

self._data.read_records_iter(version_id_records):

806

try:

834

807

pb.update('Walking content.', count, total)

835

method = self._index.get_method(version_id)

836

version_idx = self._index.lookup(version_id)

837

assert method in ('fulltext', 'line-delta')

838

if method == 'fulltext':

839

content = self.factory.parse_fulltext(data, version_idx)

840

for line in content.text():

841

yield line

842

else:

843

delta = self.factory.parse_line_delta(data, version_idx)

844

for start, end, count, lines in delta:

845

for origin, line in lines:

808

for version_id, data, sha_value in \

809

self._data.read_records_iter(version_id_records):

810

pb.update('Walking content.', count, total)

811

method = self._index.get_method(version_id)

812

version_idx = self._index.lookup(version_id)

813

assert method in ('fulltext', 'line-delta')

814

if method == 'fulltext':

815

content = self.factory.parse_fulltext(data, version_idx)

816

for line in content.text():

846

817

yield line

847

count +=1

848

pb.update('Walking content.', total, total)

818

else:

819

delta = self.factory.parse_line_delta(data, version_idx)

820

for start, end, count, lines in delta:

821

for origin, line in lines:

822

yield line

823

count +=1

824

pb.update('Walking content.', total, total)

825

pb.finished()

826

except:

827

pb.update('Walking content.', total, total)

828

pb.finished()

829

raise

849

830

850

831

def num_versions(self):

851

832

"""See VersionedFile.num_versions()."""

958

939

class _KnitComponentFile(object):

959

940

"""One of the files used to implement a knit database"""

960

941

961

def __init__(self, transport, filename, mode, file_mode=None,

962

create_parent_dir=False, dir_mode=None):

942

def __init__(self, transport, filename, mode, file_mode=None):

963

943

self._transport = transport

964

944

self._filename = filename

965

945

self._mode = mode

966

self._file_mode = file_mode

967

self._dir_mode = dir_mode

968

self._create_parent_dir = create_parent_dir

969

self._need_to_create = False

946

self._file_mode=file_mode

947

948

def write_header(self):

949

if self._transport.append(self._filename, StringIO(self.HEADER),

950

mode=self._file_mode):

951

raise KnitCorrupt(self._filename, 'misaligned after writing header')

970

952

971

953

def check_header(self, fp):

972

954

line = fp.readline()

1059

1041

parents,

1060

1042

index)

1061

1043

1062

def __init__(self, transport, filename, mode, create=False, file_mode=None,

1063

create_parent_dir=False, delay_create=False, dir_mode=None):

1064

_KnitComponentFile.__init__(self, transport, filename, mode,

1065

file_mode=file_mode,

1066

create_parent_dir=create_parent_dir,

1067

dir_mode=dir_mode)

1044

def __init__(self, transport, filename, mode, create=False, file_mode=None):

1045

_KnitComponentFile.__init__(self, transport, filename, mode, file_mode)

1068

1046

self._cache = {}

1069

1047

# position in _history is the 'official' index for a revision

1070

1048

# but the values may have come from a newer entry.

1139

1117

except NoSuchFile, e:

1140

1118

if mode != 'w' or not create:

1141

1119

raise

1142

if delay_create:

1143

self._need_to_create = True

1144

else:

1145

self._transport.put_bytes_non_atomic(self._filename,

1146

self.HEADER, mode=self._file_mode)

1147

1120

self.write_header()

1148

1121

finally:

1149

1122

pb.update('read knit index', total, total)

1150

1123

pb.finished()

1233

1206

return self._cache[version_id][5]

1234

1207

1235

1208

def _version_list_to_index(self, versions):

1236

encode_utf8 = cache_utf8.encode

1237

1209

result_list = []

1238

1210

for version in versions:

1239

1211

if version in self._cache:

1241

1213

result_list.append(str(self._cache[version][5]))

1242

1214

# -- end lookup () --

1243

1215

else:

1244

result_list.append('.' + encode_utf8(version))

1216

result_list.append('.' + version.encode('utf-8'))

1245

1217

return ' '.join(result_list)

1246

1218

1247

1219

def add_version(self, version_id, options, pos, size, parents):

1255

1227

(version_id, options, pos, size, parents).

1256

1228

"""

1257

1229

lines = []

1258

encode_utf8 = cache_utf8.encode

1259

1230

for version_id, options, pos, size, parents in versions:

1260

line = "\n%s %s %s %s %s :" % (encode_utf8(version_id),

1231

line = "\n%s %s %s %s %s :" % (version_id.encode('utf-8'),

1261

1232

','.join(options),

1262

1233

pos,

1263

1234

size,

1265

1236

assert isinstance(line, str), \

1266

1237

'content must be utf-8 encoded: %r' % (line,)

1267

1238

lines.append(line)

1268

if not self._need_to_create:

1269

self._transport.append_bytes(self._filename, ''.join(lines))

1270

else:

1271

sio = StringIO()

1272

sio.write(self.HEADER)

1273

sio.writelines(lines)

1274

sio.seek(0)

1275

self._transport.put_file_non_atomic(self._filename, sio,

1276

create_parent_dir=self._create_parent_dir,

1277

mode=self._file_mode,

1278

dir_mode=self._dir_mode)

1279

self._need_to_create = False

1280

1239

self._transport.append(self._filename, StringIO(''.join(lines)))

1281

1240

# cache after writing, so that a failed write leads to missing cache

1282

1241

# entries not extra ones. XXX TODO: RBC 20060502 in the event of a

1283

1242

# failure, reload the index or flush it or some such, to prevent

1287

1246

1288

1247

def has_version(self, version_id):

1289

1248

"""True if the version is in the index."""

1290

return (version_id in self._cache)

1249

return self._cache.has_key(version_id)

1291

1250

1292

1251

def get_position(self, version_id):

1293

1252

"""Return data position and size of specified version."""

1328

1287

class _KnitData(_KnitComponentFile):

1329

1288

"""Contents of the knit data file"""

1330

1289

1331

def __init__(self, transport, filename, mode, create=False, file_mode=None,

1332

create_parent_dir=False, delay_create=False,

1333

dir_mode=None):

1334

_KnitComponentFile.__init__(self, transport, filename, mode,

1335

file_mode=file_mode,

1336

create_parent_dir=create_parent_dir,

1337

dir_mode=dir_mode)

1290

HEADER = "# bzr knit data 8\n"

1291

1292

def __init__(self, transport, filename, mode, create=False, file_mode=None):

1293

_KnitComponentFile.__init__(self, transport, filename, mode)

1338

1294

self._checked = False

1339

1295

# TODO: jam 20060713 conceptually, this could spill to disk

1340

1296

# if the cached size gets larger than a certain amount

1343

1299

self._cache = {}

1344

1300

self._do_cache = False

1345

1301

if create:

1346

if delay_create:

1347

self._need_to_create = create

1348

else:

1349

self._transport.put_bytes_non_atomic(self._filename, '',

1350

mode=self._file_mode)

1302

self._transport.put(self._filename, StringIO(''), mode=file_mode)

1351

1303

1352

1304

def enable_cache(self):

1353

1305

"""Enable caching of reads."""

1372

1324

"""

1373

1325

sio = StringIO()

1374

1326

data_file = GzipFile(None, mode='wb', fileobj=sio)

1375

1376

version_id_utf8 = cache_utf8.encode(version_id)

1377

1327

data_file.writelines(chain(

1378

["version %s %d %s\n" % (version_id_utf8,

1328

["version %s %d %s\n" % (version_id.encode('utf-8'),

1379

1329

len(lines),

1380

1330

digest)],

1381

1331

lines,

1382

["end %s\n" % version_id_utf8]))

1332

["end %s\n" % version_id.encode('utf-8')]))

1383

1333

data_file.close()

1384

1334

length= sio.tell()

1385

1335

1392

1342

:return: the offset in the data file raw_data was written.

1393

1343

"""

1394

1344

assert isinstance(raw_data, str), 'data must be plain bytes'

1395

if not self._need_to_create:

1396

return self._transport.append_bytes(self._filename, raw_data)

1397

else:

1398

self._transport.put_bytes_non_atomic(self._filename, raw_data,

1399

create_parent_dir=self._create_parent_dir,

1400

mode=self._file_mode,

1401

dir_mode=self._dir_mode)

1402

self._need_to_create = False

1403

return 0

1345

return self._transport.append(self._filename, StringIO(raw_data))

1404

1346

1405

1347

def add_record(self, version_id, digest, lines):

1406

1348

"""Write new text record to disk. Returns the position in the

1407

1349

file where it was written."""

1408

1350

size, sio = self._record_to_data(version_id, digest, lines)

1409

1351

# write to disk

1410

if not self._need_to_create:

1411

start_pos = self._transport.append_file(self._filename, sio)

1412

else:

1413

self._transport.put_file_non_atomic(self._filename, sio,

1414

create_parent_dir=self._create_parent_dir,

1415

mode=self._file_mode,

1416

dir_mode=self._dir_mode)

1417

self._need_to_create = False

1418

start_pos = 0

1352

start_pos = self._transport.append(self._filename, sio)

1419

1353

if self._do_cache:

1420

1354

self._cache[version_id] = sio.getvalue()

1421

1355

return start_pos, size

1430

1364

rec = df.readline().split()

1431

1365

if len(rec) != 4:

1432

1366

raise KnitCorrupt(self._filename, 'unexpected number of elements in record header')

1433

if cache_utf8.decode(rec[1]) != version_id:

1367

if rec[1].decode('utf-8')!= version_id:

1434

1368

raise KnitCorrupt(self._filename,

1435

1369

'unexpected version, wanted %r, got %r' % (

1436

1370

version_id, rec[1]))

1445

1379

record_contents = df.readlines()

1446

1380

l = record_contents.pop()

1447

1381

assert len(record_contents) == int(rec[2])

1448

if l != 'end %s\n' % cache_utf8.encode(version_id):

1382

if l.decode('utf-8') != 'end %s\n' % version_id:

1449

1383

raise KnitCorrupt(self._filename, 'unexpected version end line %r, wanted %r'

1450

1384

% (l, version_id))

1451

1385

df.close()

Older »