~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/pack.py

Committer: Alexander Belchenko
Date: 2007-08-10 09:04:38 UTC
mto: This revision was merged to the branch mainline in revision 2694.
Revision ID: bialix@ukr.net-20070810090438-0835xdz0rl8825qv

fixes after Ian's review

files added:
bzrlib/plugins/multiparent.py

bzrlib/transport/http/_pycurl_errors.py

doc/README.1st

doc/developers/scratch.txt

files removed:
bzrlib/_patiencediff_c.c

bzrlib/benchmarks/bench_pack.py

bzrlib/bisect_multi.py

bzrlib/directory_service.py

bzrlib/help_topics

bzrlib/help_topics/en

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/test_account.py

bzrlib/plugins/launchpad/test_lp_service.py

bzrlib/reconfigure.py

bzrlib/repofmt/pack_repo.py

bzrlib/switch.py

bzrlib/tests/blackbox/test_bundle_info.py

bzrlib/tests/blackbox/test_check.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/ftp_server.py

bzrlib/tests/inventory_implementations

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/repository_implementations/helpers.py

bzrlib/tests/repository_implementations/test__generate_text_key_index.py

bzrlib/tests/repository_implementations/test_check.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_find_text_key_references.py

bzrlib/tests/repository_implementations/test_has_revisions.py

bzrlib/tests/repository_implementations/test_is_write_locked.py

bzrlib/tests/test_bisect_multi.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_http_implementations.py

bzrlib/tests/test_lru_cache.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_switch.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/tests/tree_implementations/test_get_root_id.py

bzrlib/tests/tree_implementations/test_path_content_summary.py

bzrlib/transport/trace.py

bzrlib/util/simplemapi.py

bzrlib/version_info_formats/format_custom.py

contrib/bzr_access

doc/developers/authentication-ring.txt

doc/developers/development-repo.txt

doc/developers/directory-fingerprints.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/lca-merge.txt

doc/developers/missing.txt

doc/developers/network-protocol.txt

doc/developers/packrepo.txt

doc/developers/revision-properties.txt

doc/developers/update.txt

doc/en

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/developer-guide

doc/en/mini-tutorial

doc/en/mini-tutorial/index.txt

doc/en/quick-reference

doc/en/quick-reference/Makefile

doc/en/quick-reference/quick-start-summary.pdf

doc/en/quick-reference/quick-start-summary.png

doc/en/quick-reference/quick-start-summary.svg

doc/en/release-notes

doc/en/tutorials

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/best_practice_intro.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/browsing_history.txt

doc/en/user-guide/central_intro.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/entering_commands.txt

doc/en/user-guide/getting_help.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/images

doc/en/user-guide/images/workflows_centralized.png

doc/en/user-guide/images/workflows_centralized.svg

doc/en/user-guide/images/workflows_gatekeeper.png

doc/en/user-guide/images/workflows_gatekeeper.svg

doc/en/user-guide/images/workflows_localcommit.png

doc/en/user-guide/images/workflows_localcommit.svg

doc/en/user-guide/images/workflows_peer.png

doc/en/user-guide/images/workflows_peer.svg

doc/en/user-guide/images/workflows_pqm.png

doc/en/user-guide/images/workflows_pqm.svg

doc/en/user-guide/images/workflows_shared.png

doc/en/user-guide/images/workflows_shared.svg

doc/en/user-guide/images/workflows_single.png

doc/en/user-guide/images/workflows_single.svg

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/merging_changes.txt

doc/en/user-guide/organizing_branches.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reusing_a_checkout.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/revnos.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/solo_intro.txt

doc/en/user-guide/starting_a_project.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/using_checkouts.txt

doc/en/user-guide/using_gatekeepers.txt

doc/en/user-guide/working_offline_central.txt

doc/en/user-guide/writing_a_plugin.txt

doc/en/user-reference

doc/en/user-reference/readme.txt

doc/index.txt

tools/package_mf.py

files renamed:
bzrlib/help_topics/__init__.py => bzrlib/help_topics.py

bzrlib/_patiencediff_py.py => bzrlib/patiencediff.py

bzrlib/plugins/launchpad/lp_directory.py => bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/test_lp_directory.py => bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/tests/http_utils.py => bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/http_server.py => bzrlib/tests/HttpServer.py

doc/en/user-guide/bug_trackers.txt => doc/bug_trackers.txt

doc/en/tutorials/centralized_workflow.txt => doc/centralized_workflow.txt

bzrlib/help_topics/en/configuration.txt => doc/configuration.txt

bzrlib/help_topics/en/conflicts.txt => doc/conflicts.txt

doc/en/user-guide/http_smart_server.txt => doc/http_smart_server.txt

doc/en/user-guide/index.txt => doc/index.txt

doc/en/user-guide/plugins.txt => doc/plugins.txt

doc/en/user-guide/server.txt => doc/server.txt

doc/en/user-guide/setting_up_email.txt => doc/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt => doc/shared_repository_layouts.txt

doc/en/user-guide/specifying_revisions.txt => doc/specifying_revisions.txt

doc/en/tutorials/tutorial.txt => doc/tutorial.txt

doc/en/user-guide/using_aliases.txt => doc/using_aliases.txt

doc/en/user-guide/version_info.txt => doc/version_info.txt

files modified:
.bzrignore

INSTALL

Makefile

NEWS

README

bzrlib/__init__.py

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/annotate.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/branch.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc/api/__init__.py

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/help.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/sign_my_commits.py

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_write_group.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_multiparent.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml_serializer.py

doc/bazaar-vcs.org.kid

doc/developers/HACKING.txt

doc/developers/bundles.txt

doc/developers/index.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap.txt

doc/developers/performance.dot

doc/developers/profiling.txt

doc/developers/repository.txt

generate_docs.py

setup.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/ostools.py

Show diffs side-by-side

added added

removed removed

bzrlib/pack.py

"""Container format for Bazaar data.

"Containers" and "records" are described in

doc/developers/container-format.txt.

"Containers" and "records" are described in doc/developers/container-format.txt.

"""

from cStringIO import StringIO

raise errors.InvalidRecordError(str(e))

class ContainerSerialiser(object):
    """Produce the byte strings that make up a container.

    The 'begin', 'end' and 'bytes_record' methods each return bytes instead
    of writing them anywhere.  ContainerWriter may be a more convenient
    interface.
    """

    def begin(self):
        """Return the bytes that open a container."""
        return FORMAT_ONE + "\n"

    def end(self):
        """Return the bytes that close a container."""
        return "E"

    def bytes_record(self, bytes, names):
        """Return the serialised form of a Bytes record.

        :param bytes: The contents of the record.
        :param names: An iterable of names for the record.  Each name is a
            sequence of bytestrings; every one of them is passed to
            _check_name before anything is returned.
        :return: A single string made of the kind marker, the length line,
            one line per name (its parts joined with NUL), a blank line
            ending the headers, and finally the contents.
        """
        # Kind marker, then the length of the contents on its own line.
        pieces = ["B", str(len(bytes)) + "\n"]
        for name_parts in names:
            # Validate every part of the name before adding its header
            # line.  Nothing is written here, so a bad name simply
            # propagates whatever _check_name raises and no bytes are
            # returned.
            for part in name_parts:
                _check_name(part)
            pieces.append('\x00'.join(name_parts) + "\n")
        # A blank line terminates the headers; the contents follow.
        pieces.extend(["\n", bytes])
        # XXX: Joining copies the contents in memory.  The original author
        # measured this as usually faster than two write calls (12 vs 13
        # seconds to output a gig of 1k records); results may differ for
        # much larger records, where the copy could cause extreme memory
        # pressure.  A possible improvement is to check the size of the
        # contents before deciding whether to join or to write twice.
        return ''.join(pieces)

106

107

108

class ContainerWriter(object):

109

"""A class for writing containers to a file.

110

111

:attribute records_written: The number of user records added to the

112

container. This does not count the prelude or suffix of the container

113

introduced by the begin() and end() methods.

114

"""

"""A class for writing containers."""

115

116

def __init__(self, write_func):

117

"""Constructor.

121

"""

122

self._write_func = write_func

123

self.current_offset = 0

124

self.records_written = 0

125

self._serialiser = ContainerSerialiser()

126

127

def begin(self):

128

"""Begin writing a container."""

129

self.write_func(self._serialiser.begin())

self.write_func(FORMAT_ONE + "\n")

130

131

def write_func(self, bytes):

132

self._write_func(bytes)

134

135

def end(self):

136

"""Finish writing a container."""

137

self.write_func(self._serialiser.end())

self.write_func("E")

138

139

def add_bytes_record(self, bytes, names):

140

"""Add a Bytes record with the given names.

141

142

:param bytes: The bytes to insert.

143

:param names: The names to give the inserted bytes. Each name is

144

a tuple of bytestrings. The bytestrings may not contain

145

whitespace.

:param names: The names to give the inserted bytes.

146

:return: An offset, length tuple. The offset is the offset

147

of the record within the container, and the length is the

148

length of data that will need to be read to reconstitute the

151

and thus are only suitable for use by a ContainerReader.

152

"""

153

current_offset = self.current_offset

154

serialised_record = self._serialiser.bytes_record(bytes, names)

155

self.write_func(serialised_record)

156

self.records_written += 1

# Kind marker

self.write_func("B")

100

# Length

101

self.write_func(str(len(bytes)) + "\n")

102

# Names

103

for name in names:

104

# Make sure we're writing valid names. Note that we will leave a

105

# half-written record if a name is bad!

106

_check_name(name)

107

self.write_func(name + "\n")

108

# End of headers

109

self.write_func("\n")

110

# Finally, the contents.

111

self.write_func(bytes)

157

112

# return a memo of where we wrote data to allow random access.

158

113

return current_offset, self.current_offset - current_offset

159

114

307

262

all_names = set()

308

263

for record_names, read_bytes in self.iter_records():

309

264

read_bytes(None)

310

for name_tuple in record_names:

311

for name in name_tuple:

312

_check_name_encoding(name)

265

for name in record_names:

266

_check_name_encoding(name)

313

267

# Check that the name is unique. Note that Python will refuse

314

268

# to decode non-shortest forms of UTF-8 encoding, so there is no

315

269

# risk that the same unicode string has been encoded two

316

270

# different ways.

317

if name_tuple in all_names:

318

raise errors.DuplicateRecordNameError(name_tuple)

319

all_names.add(name_tuple)

271

if name in all_names:

272

raise errors.DuplicateRecordNameError(name)

273

all_names.add(name)

320

274

excess_bytes = self.reader_func(1)

321

275

if excess_bytes != '':

322

276

raise errors.ContainerHasExcessDataError(excess_bytes)

346

300

# Read the list of names.

347

301

names = []

348

302

while True:

349

name_line = self._read_line()

350

if name_line == '':

303

name = self._read_line()

304

if name == '':

351

305

break

352

name_tuple = tuple(name_line.split('\x00'))

353

for name in name_tuple:

354

_check_name(name)

355

names.append(name_tuple)

306

_check_name(name)

307

names.append(name)

356

308

357

309

self._remaining_length = length

358

310

return names, self._content_reader

376

328

:raises ContainerError: if this record is invalid.

377

329

"""

378

330

names, read_bytes = self.read()

379

for name_tuple in names:

380

for name in name_tuple:

381

_check_name_encoding(name)

331

for name in names:

332

_check_name_encoding(name)

382

333

read_bytes(None)

383

334

384

385

class ContainerPushParser(object):
    """A "push" parser for container format 1.

    It accepts bytes via the ``accept_bytes`` method, and parses them into
    records which can be retrieved via the ``read_pending_records`` method.

    :attribute finished: Set to True once the end marker ("E") has been
        parsed.
    """

    def __init__(self):
        # Bytes received but not yet consumed by the state machine.
        self._buffer = ''
        # The bound method that handles the current parser state.
        self._state_handler = self._state_expecting_format_line
        # Completed (names, body) records not yet handed to the caller.
        self._parsed_records = []
        self._reset_current_record()
        self.finished = False

    def _reset_current_record(self):
        """Forget the length and names of the record being parsed."""
        self._current_record_length = None
        self._current_record_names = []

    def accept_bytes(self, bytes):
        """Add bytes to the buffer and parse as much of it as possible.

        :param bytes: The next chunk of the container; it may end anywhere,
            including in the middle of a record.
        """
        self._buffer += bytes
        # Keep iterating the state machine until it stops making progress.
        # Progress means either consuming bytes from the buffer or moving to
        # a different state: finishing a zero-length record body consumes
        # nothing, so looking at the buffer length alone would stop early
        # and leave the rest of the buffer unparsed.
        last_buffer_length = None
        cur_buffer_length = len(self._buffer)
        last_state_handler = None
        while (cur_buffer_length != last_buffer_length
               or last_state_handler != self._state_handler):
            last_buffer_length = cur_buffer_length
            last_state_handler = self._state_handler
            self._state_handler()
            cur_buffer_length = len(self._buffer)

    def read_pending_records(self):
        """Return the records parsed since the last call, and forget them.

        :return: A list of (names, body) tuples, where names is a list of
            tuples of name parts.
        """
        records = self._parsed_records
        self._parsed_records = []
        return records

    def _consume_line(self):
        """Take a line out of the buffer, and return the line.

        If a newline byte is not found in the buffer, the buffer is
        unchanged and this returns None instead.
        """
        newline_pos = self._buffer.find('\n')
        if newline_pos != -1:
            line = self._buffer[:newline_pos]
            self._buffer = self._buffer[newline_pos+1:]
            return line
        else:
            return None

    def _state_expecting_format_line(self):
        """Parse the format line that starts the container.

        :raises UnknownContainerFormatError: if the line is not FORMAT_ONE.
        """
        line = self._consume_line()
        if line is not None:
            if line != FORMAT_ONE:
                raise errors.UnknownContainerFormatError(line)
            self._state_handler = self._state_expecting_record_type

    def _state_expecting_record_type(self):
        """Parse the one-byte record kind: "B" (bytes record) or "E" (end).

        :raises UnknownRecordTypeError: for any other kind byte.
        """
        if len(self._buffer) >= 1:
            record_type = self._buffer[0]
            self._buffer = self._buffer[1:]
            if record_type == 'B':
                self._state_handler = self._state_expecting_length
            elif record_type == 'E':
                self.finished = True
                self._state_handler = self._state_expecting_nothing
            else:
                raise errors.UnknownRecordTypeError(record_type)

    def _state_expecting_length(self):
        """Parse the line giving the length of the record body.

        :raises InvalidRecordError: if the line is not an integer.
        """
        line = self._consume_line()
        if line is not None:
            try:
                self._current_record_length = int(line)
            except ValueError:
                raise errors.InvalidRecordError(
                    "%r is not a valid length." % (line,))
            self._state_handler = self._state_expecting_name

    def _state_expecting_name(self):
        """Parse one name line, or the blank line that ends the headers."""
        encoded_name_parts = self._consume_line()
        if encoded_name_parts == '':
            # Blank line: end of headers, the body follows.
            self._state_handler = self._state_expecting_body
        elif encoded_name_parts:
            # A name is a NUL-separated sequence of parts.  (None, meaning
            # no complete line is buffered yet, falls through both tests.)
            name_parts = tuple(encoded_name_parts.split('\x00'))
            for name_part in name_parts:
                _check_name(name_part)
            self._current_record_names.append(name_parts)

    def _state_expecting_body(self):
        """Take the record body once all of it has been buffered."""
        if len(self._buffer) >= self._current_record_length:
            body_bytes = self._buffer[:self._current_record_length]
            self._buffer = self._buffer[self._current_record_length:]
            record = (self._current_record_names, body_bytes)
            self._parsed_records.append(record)
            self._reset_current_record()
            self._state_handler = self._state_expecting_record_type

    def _state_expecting_nothing(self):
        """Terminal state after the end marker; leaves the buffer alone."""
        pass

    def read_size_hint(self):
        """Suggest how many bytes the caller should read next.

        :return: 16384, or the number of bytes still missing from the
            current record body when that is larger.
        """
        hint = 16384
        if self._state_handler == self._state_expecting_body:
            remaining = self._current_record_length - len(self._buffer)
            if remaining < 0:
                remaining = 0
            return max(hint, remaining)
        return hint

492

493

494

def iter_records_from_file(source_file):
    """Iterate over the records of a container read from a file.

    :param source_file: A file-like object; its ``read`` method is called
        with the size suggested by the parser's ``read_size_hint``.
    :return: A generator of the records produced by ContainerPushParser,
        in the order they appear in the container.
    :raises UnexpectedEndOfContainerError: if the file ends before the
        container's end marker has been parsed.
    """
    parser = ContainerPushParser()
    while True:
        bytes = source_file.read(parser.read_size_hint())
        parser.accept_bytes(bytes)
        records = parser.read_pending_records()
        for record in records:
            yield record
        if parser.finished:
            break
        # An empty read means end-of-file.  If that pass still produced
        # records the parser was draining buffered data, so give it another
        # turn; if it produced nothing it can never finish, and looping on
        # would spin forever on a truncated container.
        # NOTE(review): assumes bzrlib.errors provides
        # UnexpectedEndOfContainerError taking no arguments -- confirm.
        if not bytes and not records:
            raise errors.UnexpectedEndOfContainerError()

503

Older »