~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/tuned_gzip.py

Committer: Patch Queue Manager
Date: 2016-02-01 19:56:05 UTC
mfrom: (6615.1.1 trunk)
Revision ID: pqm@pqm.ubuntu.com-20160201195605-o7rl92wf6uyum3fk

(vila) Open trunk again as 2.8b1 (Vincent Ladeuil)

files added:
bzrlib/_termcolor.py

bzrlib/branchfmt

bzrlib/branchfmt/__init__.py

bzrlib/branchfmt/fullhistory.py

bzrlib/plugins/grep

bzrlib/plugins/grep/.bzrignore

bzrlib/plugins/grep/NEWS

bzrlib/plugins/grep/__init__.py

bzrlib/plugins/grep/cmds.py

bzrlib/plugins/grep/grep.py

bzrlib/plugins/grep/test_grep.py

bzrlib/plugins/launchpad/cmds.py

bzrlib/smart/ping.py

bzrlib/tests/blackbox/test_ping.py

bzrlib/tests/blackbox/test_verify_signatures.py

bzrlib/tests/per_tree/test_ids.py

doc/developers/nested-trees.txt

doc/en/release-notes/bzr-2.7.txt

doc/en/release-notes/bzr-2.8.txt

doc/en/user-guide/switch_store.txt

doc/en/whats-new/whats-new-in-2.7.txt

doc/en/whats-new/whats-new-in-2.8.txt

po/cs.po

po/el.po

po/fa.po

po/he.po

po/id.po

po/ko.po

po/my.po

po/nb.po

po/si.po

po/sk.po

po/sr.po

po/sv.po

po/uk.po

po/vi.po

po/zh_CN.po

files removed:
bzrlib/doc_generate/builders

bzrlib/doc_generate/builders/__init__.py

bzrlib/doc_generate/builders/texinfo.py

bzrlib/doc_generate/writers

bzrlib/doc_generate/writers/__init__.py

bzrlib/doc_generate/writers/texinfo.py

bzrlib/tests/doc_generate

bzrlib/tests/doc_generate/__init__.py

bzrlib/tests/doc_generate/builders

bzrlib/tests/doc_generate/builders/__init__.py

bzrlib/tests/doc_generate/builders/test_texinfo.py

bzrlib/tests/doc_generate/writers

bzrlib/tests/doc_generate/writers/__init__.py

bzrlib/tests/doc_generate/writers/test_texinfo.py

bzrlib/tests/per_branch/test_bound_sftp.py

bzrlib/tests/per_branch/test_revision_history.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

files modified:
.bzrignore

INSTALL

Makefile

bzrlib/__init__.py

bzrlib/_walkdirs_win32.pyx

bzrlib/add.py

bzrlib/annotate.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/cmdline.py

bzrlib/commands.py

bzrlib/commit_signature_commands.py

bzrlib/config.py

bzrlib/crash.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/doc_generate/conf.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/filter_tree.py

bzrlib/filters/__init__.py

bzrlib/gpg.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/configuration.txt

bzrlib/hooks.py

bzrlib/i18n.py

bzrlib/inventory.py

bzrlib/library_state.py

bzrlib/lock.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/mergetools.py

bzrlib/missing.py

bzrlib/osutils.py

bzrlib/patches.py

bzrlib/plugins/changelog_merge/tests/test_changelog_merge.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/plugins/netrc_credential_store/tests/test_netrc.py

bzrlib/plugins/weave_fmt/__init__.py

bzrlib/plugins/weave_fmt/branch.py

bzrlib/plugins/weave_fmt/bzrdir.py

bzrlib/plugins/weave_fmt/test_bzrdir.py

bzrlib/plugins/weave_fmt/test_repository.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/remote.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitpack_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repository.py

bzrlib/shelf.py

bzrlib/smart/branch.py

bzrlib/smart/medium.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/store/versioned/__init__.py

bzrlib/switch.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_branches.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_config.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_deleted.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mkdir.py

bzrlib/tests/blackbox/test_modified.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_reference.py

bzrlib/tests/blackbox/test_remember_option.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_rmbranch.py

bzrlib/tests/blackbox/test_script.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_unknowns.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_view.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/features.py

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/per_branch/__init__.py

bzrlib/tests/per_branch/test_branch.py

bzrlib/tests/per_branch/test_check.py

bzrlib/tests/per_branch/test_config.py

bzrlib/tests/per_branch/test_get_revision_id_to_revno_map.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_last_revision_info.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_permissions.py

bzrlib/tests/per_branch/test_pull.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_branch/test_reconcile.py

bzrlib/tests/per_branch/test_revision_id_to_revno.py

bzrlib/tests/per_branch/test_stacking.py

bzrlib/tests/per_branch/test_tags.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_controldir/test_controldir.py

bzrlib/tests/per_controldir/test_push.py

bzrlib/tests/per_controldir_colo/test_supported.py

bzrlib/tests/per_controldir_colo/test_unsupported.py

bzrlib/tests/per_foreign_vcs/test_branch.py

bzrlib/tests/per_interbranch/__init__.py

bzrlib/tests/per_interbranch/test_fetch.py

bzrlib/tests/per_interbranch/test_pull.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interrepository/__init__.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_inventory/basics.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_file_graph.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_signatures.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_graph.py

bzrlib/tests/per_repository_vf/test_fileid_involved.py

bzrlib/tests/per_repository_vf/test_reconcile.py

bzrlib/tests/per_repository_vf/test_repository.py

bzrlib/tests/per_repository_vf/test_write_group.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree/__init__.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_tree.py

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree/__init__.py

bzrlib/tests/per_workingtree/test_basis_inventory.py

bzrlib/tests/per_workingtree/test_commit.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_eol_conversion.py

bzrlib/tests/per_workingtree/test_executable.py

bzrlib/tests/per_workingtree/test_parents.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_remove.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_symlinks.py

bzrlib/tests/per_workingtree/test_views.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/test__bencode.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cethread.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_chk_serializer.py

bzrlib/tests/test_clean_tree.py

bzrlib/tests/test_cmdline.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_controldir.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_debug.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_email_message.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export.py

bzrlib/tests/test_export_pot.py

bzrlib/tests/test_features.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_filter_tree.py

bzrlib/tests/test_filters.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_urllib.py

bzrlib/tests/test_i18n.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_import_tariff.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_inventory_delta.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_matchers.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_mergetools.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_rules.py

bzrlib/tests/test_scenarios.py

bzrlib/tests/test_script.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_store.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_test_server.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_upgrade_stacked.py

bzrlib/tests/test_url_policy_open.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_utextwrap.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/gio_transport.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/version.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml_serializer.py

doc/developers/HACKING.txt

doc/developers/authentication-ring.txt

doc/developers/code-style.txt

doc/developers/conf.py

doc/developers/configuration.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/plans.txt

doc/developers/releasing.txt

doc/developers/xdg_config_spec.txt

doc/en/Makefile

doc/en/_static/en/bzr-en-quick-reference.svg

doc/en/_templates/index.html

doc/en/admin-guide/introduction.txt

doc/en/conf.py

doc/en/index.txt

doc/en/mini-tutorial/index.txt

doc/en/release-notes/bzr-2.4.txt

doc/en/release-notes/bzr-2.5.txt

doc/en/release-notes/bzr-2.6.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/whats-new/whats-new-in-2.5.txt

doc/en/whats-new/whats-new-in-2.6.txt

doc/es/_static/es/bzr-es-quick-reference.svg

doc/es/conf.py

doc/ja/conf.py

doc/ja/user-guide/http_smart_server.txt

doc/ru/_static/ru/bzr-ru-quick-reference.svg

doc/ru/conf.py

po/ar.po

po/ast.po

po/bs.po

po/bzr.pot

po/ca.po

po/de.po

po/en_AU.po

po/en_GB.po

po/es.po

po/fo.po

po/fr.po

po/gl.po

po/it.po

po/ja.po

po/ms.po

po/nl.po

po/oc.po

po/pl.po

po/pt_BR.po

po/ro.po

po/ru.po

po/sco.po

po/tr.po

po/ug.po

setup.py

tools/generate_docs.py

Show diffs side-by-side

added added

removed removed

bzrlib/tuned_gzip.py

127

DeprecationWarning, stacklevel=2)

128

gzip.GzipFile.__init__(self, *args, **kwargs)

129

130

def _add_read_data(self, data):

131

# 4169 calls in 183

132

# temp var for len(data) and switch to +='s.

133

# 4169 in 139

134

len_data = len(data)

135

self.crc = zlib.crc32(data, self.crc)

136

self.extrabuf += data

137

self.extrasize += len_data

138

self.size += len_data

130

if sys.version_info >= (2, 7, 4):

131

def _add_read_data(self, data):

132

# 4169 calls in 183

133

# temp var for len(data) and switch to +='s.

134

# 4169 in 139

135

len_data = len(data)

136

self.crc = zlib.crc32(data, self.crc) & 0xffffffffL

137

offset = self.offset - self.extrastart

138

self.extrabuf = self.extrabuf[offset:] + data

139

self.extrasize = self.extrasize + len_data

140

self.extrastart = self.offset

141

self.size = self.size + len_data

142

else:

143

def _add_read_data(self, data):

144

# 4169 calls in 183

145

# temp var for len(data) and switch to +='s.

146

# 4169 in 139

147

len_data = len(data)

148

self.crc = zlib.crc32(data, self.crc)

149

self.extrabuf += data

150

self.extrasize += len_data

151

self.size += len_data

139

152

140

153

def _write_gzip_header(self):

141

154

"""A tuned version of gzip._write_gzip_header

161

174

'' # self.fileobj.write(fname + '\000')

162

175

)

163

176

164

def _read(self, size=1024):

165

# various optimisations:

166

# reduces lsprof count from 2500 to

167

# 8337 calls in 1272, 365 internal

168

if self.fileobj is None:

169

raise EOFError, "Reached EOF"

170

171

if self._new_member:

172

# If the _new_member flag is set, we have to

173

# jump to the next member, if there is one.

174

175

# First, check if we're at the end of the file;

176

# if so, it's time to stop; no more members to read.

177

next_header_bytes = self.fileobj.read(10)

178

if next_header_bytes == '':

177

if sys.version_info < (2, 7, 4):

178

def _read(self, size=1024):

179

# various optimisations:

180

# reduces lsprof count from 2500 to

181

# 8337 calls in 1272, 365 internal

182

if self.fileobj is None:

179

183

raise EOFError, "Reached EOF"

180

184

181

self._init_read()

182

self._read_gzip_header(next_header_bytes)

183

self.decompress = zlib.decompressobj(-zlib.MAX_WBITS)

184

self._new_member = False

185

186

# Read a chunk of data from the file

187

buf = self.fileobj.read(size)

188

189

# If the EOF has been reached, flush the decompression object

190

# and mark this object as finished.

191

192

if buf == "":

193

self._add_read_data(self.decompress.flush())

194

if len(self.decompress.unused_data) < 8:

195

raise AssertionError("what does flush do?")

196

self._gzip_tail = self.decompress.unused_data[0:8]

197

self._read_eof()

198

# tell the driving read() call we have stuffed all the data

199

# in self.extrabuf

200

raise EOFError, 'Reached EOF'

201

202

self._add_read_data(self.decompress.decompress(buf))

203

204

if self.decompress.unused_data != "":

205

# Ending case: we've come to the end of a member in the file,

206

# so seek back to the start of the data for the next member which

207

# is the length of the decompress objects unused data - the first

208

# 8 bytes for the end crc and size records.

209

210

# so seek back to the start of the unused data, finish up

211

# this member, and read a new gzip header.

212

# (The number of bytes to seek back is the length of the unused

213

# data, minus 8 because those 8 bytes are part of this member.

214

seek_length = len (self.decompress.unused_data) - 8

215

if seek_length > 0:

216

# we read too much data

217

self.fileobj.seek(-seek_length, 1)

185

if self._new_member:

186

# If the _new_member flag is set, we have to

187

# jump to the next member, if there is one.

188

189

# First, check if we're at the end of the file;

190

# if so, it's time to stop; no more members to read.

191

next_header_bytes = self.fileobj.read(10)

192

if next_header_bytes == '':

193

raise EOFError, "Reached EOF"

194

195

self._init_read()

196

self._read_gzip_header(next_header_bytes)

197

self.decompress = zlib.decompressobj(-zlib.MAX_WBITS)

198

self._new_member = False

199

200

# Read a chunk of data from the file

201

buf = self.fileobj.read(size)

202

203

# If the EOF has been reached, flush the decompression object

204

# and mark this object as finished.

205

206

if buf == "":

207

self._add_read_data(self.decompress.flush())

208

if len(self.decompress.unused_data) < 8:

209

raise AssertionError("what does flush do?")

218

210

self._gzip_tail = self.decompress.unused_data[0:8]

219

elif seek_length < 0:

220

# we haven't read enough to check the checksum.

221

if not (-8 < seek_length):

222

raise AssertionError("too great a seek")

223

buf = self.fileobj.read(-seek_length)

224

self._gzip_tail = self.decompress.unused_data + buf

225

else:

226

self._gzip_tail = self.decompress.unused_data

227

228

# Check the CRC and file size, and set the flag so we read

229

# a new member on the next call

230

self._read_eof()

231

self._new_member = True

232

233

def _read_eof(self):

234

"""tuned to reduce function calls and eliminate file seeking:

235

pass 1:

236

reduces lsprof count from 800 to 288

237

4168 in 296

238

avoid U32 call by using struct format L

239

4168 in 200

240

"""

241

# We've read to the end of the file, so we should have 8 bytes of

242

# unused data in the decompressor. If we don't, there is a corrupt file.

243

# We use these 8 bytes to calculate the CRC and the recorded file size.

244

# We then check the that the computed CRC and size of the

245

# uncompressed data matches the stored values. Note that the size

246

# stored is the true file size mod 2**32.

247

if not (len(self._gzip_tail) == 8):

248

raise AssertionError("gzip trailer is incorrect length.")

249

crc32, isize = struct.unpack("<LL", self._gzip_tail)

250

# note that isize is unsigned - it can exceed 2GB

251

if crc32 != U32(self.crc):

252

raise IOError, "CRC check failed %d %d" % (crc32, U32(self.crc))

253

elif isize != LOWU32(self.size):

254

raise IOError, "Incorrect length of data produced"

211

self._read_eof()

212

# tell the driving read() call we have stuffed all the data

213

# in self.extrabuf

214

raise EOFError, 'Reached EOF'

215

216

self._add_read_data(self.decompress.decompress(buf))

217

218

if self.decompress.unused_data != "":

219

# Ending case: we've come to the end of a member in the file,

220

# so seek back to the start of the data for the next member

221

# which is the length of the decompress objects unused data -

222

# the first 8 bytes for the end crc and size records.

223

224

# so seek back to the start of the unused data, finish up

225

# this member, and read a new gzip header.

226

# (The number of bytes to seek back is the length of the unused

227

# data, minus 8 because those 8 bytes are part of this member.

228

seek_length = len (self.decompress.unused_data) - 8

229

if seek_length > 0:

230

# we read too much data

231

self.fileobj.seek(-seek_length, 1)

232

self._gzip_tail = self.decompress.unused_data[0:8]

233

elif seek_length < 0:

234

# we haven't read enough to check the checksum.

235

if not (-8 < seek_length):

236

raise AssertionError("too great a seek")

237

buf = self.fileobj.read(-seek_length)

238

self._gzip_tail = self.decompress.unused_data + buf

239

else:

240

self._gzip_tail = self.decompress.unused_data

241

242

# Check the CRC and file size, and set the flag so we read

243

# a new member on the next call

244

self._read_eof()

245

self._new_member = True

246

247

def _read_eof(self):

248

"""tuned to reduce function calls and eliminate file seeking:

249

pass 1:

250

reduces lsprof count from 800 to 288

251

4168 in 296

252

avoid U32 call by using struct format L

253

4168 in 200

254

"""

255

# We've read to the end of the file, so we should have 8 bytes of

256

# unused data in the decompressor. If we don't, there is a corrupt

257

# file. We use these 8 bytes to calculate the CRC and the recorded

258

# file size. We then check the that the computed CRC and size of

259

# the uncompressed data matches the stored values. Note that the

260

# size stored is the true file size mod 2**32.

261

if not (len(self._gzip_tail) == 8):

262

raise AssertionError("gzip trailer is incorrect length.")

263

crc32, isize = struct.unpack("<LL", self._gzip_tail)

264

# note that isize is unsigned - it can exceed 2GB

265

if crc32 != U32(self.crc):

266

raise IOError, "CRC check failed %d %d" % (crc32, U32(self.crc))

267

elif isize != LOWU32(self.size):

268

raise IOError, "Incorrect length of data produced"

255

269

256

270

def _read_gzip_header(self, bytes=None):

257

271

"""Supply bytes if the minimum header size is already read.

Older »