~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Michael Ellerman
Date: 2005-12-10 22:11:46 UTC
mto: This revision was merged to the branch mainline in revision 1528.
Revision ID: michael@ellerman.id.au-20051210221145-7765347ea4ca0093

Raise NoSuchFile when someone tries to add a non-existent file.

files added:
bzrlib/clone.py

bzrlib/merge_core.py

bzrlib/tests/test_reweave.py

bzrlib/util/configobj/validate.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

files removed:
BRANCH.TODO

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/read_bundle.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v07.py

bzrlib/bzrdir.py

bzrlib/decorators.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/sign_my_commits.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned

bzrlib/symbol_versioning.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/transform.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/readonly.py

bzrlib/tuned_gzip.py

bzrlib/urlutils.py

bzrlib/versionedfile.py

bzrlib/weave_commands.py

doc/README.1st

doc/configuration.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/using_aliases.txt

generate_docs.py

tools/__init__.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

files renamed:
tools/doc_generate/autodoc_man.py => bzr_man.py

bzrlib/bundle/__init__.py => bzrlib/changeset.py

bzrlib/store/versioned/__init__.py => bzrlib/store/weave.py

bzrlib/tests/blackbox/test_annotate.py => bzrlib/tests/test_annotate.py

bzrlib/tests/branch_implementations/test_branch.py => bzrlib/tests/test_branch.py

bzrlib/tests/branch_implementations/test_parent.py => bzrlib/tests/test_parent.py

bzrlib/tests/blackbox/test_revision_info.py => bzrlib/tests/test_revision_info.py

bzrlib/tests/test_sftp_transport.py => bzrlib/tests/test_sftp.py

bzrlib/tests/blackbox/test_status.py => bzrlib/tests/test_status.py

bzrlib/tests/blackbox/test_uncommit.py => bzrlib/tests/test_uncommit.py

bzrlib/transport/http/__init__.py => bzrlib/transport/http.py

bzrlib/xml_serializer.py => bzrlib/xml.py

doc/tutorial.txt => tutorial.txt

files modified:
.bzrignore

HACKING

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_store.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/pwk

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Base implementation of Transport over http.

There are separate implementation modules for each http client implementation.

"""Implementation of Transport over http.

"""

import errno

import os

from collections import deque

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError)

import os, errno

from cStringIO import StringIO

import re

import urllib, urllib2

import urlparse

import urllib

from warnings import warn

from bzrlib.transport import Transport, register_transport, Server

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError, InvalidURL)

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

# TODO: load these only when running http tests

import BaseHTTPServer, SimpleHTTPServer, socket, time

import threading

from bzrlib.ui import ui_factory

def extract_auth(url, password_manager):

"""Extract auth parameters from an HTTP/HTTPS url and add them to the given

"""

Extract auth parameters from an HTTP/HTTPS url and add them to the given

password manager. Return the url, minus those auth parameters (which

confuse urllib2).

"""

assert re.match(r'^(https?)(\+\w+)?://', url), \

'invalid absolute url %r' % url

scheme, netloc, path, query, fragment = urlparse.urlsplit(url)

if '@' in netloc:

auth, netloc = netloc.split('@', 1)

assert url.startswith('http://') or url.startswith('https://')

scheme, host = url.split('//', 1)

if '/' in host:

host, path = host.split('/', 1)

path = '/' + path

else:

path = ''

port = ''

if '@' in host:

auth, host = host.split('@', 1)

if ':' in auth:

username, password = auth.split(':', 1)

else:

username, password = auth, None

if ':' in netloc:

host = netloc.split(':', 1)[0]

else:

host = netloc

username = urllib.unquote(username)

if ':' in host:

host, port = host.split(':', 1)

port = ':' + port

# FIXME: if password isn't given, should we ask for it?

if password is not None:

username = urllib.unquote(username)

password = urllib.unquote(password)

else:

password = ui_factory.get_password(prompt='HTTP %(user)@%(host) password',

user=username, host=host)

password_manager.add_password(None, host, username, password)

url = urlparse.urlunsplit((scheme, netloc, path, query, fragment))

password_manager.add_password(None, host, username, password)

url = scheme + '//' + host + port + path

return url

class HttpTransportBase(Transport):

"""Base class for http implementations.

Does URL parsing, etc, but not any network IO.

The protocol can be given as e.g. http+urllib://host/ to use a particular

implementation.

def get_url(url):

import urllib2

mutter("get_url %s" % url)

manager = urllib2.HTTPPasswordMgrWithDefaultRealm()

url = extract_auth(url, manager)

auth_handler = urllib2.HTTPBasicAuthHandler(manager)

opener = urllib2.build_opener(auth_handler)

url_f = opener.open(url)

return url_f

class HttpTransport(Transport):

"""This is the transport agent for http:// access.

TODO: Implement pipelined versions of all of the *_multi() functions.

"""

# _proto: "http" or "https"

# _qualified_proto: may have "+pycurl", etc

def __init__(self, base):

"""Set the base path where files will be stored."""

proto_match = re.match(r'^(https?)(\+\w+)?://', base)

if not proto_match:

raise AssertionError("not a http url: %r" % base)

self._proto = proto_match.group(1)

impl_name = proto_match.group(2)

if impl_name:

impl_name = impl_name[1:]

self._impl_name = impl_name

if base[-1] != '/':

base = base + '/'

super(HttpTransportBase, self).__init__(base)

assert base.startswith('http://') or base.startswith('https://')

super(HttpTransport, self).__init__(base)

# In the future we might actually connect to the remote host

# rather than using get_url

# self._connection = None

100

(apparent_proto, self._host,

(self._proto, self._host,

101

self._path, self._parameters,

102

self._query, self._fragment) = urlparse.urlparse(self.base)

103

self._qualified_proto = apparent_proto

def should_cache(self):

"""Return True if the data pulled across should be cached locally.

"""

return True

def clone(self, offset=None):

"""Return a new HttpTransport with root at self.base + offset

For now HttpTransport does not actually connect, so just return

a new HttpTransport object.

"""

100

if offset is None:

101

return HttpTransport(self.base)

102

else:

103

return HttpTransport(self.abspath(offset))

104

105

def abspath(self, relpath):

106

"""Return the full url to the given relative path.

107

108

This can be supplied with a string or a list.

109

110

The URL returned always has the protocol scheme originally used to

111

construct the transport, even if that includes an explicit

112

implementation qualifier.

107

This can be supplied with a string or a list

113

108

"""

114

109

assert isinstance(relpath, basestring)

115

if isinstance(relpath, unicode):

116

raise InvalidURL(relpath, 'paths must not be unicode.')

117

110

if isinstance(relpath, basestring):

118

111

relpath_parts = relpath.split('/')

119

112

else:

144

137

# I'm concerned about when it chooses to strip the last

145

138

# portion of the path, and when it doesn't.

146

139

path = '/'.join(basepath)

147

if path == '':

148

path = '/'

149

result = urlparse.urlunparse((self._qualified_proto,

150

self._host, path, '', '', ''))

151

return result

152

153

def _real_abspath(self, relpath):

154

"""Produce absolute path, adjusting protocol if needed"""

155

abspath = self.abspath(relpath)

156

qp = self._qualified_proto

157

rp = self._proto

158

if self._qualified_proto != self._proto:

159

abspath = rp + abspath[len(qp):]

160

if not isinstance(abspath, str):

161

# escaping must be done at a higher level

162

abspath = abspath.encode('ascii')

163

return abspath

140

return urlparse.urlunparse((self._proto,

141

self._host, path, '', '', ''))

164

142

165

143

def has(self, relpath):

166

raise NotImplementedError("has() is abstract on %r" % self)

167

168

def get(self, relpath):

144

"""Does the target location exist?

145

146

TODO: HttpTransport.has() should use a HEAD request,

147

not a full GET request.

148

149

TODO: This should be changed so that we don't use

150

urllib2 and get an exception, the code path would be

151

cleaner if we just do an http HEAD request, and parse

152

the return code.

153

"""

154

path = relpath

155

try:

156

path = self.abspath(relpath)

157

f = get_url(path)

158

# Without the read and then close()

159

# we tend to have busy sockets.

160

f.read()

161

f.close()

162

return True

163

except urllib2.URLError, e:

164

mutter('url error code: %s for has url: %r', e.code, path)

165

if e.code == 404:

166

return False

167

raise

168

except IOError, e:

169

mutter('io error: %s %s for has url: %r',

170

e.errno, errno.errorcode.get(e.errno), path)

171

if e.errno == errno.ENOENT:

172

return False

173

raise TransportError(orig_error=e)

174

175

def get(self, relpath, decode=False):

169

176

"""Get the file at the given relative path.

170

177

171

178

:param relpath: The relative path to the file

172

179

"""

173

code, response_file = self._get(relpath, None)

174

return response_file

175

176

def _get(self, relpath, ranges):

177

"""Get a file, or part of a file.

178

179

:param relpath: Path relative to transport base URL

180

:param ranges: None to get the whole file;

181

or [(start,end)] to fetch parts of a file.

182

183

:returns: (http_code, result_file)

184

185

Note that the current http implementations can only fetch one range at

186

a time through this call.

187

"""

188

raise NotImplementedError(self._get)

189

190

def readv(self, relpath, offsets):

191

"""Get parts of the file at the given relative path.

192

193

:param offsets: A list of (offset, size) tuples.

194

:return: A list or generator of (offset, data) tuples

195

"""

196

# Ideally we would pass one big request asking for all the ranges in

197

# one go; however then the server will give a multipart mime response

198

# back, and we can't parse them yet. So instead we just get one range

199

# per region, and try to coalesce the regions as much as possible.

200

201

# The read-coalescing code is not quite regular enough to have a

202

# single driver routine and

203

# helper method in Transport.

204

def do_combined_read(combined_offsets):

205

# read one coalesced block

206

total_size = 0

207

for offset, size in combined_offsets:

208

total_size += size

209

mutter('readv coalesced %d reads.', len(combined_offsets))

210

offset = combined_offsets[0][0]

211

byte_range = (offset, offset + total_size - 1)

212

code, result_file = self._get(relpath, [byte_range])

213

if code == 206:

214

for off, size in combined_offsets:

215

result_bytes = result_file.read(size)

216

assert len(result_bytes) == size

217

yield off, result_bytes

218

elif code == 200:

219

data = result_file.read(offset + total_size)[offset:offset + total_size]

220

pos = 0

221

for offset, size in combined_offsets:

222

yield offset, data[pos:pos + size]

223

pos += size

224

del data

225

if not len(offsets):

226

return

227

pending_offsets = deque(offsets)

228

combined_offsets = []

229

while len(pending_offsets):

230

offset, size = pending_offsets.popleft()

231

if not combined_offsets:

232

combined_offsets = [[offset, size]]

233

else:

234

if (len (combined_offsets) < 500 and

235

combined_offsets[-1][0] + combined_offsets[-1][1] == offset):

236

# compatible offset:

237

combined_offsets.append([offset, size])

238

else:

239

# incompatible, or over the threshold issue a read and yield

240

pending_offsets.appendleft((offset, size))

241

for result in do_combined_read(combined_offsets):

242

yield result

243

combined_offsets = []

244

# whatever is left is a single coalesced request

245

if len(combined_offsets):

246

for result in do_combined_read(combined_offsets):

247

yield result

248

249

def put(self, relpath, f, mode=None):

180

path = relpath

181

try:

182

path = self.abspath(relpath)

183

return get_url(path)

184

except urllib2.HTTPError, e:

185

mutter('url error code: %s for has url: %r', e.code, path)

186

if e.code == 404:

187

raise NoSuchFile(path, extra=e)

188

raise

189

except (BzrError, IOError), e:

190

if hasattr(e, 'errno'):

191

mutter('io error: %s %s for has url: %r',

192

e.errno, errno.errorcode.get(e.errno), path)

193

if e.errno == errno.ENOENT:

194

raise NoSuchFile(path, extra=e)

195

raise ConnectionError(msg = "Error retrieving %s: %s"

196

% (self.abspath(relpath), str(e)),

197

orig_error=e)

198

199

def put(self, relpath, f):

250

200

"""Copy the file-like or string object into the location.

251

201

252

202

:param relpath: Location to put the contents, relative to base.

254

204

"""

255

205

raise TransportNotPossible('http PUT not supported')

256

206

257

def mkdir(self, relpath, mode=None):

207

def mkdir(self, relpath):

258

208

"""Create a directory at the given path."""

259

209

raise TransportNotPossible('http does not support mkdir()')

260

210

261

def rmdir(self, relpath):

262

"""See Transport.rmdir."""

263

raise TransportNotPossible('http does not support rmdir()')

264

265

211

def append(self, relpath, f):

266

212

"""Append the text in the file-like object into the final

267

213

location.

272

218

"""Copy the item at rel_from to the location at rel_to"""

273

219

raise TransportNotPossible('http does not support copy()')

274

220

275

def copy_to(self, relpaths, other, mode=None, pb=None):

221

def copy_to(self, relpaths, other, pb=None):

276

222

"""Copy a set of entries from self into another Transport.

277

223

278

224

:param relpaths: A list/generator of entries to be copied.

283

229

# At this point HttpTransport might be able to check and see if

284

230

# the remote location is the same, and rather than download, and

285

231

# then upload, it could just issue a remote copy_this command.

286

if isinstance(other, HttpTransportBase):

232

if isinstance(other, HttpTransport):

287

233

raise TransportNotPossible('http cannot be the target of copy_to()')

288

234

else:

289

return super(HttpTransportBase, self).\

290

copy_to(relpaths, other, mode=mode, pb=pb)

235

return super(HttpTransport, self).copy_to(relpaths, other, pb=pb)

291

236

292

237

def move(self, rel_from, rel_to):

293

238

"""Move the item at rel_from to the location at rel_to"""

297

242

"""Delete the item at relpath"""

298

243

raise TransportNotPossible('http does not support delete()')

299

244

300

def is_readonly(self):

301

"""See Transport.is_readonly."""

302

return True

303

304

245

def listable(self):

305

246

"""See Transport.listable."""

306

247

return False

330

271

:return: A lock object, which should be passed to Transport.unlock()

331

272

"""

332

273

raise TransportNotPossible('http does not support lock_write()')

333

334

def clone(self, offset=None):

335

"""Return a new HttpTransportBase with root at self.base + offset

336

For now HttpTransportBase does not actually connect, so just return

337

a new HttpTransportBase object.

338

"""

339

if offset is None:

340

return self.__class__(self.base)

341

else:

342

return self.__class__(self.abspath(offset))

343

344

#---------------- test server facilities ----------------

345

# TODO: load these only when running tests

346

347

348

class WebserverNotAvailable(Exception):

349

pass

350

351

352

class BadWebserverPath(ValueError):

353

def __str__(self):

354

return 'path %s is not in %s' % self.args

355

356

357

class TestingHTTPRequestHandler(SimpleHTTPServer.SimpleHTTPRequestHandler):

358

359

def log_message(self, format, *args):

360

self.server.test_case.log('webserver - %s - - [%s] %s "%s" "%s"',

361

self.address_string(),

362

self.log_date_time_string(),

363

format % args,

364

self.headers.get('referer', '-'),

365

self.headers.get('user-agent', '-'))

366

367

def handle_one_request(self):

368

"""Handle a single HTTP request.

369

370

You normally don't need to override this method; see the class

371

__doc__ string for information on how to handle specific HTTP

372

commands such as GET and POST.

373

374

"""

375

for i in xrange(1,11): # Don't try more than 10 times

376

try:

377

self.raw_requestline = self.rfile.readline()

378

except socket.error, e:

379

if e.args[0] in (errno.EAGAIN, errno.EWOULDBLOCK):

380

# omitted for now because some tests look at the log of

381

# the server and expect to see no errors. see recent

382

# email thread. -- mbp 20051021.

383

## self.log_message('EAGAIN (%d) while reading from raw_requestline' % i)

384

time.sleep(0.01)

385

continue

386

raise

387

else:

388

break

389

if not self.raw_requestline:

390

self.close_connection = 1

391

return

392

if not self.parse_request(): # An error code has been sent, just exit

393

return

394

mname = 'do_' + self.command

395

if not hasattr(self, mname):

396

self.send_error(501, "Unsupported method (%r)" % self.command)

397

return

398

method = getattr(self, mname)

399

method()

400

401

402

class TestingHTTPServer(BaseHTTPServer.HTTPServer):

403

def __init__(self, server_address, RequestHandlerClass, test_case):

404

BaseHTTPServer.HTTPServer.__init__(self, server_address,

405

RequestHandlerClass)

406

self.test_case = test_case

407

408

class HttpServer(Server):

409

"""A test server for http transports."""

410

411

# used to form the url that connects to this server

412

_url_protocol = 'http'

413

414

def _http_start(self):

415

httpd = None

416

httpd = TestingHTTPServer(('localhost', 0),

417

TestingHTTPRequestHandler,

418

self)

419

host, port = httpd.socket.getsockname()

420

self._http_base_url = '%s://localhost:%s/' % (self._url_protocol, port)

421

self._http_starting.release()

422

httpd.socket.settimeout(0.1)

423

424

while self._http_running:

425

try:

426

httpd.handle_request()

427

except socket.timeout:

428

pass

429

430

def _get_remote_url(self, path):

431

path_parts = path.split(os.path.sep)

432

if os.path.isabs(path):

433

if path_parts[:len(self._local_path_parts)] != \

434

self._local_path_parts:

435

raise BadWebserverPath(path, self.test_dir)

436

remote_path = '/'.join(path_parts[len(self._local_path_parts):])

437

else:

438

remote_path = '/'.join(path_parts)

439

440

self._http_starting.acquire()

441

self._http_starting.release()

442

return self._http_base_url + remote_path

443

444

def log(self, format, *args):

445

"""Capture Server log output."""

446

self.logs.append(format % args)

447

448

def setUp(self):

449

"""See bzrlib.transport.Server.setUp."""

450

self._home_dir = os.getcwdu()

451

self._local_path_parts = self._home_dir.split(os.path.sep)

452

self._http_starting = threading.Lock()

453

self._http_starting.acquire()

454

self._http_running = True

455

self._http_base_url = None

456

self._http_thread = threading.Thread(target=self._http_start)

457

self._http_thread.setDaemon(True)

458

self._http_thread.start()

459

self._http_proxy = os.environ.get("http_proxy")

460

if self._http_proxy is not None:

461

del os.environ["http_proxy"]

462

self.logs = []

463

464

def tearDown(self):

465

"""See bzrlib.transport.Server.tearDown."""

466

self._http_running = False

467

self._http_thread.join()

468

if self._http_proxy is not None:

469

import os

470

os.environ["http_proxy"] = self._http_proxy

471

472

def get_url(self):

473

"""See bzrlib.transport.Server.get_url."""

474

return self._get_remote_url(self._home_dir)

475

476

def get_bogus_url(self):

477

"""See bzrlib.transport.Server.get_bogus_url."""

478

# this is chosen to try to prevent trouble with proxies, weird dns,

479

# etc

480

return 'http://127.0.0.1:1/'

481

Older »