~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Robert Collins
Date: 2005-10-09 23:12:35 UTC
Revision ID: robertc@robertcollins.net-20051009231235-93626e72cac71b78

clean up test dirs on make clean

files added:
bzrlib/clone.py

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/revfile.py

bzrlib/store/compressed_text.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

files removed:
BRANCH.TODO

INSTALL

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/read_bundle.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v07.py

bzrlib/bzrdir.py

bzrlib/config.py

bzrlib/decorators.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/gpg.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/option.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/rio.py

bzrlib/sign_my_commits.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_api.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_config.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_http.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/transform.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/versionedfile.py

bzrlib/weave_commands.py

bzrlib/win32console.py

doc/README.1st

doc/configuration.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/using_aliases.txt

generate_docs.py

tools/__init__.py

tools/biobench.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/riodemo.py

tools/trace-revisions

files renamed:
tools/doc_generate/autodoc_man.py => bzr-man.py

bzrlib/bundle/__init__.py => bzrlib/changeset.py

bzrlib/conflicts.py => bzrlib/plugins/conflicts.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/branch_implementations/test_parent.py => bzrlib/selftest/test_parent.py

bzrlib/tests/blackbox/test_revision_info.py => bzrlib/selftest/test_revision_info.py

bzrlib/tests/branch_implementations/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_fetch.py => bzrlib/selftest/testfetch.py

bzrlib/tests/test_graph.py => bzrlib/selftest/testgraph.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_identitymap.py => bzrlib/selftest/testidentitymap.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge.py => bzrlib/selftest/testmerge.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/test_sampler.py => bzrlib/selftest/testsampler.py

bzrlib/tests/blackbox/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/test_store.py => bzrlib/selftest/teststore.py

bzrlib/tests/test_transactions.py => bzrlib/selftest/testtransactions.py

bzrlib/tests/test_transport.py => bzrlib/selftest/testtransport.py

bzrlib/tests/test_workingtree.py => bzrlib/selftest/testworkingtree.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/versioned/__init__.py => bzrlib/store/weave.py

bzrlib/transport/http/__init__.py => bzrlib/transport/http.py

bzrlib/ui/__init__.py => bzrlib/ui.py

bzrlib/xml_serializer.py => bzrlib/xml.py

doc/tutorial.txt => tutorial.txt

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_conflicts.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_upgrade.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/treeshape.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transport/__init__.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/pwk

contrib/zsh/_bzr

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Base implementation of Transport over http.

There are separate implementation modules for each http client implementation.

"""Implementation of Transport over http.

"""

import errno

import os

from collections import deque

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

NonRelativePath, TransportError)

import os, errno

from cStringIO import StringIO

import re

import urllib2

import urlparse

import urllib

from warnings import warn

from bzrlib.transport import Transport, register_transport, Server

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError, InvalidURL)

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

# TODO: load these only when running http tests

import BaseHTTPServer, SimpleHTTPServer, socket, time

import threading

from bzrlib.ui import ui_factory

def extract_auth(url, password_manager):

"""Extract auth parameters from am HTTP/HTTPS url and add them to the given

password manager. Return the url, minus those auth parameters (which

confuse urllib2).

"""

assert re.match(r'^(https?)(\+\w+)?://', url), \

'invalid absolute url %r' % url

scheme, netloc, path, query, fragment = urlparse.urlsplit(url)

# velocitynet.com.au transparently proxies connections and thereby

# breaks keep-alive -- sucks!

def get_url(url):

import urllib2

mutter("get_url %s" % url)

url_f = urllib2.urlopen(url)

return url_f

class HttpTransportError(TransportError):

pass

class HttpTransport(Transport):

"""This is the transport agent for http:// access.

if '@' in netloc:

auth, netloc = netloc.split('@', 1)

if ':' in auth:

username, password = auth.split(':', 1)

else:

username, password = auth, None

if ':' in netloc:

host = netloc.split(':', 1)[0]

else:

host = netloc

username = urllib.unquote(username)

if password is not None:

password = urllib.unquote(password)

else:

password = ui_factory.get_password(prompt='HTTP %(user)@%(host) password',

user=username, host=host)

password_manager.add_password(None, host, username, password)

url = urlparse.urlunsplit((scheme, netloc, path, query, fragment))

return url

class HttpTransportBase(Transport):

"""Base class for http implementations.

Does URL parsing, etc, but not any network IO.

The protocol can be given as e.g. http+urllib://host/ to use a particular

implementation.

TODO: Implement pipelined versions of all of the *_multi() functions.

"""

# _proto: "http" or "https"

# _qualified_proto: may have "+pycurl", etc

def __init__(self, base):

"""Set the base path where files will be stored."""

proto_match = re.match(r'^(https?)(\+\w+)?://', base)

if not proto_match:

raise AssertionError("not a http url: %r" % base)

self._proto = proto_match.group(1)

impl_name = proto_match.group(2)

if impl_name:

impl_name = impl_name[1:]

self._impl_name = impl_name

if base[-1] != '/':

base = base + '/'

super(HttpTransportBase, self).__init__(base)

assert base.startswith('http://') or base.startswith('https://')

super(HttpTransport, self).__init__(base)

# In the future we might actually connect to the remote host

# rather than using get_url

# self._connection = None

100

(apparent_proto, self._host,

(self._proto, self._host,

101

self._path, self._parameters,

102

self._query, self._fragment) = urlparse.urlparse(self.base)

103

self._qualified_proto = apparent_proto

def should_cache(self):

"""Return True if the data pulled across should be cached locally.

"""

return True

def clone(self, offset=None):

"""Return a new HttpTransport with root at self.base + offset

For now HttpTransport does not actually connect, so just return

a new HttpTransport object.

"""

if offset is None:

return HttpTransport(self.base)

else:

return HttpTransport(self.abspath(offset))

104

105

def abspath(self, relpath):

106

"""Return the full url to the given relative path.

107

108

This can be supplied with a string or a list.

109

110

The URL returned always has the protocol scheme originally used to

111

construct the transport, even if that includes an explicit

112

implementation qualifier.

This can be supplied with a string or a list

113

"""

114

assert isinstance(relpath, basestring)

115

if isinstance(relpath, unicode):

116

raise InvalidURL(relpath, 'paths must not be unicode.')

117

if isinstance(relpath, basestring):

118

relpath_parts = relpath.split('/')

119

else:

120

# TODO: Don't call this with an array - no magic interfaces

121

relpath_parts = relpath[:]

122

if len(relpath_parts) > 1:

123

if relpath_parts[0] == '':

124

raise ValueError("path %r within branch %r seems to be absolute"

125

% (relpath, self._path))

126

if relpath_parts[-1] == '':

127

raise ValueError("path %r within branch %r seems to be a directory"

128

% (relpath, self._path))

relpath = [relpath]

129

basepath = self._path.split('/')

130

if len(basepath) > 0 and basepath[-1] == '':

131

basepath = basepath[:-1]

132

for p in relpath_parts:

for p in relpath:

133

if p == '..':

134

if len(basepath) == 0:

if len(basepath) < 0:

135

# In most filesystems, a request for the parent

136

# of root, just returns root.

137

continue

138

basepath.pop()

139

elif p == '.' or p == '':

if len(basepath) > 0:

basepath.pop()

elif p == '.':

140

continue # No-op

141

else:

142

basepath.append(p)

143

# Possibly, we could use urlparse.urljoin() here, but

144

100

# I'm concerned about when it chooses to strip the last

145

101

# portion of the path, and when it doesn't.

146

102

path = '/'.join(basepath)

147

if path == '':

148

path = '/'

149

result = urlparse.urlunparse((self._qualified_proto,

150

self._host, path, '', '', ''))

151

return result

103

return urlparse.urlunparse((self._proto,

104

self._host, path, '', '', ''))

152

105

153

def _real_abspath(self, relpath):

154

"""Produce absolute path, adjusting protocol if needed"""

155

abspath = self.abspath(relpath)

156

qp = self._qualified_proto

157

rp = self._proto

158

if self._qualified_proto != self._proto:

159

abspath = rp + abspath[len(qp):]

160

if not isinstance(abspath, str):

161

# escaping must be done at a higher level

162

abspath = abspath.encode('ascii')

163

return abspath

106

def relpath(self, abspath):

107

if not abspath.startswith(self.base):

108

raise NonRelativePath('path %r is not under base URL %r'

109

% (abspath, self.base))

110

pl = len(self.base)

111

return abspath[pl:].lstrip('/')

164

112

165

113

def has(self, relpath):

166

raise NotImplementedError("has() is abstract on %r" % self)

167

168

def get(self, relpath):

114

"""Does the target location exist?

115

116

TODO: HttpTransport.has() should use a HEAD request,

117

not a full GET request.

118

119

TODO: This should be changed so that we don't use

120

urllib2 and get an exception, the code path would be

121

cleaner if we just do an http HEAD request, and parse

122

the return code.

123

"""

124

try:

125

f = get_url(self.abspath(relpath))

126

# Without the read and then close()

127

# we tend to have busy sockets.

128

f.read()

129

f.close()

130

return True

131

except BzrError:

132

return False

133

except urllib2.URLError:

134

return False

135

except IOError, e:

136

if e.errno == errno.ENOENT:

137

return False

138

raise HttpTransportError(orig_error=e)

139

140

def get(self, relpath, decode=False):

169

141

"""Get the file at the given relative path.

170

142

171

143

:param relpath: The relative path to the file

172

144

"""

173

code, response_file = self._get(relpath, None)

174

return response_file

175

176

def _get(self, relpath, ranges):

177

"""Get a file, or part of a file.

178

179

:param relpath: Path relative to transport base URL

180

:param byte_range: None to get the whole file;

181

or [(start,end)] to fetch parts of a file.

182

183

:returns: (http_code, result_file)

184

185

Note that the current http implementations can only fetch one range at

186

a time through this call.

187

"""

188

raise NotImplementedError(self._get)

189

190

def readv(self, relpath, offsets):

191

"""Get parts of the file at the given relative path.

192

193

:param offsets: A list of (offset, size) tuples.

194

:param return: A list or generator of (offset, data) tuples

195

"""

196

# Ideally we would pass one big request asking for all the ranges in

197

# one go; however then the server will give a multipart mime response

198

# back, and we can't parse them yet. So instead we just get one range

199

# per region, and try to coallesce the regions as much as possible.

200

201

# The read-coallescing code is not quite regular enough to have a

202

# single driver routine and

203

# helper method in Transport.

204

def do_combined_read(combined_offsets):

205

# read one coalesced block

206

total_size = 0

207

for offset, size in combined_offsets:

208

total_size += size

209

mutter('readv coalesced %d reads.', len(combined_offsets))

210

offset = combined_offsets[0][0]

211

byte_range = (offset, offset + total_size - 1)

212

code, result_file = self._get(relpath, [byte_range])

213

if code == 206:

214

for off, size in combined_offsets:

215

result_bytes = result_file.read(size)

216

assert len(result_bytes) == size

217

yield off, result_bytes

218

elif code == 200:

219

data = result_file.read(offset + total_size)[offset:offset + total_size]

220

pos = 0

221

for offset, size in combined_offsets:

222

yield offset, data[pos:pos + size]

223

pos += size

224

del data

225

if not len(offsets):

226

return

227

pending_offsets = deque(offsets)

228

combined_offsets = []

229

while len(pending_offsets):

230

offset, size = pending_offsets.popleft()

231

if not combined_offsets:

232

combined_offsets = [[offset, size]]

233

else:

234

if (len (combined_offsets) < 500 and

235

combined_offsets[-1][0] + combined_offsets[-1][1] == offset):

236

# combatible offset:

237

combined_offsets.append([offset, size])

238

else:

239

# incompatible, or over the threshold issue a read and yield

240

pending_offsets.appendleft((offset, size))

241

for result in do_combined_read(combined_offsets):

242

yield result

243

combined_offsets = []

244

# whatever is left is a single coalesced request

245

if len(combined_offsets):

246

for result in do_combined_read(combined_offsets):

247

yield result

248

249

def put(self, relpath, f, mode=None):

145

try:

146

return get_url(self.abspath(relpath))

147

except (BzrError, urllib2.URLError, IOError), e:

148

raise NoSuchFile(orig_error=e)

149

except Exception,e:

150

raise HttpTransportError(orig_error=e)

151

152

def get_partial(self, relpath, start, length=None):

153

"""Get just part of a file.

154

155

:param relpath: Path to the file, relative to base

156

:param start: The starting position to read from

157

:param length: The length to read. A length of None indicates

158

read to the end of the file.

159

:return: A file-like object containing at least the specified bytes.

160

Some implementations may return objects which can be read

161

past this length, but this is not guaranteed.

162

"""

163

# TODO: You can make specialized http requests for just

164

# a portion of the file. Figure out how to do that.

165

# For now, urllib2 returns files that cannot seek() so

166

# we just read bytes off the beginning, until we

167

# get to the point that we care about.

168

f = self.get(relpath)

169

# TODO: read in smaller chunks, in case things are

170

# buffered internally.

171

f.read(start)

172

return f

173

174

def put(self, relpath, f):

250

175

"""Copy the file-like or string object into the location.

251

176

252

177

:param relpath: Location to put the contents, relative to base.

254

179

"""

255

180

raise TransportNotPossible('http PUT not supported')

256

181

257

def mkdir(self, relpath, mode=None):

182

def mkdir(self, relpath):

258

183

"""Create a directory at the given path."""

259

184

raise TransportNotPossible('http does not support mkdir()')

260

185

261

def rmdir(self, relpath):

262

"""See Transport.rmdir."""

263

raise TransportNotPossible('http does not support rmdir()')

264

265

186

def append(self, relpath, f):

266

187

"""Append the text in the file-like object into the final

267

188

location.

272

193

"""Copy the item at rel_from to the location at rel_to"""

273

194

raise TransportNotPossible('http does not support copy()')

274

195

275

def copy_to(self, relpaths, other, mode=None, pb=None):

196

def copy_to(self, relpaths, other, pb=None):

276

197

"""Copy a set of entries from self into another Transport.

277

198

278

199

:param relpaths: A list/generator of entries to be copied.

283

204

# At this point HttpTransport might be able to check and see if

284

205

# the remote location is the same, and rather than download, and

285

206

# then upload, it could just issue a remote copy_this command.

286

if isinstance(other, HttpTransportBase):

207

if isinstance(other, HttpTransport):

287

208

raise TransportNotPossible('http cannot be the target of copy_to()')

288

209

else:

289

return super(HttpTransportBase, self).\

290

copy_to(relpaths, other, mode=mode, pb=pb)

210

return super(HttpTransport, self).copy_to(relpaths, other, pb=pb)

291

211

292

212

def move(self, rel_from, rel_to):

293

213

"""Move the item at rel_from to the location at rel_to"""

297

217

"""Delete the item at relpath"""

298

218

raise TransportNotPossible('http does not support delete()')

299

219

300

def is_readonly(self):

301

"""See Transport.is_readonly."""

302

return True

303

304

220

def listable(self):

305

221

"""See Transport.listable."""

306

222

return False

331

247

"""

332

248

raise TransportNotPossible('http does not support lock_write()')

333

249

334

def clone(self, offset=None):

335

"""Return a new HttpTransportBase with root at self.base + offset

336

For now HttpTransportBase does not actually connect, so just return

337

a new HttpTransportBase object.

338

"""

339

if offset is None:

340

return self.__class__(self.base)

341

else:

342

return self.__class__(self.abspath(offset))

343

344

#---------------- test server facilities ----------------

345

# TODO: load these only when running tests

346

347

348

class WebserverNotAvailable(Exception):

349

pass

350

351

352

class BadWebserverPath(ValueError):

353

def __str__(self):

354

return 'path %s is not in %s' % self.args

355

356

357

class TestingHTTPRequestHandler(SimpleHTTPServer.SimpleHTTPRequestHandler):

358

359

def log_message(self, format, *args):

360

self.server.test_case.log('webserver - %s - - [%s] %s "%s" "%s"',

361

self.address_string(),

362

self.log_date_time_string(),

363

format % args,

364

self.headers.get('referer', '-'),

365

self.headers.get('user-agent', '-'))

366

367

def handle_one_request(self):

368

"""Handle a single HTTP request.

369

370

You normally don't need to override this method; see the class

371

__doc__ string for information on how to handle specific HTTP

372

commands such as GET and POST.

373

374

"""

375

for i in xrange(1,11): # Don't try more than 10 times

376

try:

377

self.raw_requestline = self.rfile.readline()

378

except socket.error, e:

379

if e.args[0] in (errno.EAGAIN, errno.EWOULDBLOCK):

380

# omitted for now because some tests look at the log of

381

# the server and expect to see no errors. see recent

382

# email thread. -- mbp 20051021.

383

## self.log_message('EAGAIN (%d) while reading from raw_requestline' % i)

384

time.sleep(0.01)

385

continue

386

raise

387

else:

388

break

389

if not self.raw_requestline:

390

self.close_connection = 1

391

return

392

if not self.parse_request(): # An error code has been sent, just exit

393

return

394

mname = 'do_' + self.command

395

if not hasattr(self, mname):

396

self.send_error(501, "Unsupported method (%r)" % self.command)

397

return

398

method = getattr(self, mname)

399

method()

400

401

402

class TestingHTTPServer(BaseHTTPServer.HTTPServer):

403

def __init__(self, server_address, RequestHandlerClass, test_case):

404

BaseHTTPServer.HTTPServer.__init__(self, server_address,

405

RequestHandlerClass)

406

self.test_case = test_case

407

408

class HttpServer(Server):

409

"""A test server for http transports."""

410

411

# used to form the url that connects to this server

412

_url_protocol = 'http'

413

414

def _http_start(self):

415

httpd = None

416

httpd = TestingHTTPServer(('localhost', 0),

417

TestingHTTPRequestHandler,

418

self)

419

host, port = httpd.socket.getsockname()

420

self._http_base_url = '%s://localhost:%s/' % (self._url_protocol, port)

421

self._http_starting.release()

422

httpd.socket.settimeout(0.1)

423

424

while self._http_running:

425

try:

426

httpd.handle_request()

427

except socket.timeout:

428

pass

429

430

def _get_remote_url(self, path):

431

path_parts = path.split(os.path.sep)

432

if os.path.isabs(path):

433

if path_parts[:len(self._local_path_parts)] != \

434

self._local_path_parts:

435

raise BadWebserverPath(path, self.test_dir)

436

remote_path = '/'.join(path_parts[len(self._local_path_parts):])

437

else:

438

remote_path = '/'.join(path_parts)

439

440

self._http_starting.acquire()

441

self._http_starting.release()

442

return self._http_base_url + remote_path

443

444

def log(self, format, *args):

445

"""Capture Server log output."""

446

self.logs.append(format % args)

447

448

def setUp(self):

449

"""See bzrlib.transport.Server.setUp."""

450

self._home_dir = os.getcwdu()

451

self._local_path_parts = self._home_dir.split(os.path.sep)

452

self._http_starting = threading.Lock()

453

self._http_starting.acquire()

454

self._http_running = True

455

self._http_base_url = None

456

self._http_thread = threading.Thread(target=self._http_start)

457

self._http_thread.setDaemon(True)

458

self._http_thread.start()

459

self._http_proxy = os.environ.get("http_proxy")

460

if self._http_proxy is not None:

461

del os.environ["http_proxy"]

462

self.logs = []

463

464

def tearDown(self):

465

"""See bzrlib.transport.Server.tearDown."""

466

self._http_running = False

467

self._http_thread.join()

468

if self._http_proxy is not None:

469

import os

470

os.environ["http_proxy"] = self._http_proxy

471

472

def get_url(self):

473

"""See bzrlib.transport.Server.get_url."""

474

return self._get_remote_url(self._home_dir)

475

476

def get_bogus_url(self):

477

"""See bzrlib.transport.Server.get_bogus_url."""

478

# this is chosen to try to prevent trouble with proxies, wierd dns,

479

# etc

480

return 'http://127.0.0.1:1/'

481

250

register_transport('http://', HttpTransport)

251

register_transport('https://', HttpTransport)

Older »