~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Robert Collins
Date: 2005-10-06 00:52:53 UTC
Revision ID: robertc@robertcollins.net-20051006005253-415c38ad22094f13

define some expected behaviour for inventory_entry.snapshot

files added:
bzrlib/clone.py

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/revfile.py

bzrlib/store/compressed_text.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

files removed:
BRANCH.TODO

INSTALL

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/gpg.py

bzrlib/identitymap.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/option.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/rio.py

bzrlib/sign_my_commits.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_api.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_emptytree.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/versionedfile.py

bzrlib/weave_commands.py

bzrlib/win32console.py

doc/README.1st

doc/configuration.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/using_aliases.txt

generate_docs.py

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/riodemo.py

tools/trace-revisions

files renamed:
tools/doc_generate/autodoc_man.py => bzr-man.py

bzrlib/bundle/__init__.py => bzrlib/changeset.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/branch_implementations/test_parent.py => bzrlib/selftest/test_parent.py

bzrlib/tests/blackbox/test_revision_info.py => bzrlib/selftest/test_revision_info.py

bzrlib/tests/branch_implementations/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_fetch.py => bzrlib/selftest/testfetch.py

bzrlib/tests/test_graph.py => bzrlib/selftest/testgraph.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge.py => bzrlib/selftest/testmerge.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/blackbox/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/test_store.py => bzrlib/selftest/teststore.py

bzrlib/tests/test_transport.py => bzrlib/selftest/testtransport.py

bzrlib/tests/test_workingtree.py => bzrlib/selftest/testworkingtree.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/versioned/__init__.py => bzrlib/store/weave.py

bzrlib/transport/http/__init__.py => bzrlib/transport/http.py

bzrlib/ui/__init__.py => bzrlib/ui.py

bzrlib/xml_serializer.py => bzrlib/xml.py

doc/tutorial.txt => tutorial.txt

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_upgrade.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/treeshape.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/pwk

contrib/zsh/_bzr

setup.py *

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Base implementation of Transport over http.

There are separate implementation modules for each http client implementation.

"""Implementation of Transport over http.

"""

from collections import deque

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

NonRelativePath, TransportError)

import os, errno

from cStringIO import StringIO

import errno

import os

import posixpath

import re

import sys

import urllib2

import urlparse

import urllib

from warnings import warn

from bzrlib.transport import Transport, register_transport, Server

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError, InvalidURL)

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

# TODO: load these only when running http tests

import BaseHTTPServer, SimpleHTTPServer, socket, time

import threading

from bzrlib.ui import ui_factory

def extract_auth(url, password_manager):

"""Extract auth parameters from am HTTP/HTTPS url and add them to the given

password manager. Return the url, minus those auth parameters (which

confuse urllib2).

"""

assert re.match(r'^(https?)(\+\w+)?://', url), \

'invalid absolute url %r' % url

scheme, netloc, path, query, fragment = urlparse.urlsplit(url)

# velocitynet.com.au transparently proxies connections and thereby

# breaks keep-alive -- sucks!

def get_url(url):

import urllib2

mutter("get_url %s" % url)

url_f = urllib2.urlopen(url)

return url_f

class HttpTransportError(TransportError):

pass

class HttpTransport(Transport):

"""This is the transport agent for http:// access.

if '@' in netloc:

auth, netloc = netloc.split('@', 1)

if ':' in auth:

username, password = auth.split(':', 1)

else:

username, password = auth, None

if ':' in netloc:

host = netloc.split(':', 1)[0]

else:

host = netloc

username = urllib.unquote(username)

if password is not None:

password = urllib.unquote(password)

else:

password = ui_factory.get_password(prompt='HTTP %(user)@%(host) password',

user=username, host=host)

password_manager.add_password(None, host, username, password)

url = urlparse.urlunsplit((scheme, netloc, path, query, fragment))

return url

class HttpTransportBase(Transport):

"""Base class for http implementations.

Does URL parsing, etc, but not any network IO.

The protocol can be given as e.g. http+urllib://host/ to use a particular

implementation.

TODO: Implement pipelined versions of all of the *_multi() functions.

"""

# _proto: "http" or "https"

# _qualified_proto: may have "+pycurl", etc

def __init__(self, base):

"""Set the base path where files will be stored."""

proto_match = re.match(r'^(https?)(\+\w+)?://', base)

if not proto_match:

raise AssertionError("not a http url: %r" % base)

self._proto = proto_match.group(1)

impl_name = proto_match.group(2)

if impl_name:

impl_name = impl_name[1:]

self._impl_name = impl_name

if base[-1] != '/':

base = base + '/'

super(HttpTransportBase, self).__init__(base)

assert base.startswith('http://') or base.startswith('https://')

super(HttpTransport, self).__init__(base)

# In the future we might actually connect to the remote host

100

# rather than using get_url

101

# self._connection = None

102

(apparent_proto, self._host,

(self._proto, self._host,

103

self._path, self._parameters,

104

self._query, self._fragment) = urlparse.urlparse(self.base)

105

self._qualified_proto = apparent_proto

def should_cache(self):

"""Return True if the data pulled across should be cached locally.

"""

return True

def clone(self, offset=None):

"""Return a new HttpTransport with root at self.base + offset

For now HttpTransport does not actually connect, so just return

a new HttpTransport object.

"""

if offset is None:

return HttpTransport(self.base)

else:

return HttpTransport(self.abspath(offset))

106

107

def abspath(self, relpath):

108

"""Return the full url to the given relative path.

109

110

This can be supplied with a string or a list.

111

112

The URL returned always has the protocol scheme originally used to

113

construct the transport, even if that includes an explicit

114

implementation qualifier.

This can be supplied with a string or a list

115

"""

116

assert isinstance(relpath, basestring)

117

if isinstance(relpath, unicode):

118

raise InvalidURL(relpath, 'paths must not be unicode.')

119

if isinstance(relpath, basestring):

120

relpath_parts = relpath.split('/')

121

else:

122

# TODO: Don't call this with an array - no magic interfaces

123

relpath_parts = relpath[:]

124

if len(relpath_parts) > 1:

125

if relpath_parts[0] == '':

126

raise ValueError("path %r within branch %r seems to be absolute"

127

% (relpath, self._path))

128

if relpath_parts[-1] == '':

129

raise ValueError("path %r within branch %r seems to be a directory"

130

% (relpath, self._path))

relpath = [relpath]

131

basepath = self._path.split('/')

132

if len(basepath) > 0 and basepath[-1] == '':

133

basepath = basepath[:-1]

134

for p in relpath_parts:

for p in relpath:

135

if p == '..':

136

if len(basepath) == 0:

if len(basepath) < 0:

137

# In most filesystems, a request for the parent

138

# of root, just returns root.

139

continue

140

basepath.pop()

141

elif p == '.' or p == '':

elif p == '.':

142

continue # No-op

143

else:

144

basepath.append(p)

145

# Possibly, we could use urlparse.urljoin() here, but

146

# I'm concerned about when it chooses to strip the last

147

100

# portion of the path, and when it doesn't.

148

101

path = '/'.join(basepath)

149

if path == '':

150

path = '/'

151

result = urlparse.urlunparse((self._qualified_proto,

152

self._host, path, '', '', ''))

153

return result

102

return urlparse.urlunparse((self._proto,

103

self._host, path, '', '', ''))

154

104

155

def _real_abspath(self, relpath):

156

"""Produce absolute path, adjusting protocol if needed"""

157

abspath = self.abspath(relpath)

158

qp = self._qualified_proto

159

rp = self._proto

160

if self._qualified_proto != self._proto:

161

abspath = rp + abspath[len(qp):]

162

if not isinstance(abspath, str):

163

# escaping must be done at a higher level

164

abspath = abspath.encode('ascii')

165

return abspath

105

def relpath(self, abspath):

106

if not abspath.startswith(self.base):

107

raise NonRelativePath('path %r is not under base URL %r'

108

% (abspath, self.base))

109

pl = len(self.base)

110

return abspath[pl:].lstrip('/')

166

111

167

112

def has(self, relpath):

168

raise NotImplementedError("has() is abstract on %r" % self)

169

170

def get(self, relpath):

113

"""Does the target location exist?

114

115

TODO: HttpTransport.has() should use a HEAD request,

116

not a full GET request.

117

118

TODO: This should be changed so that we don't use

119

urllib2 and get an exception, the code path would be

120

cleaner if we just do an http HEAD request, and parse

121

the return code.

122

"""

123

try:

124

f = get_url(self.abspath(relpath))

125

# Without the read and then close()

126

# we tend to have busy sockets.

127

f.read()

128

f.close()

129

return True

130

except BzrError:

131

return False

132

except urllib2.URLError:

133

return False

134

except IOError, e:

135

if e.errno == errno.ENOENT:

136

return False

137

raise HttpTransportError(orig_error=e)

138

139

def get(self, relpath, decode=False):

171

140

"""Get the file at the given relative path.

172

141

173

142

:param relpath: The relative path to the file

174

143

"""

175

code, response_file = self._get(relpath, None)

176

return response_file

177

178

def _get(self, relpath, ranges):

179

"""Get a file, or part of a file.

180

181

:param relpath: Path relative to transport base URL

182

:param ranges: None to get the whole file;

183

or [(start,end)] to fetch parts of a file.

184

185

:returns: (http_code, result_file)

186

187

Note that the current http implementations can only fetch one range at

188

a time through this call.

189

"""

190

raise NotImplementedError(self._get)

191

192

def readv(self, relpath, offsets):

193

"""Get parts of the file at the given relative path.

194

195

:param offsets: A list of (offset, size) tuples.

196

:return: A list or generator of (offset, data) tuples

197

"""

198

# Ideally we would pass one big request asking for all the ranges in

199

# one go; however then the server will give a multipart mime response

200

# back, and we can't parse them yet. So instead we just get one range

201

# per region, and try to coalesce the regions as much as possible.

202

203

# The read-coalescing code is not quite regular enough to have a

204

# single driver routine and

205

# helper method in Transport.

206

def do_combined_read(combined_offsets):

207

# read one coalesced block

208

total_size = 0

209

for offset, size in combined_offsets:

210

total_size += size

211

mutter('readv coalesced %d reads.', len(combined_offsets))

212

offset = combined_offsets[0][0]

213

byte_range = (offset, offset + total_size - 1)

214

code, result_file = self._get(relpath, [byte_range])

215

if code == 206:

216

for off, size in combined_offsets:

217

result_bytes = result_file.read(size)

218

assert len(result_bytes) == size

219

yield off, result_bytes

220

elif code == 200:

221

data = result_file.read(offset + total_size)[offset:offset + total_size]

222

pos = 0

223

for offset, size in combined_offsets:

224

yield offset, data[pos:pos + size]

225

pos += size

226

del data

227

if not len(offsets):

228

return

229

pending_offsets = deque(offsets)

230

combined_offsets = []

231

while len(pending_offsets):

232

offset, size = pending_offsets.popleft()

233

if not combined_offsets:

234

combined_offsets = [[offset, size]]

235

else:

236

if (len (combined_offsets) < 500 and

237

combined_offsets[-1][0] + combined_offsets[-1][1] == offset):

238

# compatible offset:

239

combined_offsets.append([offset, size])

240

else:

241

# incompatible, or over the threshold: issue a read and yield

242

pending_offsets.appendleft((offset, size))

243

for result in do_combined_read(combined_offsets):

244

yield result

245

combined_offsets = []

246

# whatever is left is a single coalesced request

247

if len(combined_offsets):

248

for result in do_combined_read(combined_offsets):

249

yield result

250

251

def put(self, relpath, f, mode=None):

144

try:

145

return get_url(self.abspath(relpath))

146

except (BzrError, urllib2.URLError, IOError), e:

147

raise NoSuchFile(orig_error=e)

148

except Exception,e:

149

raise HttpTransportError(orig_error=e)

150

151

def get_partial(self, relpath, start, length=None):

152

"""Get just part of a file.

153

154

:param relpath: Path to the file, relative to base

155

:param start: The starting position to read from

156

:param length: The length to read. A length of None indicates

157

read to the end of the file.

158

:return: A file-like object containing at least the specified bytes.

159

Some implementations may return objects which can be read

160

past this length, but this is not guaranteed.

161

"""

162

# TODO: You can make specialized http requests for just

163

# a portion of the file. Figure out how to do that.

164

# For now, urllib2 returns files that cannot seek() so

165

# we just read bytes off the beginning, until we

166

# get to the point that we care about.

167

f = self.get(relpath)

168

# TODO: read in smaller chunks, in case things are

169

# buffered internally.

170

f.read(start)

171

return f

172

173

def put(self, relpath, f):

252

174

"""Copy the file-like or string object into the location.

253

175

254

176

:param relpath: Location to put the contents, relative to base.

256

178

"""

257

179

raise TransportNotPossible('http PUT not supported')

258

180

259

def mkdir(self, relpath, mode=None):

181

def mkdir(self, relpath):

260

182

"""Create a directory at the given path."""

261

183

raise TransportNotPossible('http does not support mkdir()')

262

184

263

def rmdir(self, relpath):

264

"""See Transport.rmdir."""

265

raise TransportNotPossible('http does not support rmdir()')

266

267

185

def append(self, relpath, f):

268

186

"""Append the text in the file-like object into the final

269

187

location.

274

192

"""Copy the item at rel_from to the location at rel_to"""

275

193

raise TransportNotPossible('http does not support copy()')

276

194

277

def copy_to(self, relpaths, other, mode=None, pb=None):

195

def copy_to(self, relpaths, other, pb=None):

278

196

"""Copy a set of entries from self into another Transport.

279

197

280

198

:param relpaths: A list/generator of entries to be copied.

285

203

# At this point HttpTransport might be able to check and see if

286

204

# the remote location is the same, and rather than download, and

287

205

# then upload, it could just issue a remote copy_this command.

288

if isinstance(other, HttpTransportBase):

206

if isinstance(other, HttpTransport):

289

207

raise TransportNotPossible('http cannot be the target of copy_to()')

290

208

else:

291

return super(HttpTransportBase, self).\

292

copy_to(relpaths, other, mode=mode, pb=pb)

209

return super(HttpTransport, self).copy_to(relpaths, other, pb=pb)

293

210

294

211

def move(self, rel_from, rel_to):

295

212

"""Move the item at rel_from to the location at rel_to"""

299

216

"""Delete the item at relpath"""

300

217

raise TransportNotPossible('http does not support delete()')

301

218

302

def is_readonly(self):

303

"""See Transport.is_readonly."""

304

return True

305

306

219

def listable(self):

307

220

"""See Transport.listable."""

308

221

return False

333

246

"""

334

247

raise TransportNotPossible('http does not support lock_write()')

335

248

336

def clone(self, offset=None):

337

"""Return a new HttpTransportBase with root at self.base + offset

338

For now HttpTransportBase does not actually connect, so just return

339

a new HttpTransportBase object.

340

"""

341

if offset is None:

342

return self.__class__(self.base)

343

else:

344

return self.__class__(self.abspath(offset))

345

346

#---------------- test server facilities ----------------

347

# TODO: load these only when running tests

348

349

350

class WebserverNotAvailable(Exception):

351

pass

352

353

354

class BadWebserverPath(ValueError):

355

def __str__(self):

356

return 'path %s is not in %s' % self.args

357

358

359

class TestingHTTPRequestHandler(SimpleHTTPServer.SimpleHTTPRequestHandler):

360

361

def log_message(self, format, *args):

362

self.server.test_case.log('webserver - %s - - [%s] %s "%s" "%s"',

363

self.address_string(),

364

self.log_date_time_string(),

365

format % args,

366

self.headers.get('referer', '-'),

367

self.headers.get('user-agent', '-'))

368

369

def handle_one_request(self):

370

"""Handle a single HTTP request.

371

372

You normally don't need to override this method; see the class

373

__doc__ string for information on how to handle specific HTTP

374

commands such as GET and POST.

375

376

"""

377

for i in xrange(1,11): # Don't try more than 10 times

378

try:

379

self.raw_requestline = self.rfile.readline()

380

except socket.error, e:

381

if e.args[0] in (errno.EAGAIN, errno.EWOULDBLOCK):

382

# omitted for now because some tests look at the log of

383

# the server and expect to see no errors. see recent

384

# email thread. -- mbp 20051021.

385

## self.log_message('EAGAIN (%d) while reading from raw_requestline' % i)

386

time.sleep(0.01)

387

continue

388

raise

389

else:

390

break

391

if not self.raw_requestline:

392

self.close_connection = 1

393

return

394

if not self.parse_request(): # An error code has been sent, just exit

395

return

396

mname = 'do_' + self.command

397

if not hasattr(self, mname):

398

self.send_error(501, "Unsupported method (%r)" % self.command)

399

return

400

method = getattr(self, mname)

401

method()

402

403

if sys.platform == 'win32':

404

# On win32 you cannot access non-ascii filenames without

405

# decoding them into unicode first.

406

# However, under Linux, you can access bytestream paths

407

# without any problems. If this function was always active

408

# it would probably break tests when LANG=C was set

409

def translate_path(self, path):

410

"""Translate a /-separated PATH to the local filename syntax.

411

412

For bzr, all url paths are considered to be utf8 paths.

413

On Linux, you can access these paths directly over the bytestream

414

request, but on win32, you must decode them, and access them

415

as Unicode files.

416

"""

417

# abandon query parameters

418

path = urlparse.urlparse(path)[2]

419

path = posixpath.normpath(urllib.unquote(path))

420

path = path.decode('utf-8')

421

words = path.split('/')

422

words = filter(None, words)

423

path = os.getcwdu()

424

for word in words:

425

drive, word = os.path.splitdrive(word)

426

head, word = os.path.split(word)

427

if word in (os.curdir, os.pardir): continue

428

path = os.path.join(path, word)

429

return path

430

431

432

class TestingHTTPServer(BaseHTTPServer.HTTPServer):

433

def __init__(self, server_address, RequestHandlerClass, test_case):

434

BaseHTTPServer.HTTPServer.__init__(self, server_address,

435

RequestHandlerClass)

436

self.test_case = test_case

437

438

class HttpServer(Server):

439

"""A test server for http transports."""

440

441

# used to form the url that connects to this server

442

_url_protocol = 'http'

443

444

def _http_start(self):

445

httpd = None

446

httpd = TestingHTTPServer(('localhost', 0),

447

TestingHTTPRequestHandler,

448

self)

449

host, port = httpd.socket.getsockname()

450

self._http_base_url = '%s://localhost:%s/' % (self._url_protocol, port)

451

self._http_starting.release()

452

httpd.socket.settimeout(0.1)

453

454

while self._http_running:

455

try:

456

httpd.handle_request()

457

except socket.timeout:

458

pass

459

460

def _get_remote_url(self, path):

461

path_parts = path.split(os.path.sep)

462

if os.path.isabs(path):

463

if path_parts[:len(self._local_path_parts)] != \

464

self._local_path_parts:

465

raise BadWebserverPath(path, self.test_dir)

466

remote_path = '/'.join(path_parts[len(self._local_path_parts):])

467

else:

468

remote_path = '/'.join(path_parts)

469

470

self._http_starting.acquire()

471

self._http_starting.release()

472

return self._http_base_url + remote_path

473

474

def log(self, format, *args):

475

"""Capture Server log output."""

476

self.logs.append(format % args)

477

478

def setUp(self):

479

"""See bzrlib.transport.Server.setUp."""

480

self._home_dir = os.getcwdu()

481

self._local_path_parts = self._home_dir.split(os.path.sep)

482

self._http_starting = threading.Lock()

483

self._http_starting.acquire()

484

self._http_running = True

485

self._http_base_url = None

486

self._http_thread = threading.Thread(target=self._http_start)

487

self._http_thread.setDaemon(True)

488

self._http_thread.start()

489

self._http_proxy = os.environ.get("http_proxy")

490

if self._http_proxy is not None:

491

del os.environ["http_proxy"]

492

self.logs = []

493

494

def tearDown(self):

495

"""See bzrlib.transport.Server.tearDown."""

496

self._http_running = False

497

self._http_thread.join()

498

if self._http_proxy is not None:

499

import os

500

os.environ["http_proxy"] = self._http_proxy

501

502

def get_url(self):

503

"""See bzrlib.transport.Server.get_url."""

504

return self._get_remote_url(self._home_dir)

505

506

def get_bogus_url(self):

507

"""See bzrlib.transport.Server.get_bogus_url."""

508

# this is chosen to try to prevent trouble with proxies, weird dns,

509

# etc

510

return 'http://127.0.0.1:1/'

511

249

register_transport('http://', HttpTransport)

250

register_transport('https://', HttpTransport)

Older »