~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Robert Collins
Date: 2006-02-11 11:58:06 UTC
mto: (1534.1.22 integration)
mto: This revision was merged to the branch mainline in revision 1554.
Revision ID: robertc@robertcollins.net-20060211115806-732dabc1e35714ed

Give format3 working trees their own last-revision marker.

files added:
bzrlib/_merge_core.py

bzrlib/tests/test_reweave.py

bzrlib/util/configobj/validate.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

files removed:
COPYING.txt

bzr.ico

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/cache_utf8.py

bzrlib/ignores.py

bzrlib/inter.py

bzrlib/knit.py

bzrlib/lockdir.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/revisiontree.py

bzrlib/sign_my_commits.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_status.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/transform.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/tuned_gzip.py

bzrlib/urlutils.py

bzrlib/version.py

bzrlib/versionedfile.py

bzrlib/weave_commands.py

doc/README.1st

doc/configuration.txt

doc/default.css

doc/index.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/using_aliases.txt

profile_imports.py

tools/doc_generate/autodoc_rstx.py

tools/rst2html.py

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/ostools.py

tools/win32/start_bzr.bat

files renamed:
bzrlib/bundle/__init__.py => bzrlib/_changeset.py

bzrlib/store/versioned/__init__.py => bzrlib/store/weave.py

bzrlib/tests/blackbox/test_annotate.py => bzrlib/tests/test_annotate.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py => bzrlib/tests/test_basis_inventory.py

bzrlib/tests/repository_implementations/test_revision.py => bzrlib/tests/test_revprops.py

bzrlib/tests/blackbox/test_uncommit.py => bzrlib/tests/test_uncommit.py

bzrlib/transport/http/__init__.py => bzrlib/transport/http.py

doc/tutorial.txt => tutorial.txt

files modified:
.bzrignore

BRANCH.TODO

HACKING

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/errors.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml_serializer.py

contrib/newinventory.py

contrib/pwk

generate_docs.py

setup.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/history2revfiles.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Base implementation of Transport over http.

There are separate implementation modules for each http client implementation.

"""Implementation of Transport over http.

"""

import os, errno

from cStringIO import StringIO

import errno

import mimetools

import os

import posixpath

import re

import sys

import urllib, urllib2

import urlparse

import urllib

from warnings import warn

# TODO: load these only when running http tests

import BaseHTTPServer, SimpleHTTPServer, socket, time

import threading

from bzrlib import errors

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError, InvalidURL)

from bzrlib.transport import Transport, Server

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError)

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

from bzrlib.transport import Transport, register_transport, Server

from bzrlib.transport.http.response import (HttpMultipartRangeResponse,

HttpRangeResponse)

from bzrlib.ui import ui_factory

def extract_auth(url, password_manager):

"""Extract auth parameters from am HTTP/HTTPS url and add them to the given

"""

Extract auth parameters from an HTTP/HTTPS url and add them to the given

password manager. Return the url, minus those auth parameters (which

confuse urllib2).

"""

assert re.match(r'^(https?)(\+\w+)?://', url), \

'invalid absolute url %r' % url

scheme, netloc, path, query, fragment = urlparse.urlsplit(url)

if '@' in netloc:

auth, netloc = netloc.split('@', 1)

assert url.startswith('http://') or url.startswith('https://')

scheme, host = url.split('//', 1)

if '/' in host:

host, path = host.split('/', 1)

path = '/' + path

else:

path = ''

port = ''

if '@' in host:

auth, host = host.split('@', 1)

if ':' in auth:

username, password = auth.split(':', 1)

else:

username, password = auth, None

if ':' in netloc:

host = netloc.split(':', 1)[0]

else:

host = netloc

username = urllib.unquote(username)

if ':' in host:

host, port = host.split(':', 1)

port = ':' + port

# FIXME: if password isn't given, should we ask for it?

if password is not None:

username = urllib.unquote(username)

password = urllib.unquote(password)

else:

password = ui_factory.get_password(prompt='HTTP %(user)@%(host) password',

user=username, host=host)

password_manager.add_password(None, host, username, password)

url = urlparse.urlunsplit((scheme, netloc, path, query, fragment))

password_manager.add_password(None, host, username, password)

url = scheme + '//' + host + port + path

return url

def _extract_headers(header_text, url):

"""Extract the mapping for an rfc2822 header

This is a helper function for the test suite and for _pycurl.

(urllib already parses the headers for us)

In the case that there are multiple headers inside the file,

the last one is returned.

:param header_text: A string of header information.

This expects that the first line of a header will always be HTTP ...

:param url: The url we are parsing, so we can raise nice errors

:return: mimetools.Message object, which basically acts like a case

insensitive dictionary.

"""

first_header = True

remaining = header_text

if not remaining:

raise errors.InvalidHttpResponse(url, 'Empty headers')

while remaining:

100

header_file = StringIO(remaining)

101

first_line = header_file.readline()

102

if not first_line.startswith('HTTP'):

103

if first_header: # The first header *must* start with HTTP

104

raise errors.InvalidHttpResponse(url,

105

'Opening header line did not start with HTTP: %s'

106

% (first_line,))

107

assert False, 'Opening header line was not HTTP'

108

else:

109

break # We are done parsing

110

first_header = False

111

m = mimetools.Message(header_file)

112

113

# mimetools.Message parses the first header up to a blank line

114

# So while there is remaining data, it probably means there is

115

# another header to be parsed.

116

# Get rid of any preceding whitespace, which if it is all whitespace

117

# will get rid of everything.

118

remaining = header_file.read().lstrip()

119

return m

120

121

122

class HttpTransportBase(Transport):

123

"""Base class for http implementations.

124

125

Does URL parsing, etc, but not any network IO.

126

127

The protocol can be given as e.g. http+urllib://host/ to use a particular

128

implementation.

129

"""

130

131

# _proto: "http" or "https"

132

# _qualified_proto: may have "+pycurl", etc

def get_url(url):

import urllib2

mutter("get_url %s" % url)

manager = urllib2.HTTPPasswordMgrWithDefaultRealm()

url = extract_auth(url, manager)

auth_handler = urllib2.HTTPBasicAuthHandler(manager)

opener = urllib2.build_opener(auth_handler)

url_f = opener.open(url)

return url_f

class HttpTransport(Transport):

"""This is the transport agent for http:// access.

TODO: Implement pipelined versions of all of the *_multi() functions.

"""

133

134

def __init__(self, base):

135

"""Set the base path where files will be stored."""

136

proto_match = re.match(r'^(https?)(\+\w+)?://', base)

137

if not proto_match:

138

raise AssertionError("not a http url: %r" % base)

139

self._proto = proto_match.group(1)

140

impl_name = proto_match.group(2)

141

if impl_name:

142

impl_name = impl_name[1:]

143

self._impl_name = impl_name

assert base.startswith('http://') or base.startswith('https://')

144

if base[-1] != '/':

145

base = base + '/'

146

super(HttpTransportBase, self).__init__(base)

super(HttpTransport, self).__init__(base)

147

# In the future we might actually connect to the remote host

148

# rather than using get_url

149

# self._connection = None

150

(apparent_proto, self._host,

(self._proto, self._host,

151

self._path, self._parameters,

152

self._query, self._fragment) = urlparse.urlparse(self.base)

153

self._qualified_proto = apparent_proto

def should_cache(self):

"""Return True if the data pulled across should be cached locally.

"""

return True

def clone(self, offset=None):

"""Return a new HttpTransport with root at self.base + offset

100

For now HttpTransport does not actually connect, so just return

101

a new HttpTransport object.

102

"""

103

if offset is None:

104

return HttpTransport(self.base)

105

else:

106

return HttpTransport(self.abspath(offset))

154

107

155

108

def abspath(self, relpath):

156

109

"""Return the full url to the given relative path.

157

158

This can be supplied with a string or a list.

159

160

The URL returned always has the protocol scheme originally used to

161

construct the transport, even if that includes an explicit

162

implementation qualifier.

110

This can be supplied with a string or a list

163

111

"""

164

112

assert isinstance(relpath, basestring)

165

if isinstance(relpath, unicode):

166

raise InvalidURL(relpath, 'paths must not be unicode.')

167

113

if isinstance(relpath, basestring):

168

114

relpath_parts = relpath.split('/')

169

115

else:

194

140

# I'm concerned about when it chooses to strip the last

195

141

# portion of the path, and when it doesn't.

196

142

path = '/'.join(basepath)

197

if path == '':

198

path = '/'

199

result = urlparse.urlunparse((self._qualified_proto,

200

self._host, path, '', '', ''))

201

return result

202

203

def _real_abspath(self, relpath):

204

"""Produce absolute path, adjusting protocol if needed"""

205

abspath = self.abspath(relpath)

206

qp = self._qualified_proto

207

rp = self._proto

208

if self._qualified_proto != self._proto:

209

abspath = rp + abspath[len(qp):]

210

if not isinstance(abspath, str):

211

# escaping must be done at a higher level

212

abspath = abspath.encode('ascii')

213

return abspath

143

return urlparse.urlunparse((self._proto,

144

self._host, path, '', '', ''))

214

145

215

146

def has(self, relpath):

216

raise NotImplementedError("has() is abstract on %r" % self)

217

218

def get(self, relpath):

147

"""Does the target location exist?

148

149

TODO: HttpTransport.has() should use a HEAD request,

150

not a full GET request.

151

152

TODO: This should be changed so that we don't use

153

urllib2 and get an exception, the code path would be

154

cleaner if we just do an http HEAD request, and parse

155

the return code.

156

"""

157

path = relpath

158

try:

159

path = self.abspath(relpath)

160

f = get_url(path)

161

# Without the read and then close()

162

# we tend to have busy sockets.

163

f.read()

164

f.close()

165

return True

166

except urllib2.URLError, e:

167

mutter('url error code: %s for has url: %r', e.code, path)

168

if e.code == 404:

169

return False

170

raise

171

except IOError, e:

172

mutter('io error: %s %s for has url: %r',

173

e.errno, errno.errorcode.get(e.errno), path)

174

if e.errno == errno.ENOENT:

175

return False

176

raise TransportError(orig_error=e)

177

178

def get(self, relpath, decode=False):

219

179

"""Get the file at the given relative path.

220

180

221

181

:param relpath: The relative path to the file

222

182

"""

223

code, response_file = self._get(relpath, None)

224

return response_file

225

226

def _get(self, relpath, ranges):

227

"""Get a file, or part of a file.

228

229

:param relpath: Path relative to transport base URL

230

:param ranges: None to get the whole file;

231

or [(start,end)] to fetch parts of a file.

232

233

:returns: (http_code, result_file)

234

235

Note that the current http implementations can only fetch one range at

236

a time through this call.

237

"""

238

raise NotImplementedError(self._get)

239

240

def readv(self, relpath, offsets):

241

"""Get parts of the file at the given relative path.

242

243

:param offsets: A list of (offset, size) tuples.

244

:return: A list or generator of (offset, data) tuples

245

"""

246

ranges = self.offsets_to_ranges(offsets)

247

mutter('http readv of %s collapsed %s offsets => %s',

248

relpath, len(offsets), ranges)

249

code, f = self._get(relpath, ranges)

250

for start, size in offsets:

251

f.seek(start, (start < 0) and 2 or 0)

252

start = f.tell()

253

data = f.read(size)

254

assert len(data) == size

255

yield start, data

256

257

@staticmethod

258

def offsets_to_ranges(offsets):

259

"""Turn a list of offsets and sizes into a list of byte ranges.

260

261

:param offsets: A list of tuples of (start, size). An empty list

262

is not accepted.

263

:return: a list of inclusive byte ranges (start, end)

264

Adjacent ranges will be combined.

265

"""

266

# Make sure we process sorted offsets

267

offsets = sorted(offsets)

268

269

prev_end = None

270

combined = []

271

272

for start, size in offsets:

273

end = start + size - 1

274

if prev_end is None:

275

combined.append([start, end])

276

elif start <= prev_end + 1:

277

combined[-1][1] = end

278

else:

279

combined.append([start, end])

280

prev_end = end

281

282

return combined

183

path = relpath

184

try:

185

path = self.abspath(relpath)

186

return get_url(path)

187

except urllib2.HTTPError, e:

188

mutter('url error code: %s for has url: %r', e.code, path)

189

if e.code == 404:

190

raise NoSuchFile(path, extra=e)

191

raise

192

except (BzrError, IOError), e:

193

if hasattr(e, 'errno'):

194

mutter('io error: %s %s for has url: %r',

195

e.errno, errno.errorcode.get(e.errno), path)

196

if e.errno == errno.ENOENT:

197

raise NoSuchFile(path, extra=e)

198

raise ConnectionError(msg = "Error retrieving %s: %s"

199

% (self.abspath(relpath), str(e)),

200

orig_error=e)

283

201

284

202

def put(self, relpath, f, mode=None):

285

203

"""Copy the file-like or string object into the location.

318

236

# At this point HttpTransport might be able to check and see if

319

237

# the remote location is the same, and rather than download, and

320

238

# then upload, it could just issue a remote copy_this command.

321

if isinstance(other, HttpTransportBase):

239

if isinstance(other, HttpTransport):

322

240

raise TransportNotPossible('http cannot be the target of copy_to()')

323

241

else:

324

return super(HttpTransportBase, self).\

325

copy_to(relpaths, other, mode=mode, pb=pb)

242

return super(HttpTransport, self).copy_to(relpaths, other, mode=mode, pb=pb)

326

243

327

244

def move(self, rel_from, rel_to):

328

245

"""Move the item at rel_from to the location at rel_to"""

366

283

"""

367

284

raise TransportNotPossible('http does not support lock_write()')

368

285

369

def clone(self, offset=None):

370

"""Return a new HttpTransportBase with root at self.base + offset

371

For now HttpTransportBase does not actually connect, so just return

372

a new HttpTransportBase object.

373

"""

374

if offset is None:

375

return self.__class__(self.base)

376

else:

377

return self.__class__(self.abspath(offset))

378

379

@staticmethod

380

def range_header(ranges, tail_amount):

381

"""Turn a list of bytes ranges into a HTTP Range header value.

382

383

:param ranges: A list of byte ranges, (start, end). An empty list

384

is not accepted.

385

386

:return: HTTP range header string.

387

"""

388

strings = []

389

for start, end in ranges:

390

strings.append('%d-%d' % (start, end))

391

392

if tail_amount:

393

strings.append('-%d' % tail_amount)

394

395

return ','.join(strings)

396

397

286

398

287

#---------------- test server facilities ----------------

399

# TODO: load these only when running tests

288

import BaseHTTPServer, SimpleHTTPServer, socket, time

289

import threading

400

290

401

291

402

292

class WebserverNotAvailable(Exception):

411

301

class TestingHTTPRequestHandler(SimpleHTTPServer.SimpleHTTPRequestHandler):

412

302

413

303

def log_message(self, format, *args):

414

self.server.test_case.log('webserver - %s - - [%s] %s "%s" "%s"',

304

self.server.test_case.log("webserver - %s - - [%s] %s",

415

305

self.address_string(),

416

306

self.log_date_time_string(),

417

format % args,

418

self.headers.get('referer', '-'),

419

self.headers.get('user-agent', '-'))

307

format%args)

420

308

421

309

def handle_one_request(self):

422

310

"""Handle a single HTTP request.

452

340

method = getattr(self, mname)

453

341

method()

454

342

455

if sys.platform == 'win32':

456

# On win32 you cannot access non-ascii filenames without

457

# decoding them into unicode first.

458

# However, under Linux, you can access bytestream paths

459

# without any problems. If this function was always active

460

# it would probably break tests when LANG=C was set

461

def translate_path(self, path):

462

"""Translate a /-separated PATH to the local filename syntax.

463

464

For bzr, all url paths are considered to be utf8 paths.

465

On Linux, you can access these paths directly over the bytestream

466

request, but on win32, you must decode them, and access them

467

as Unicode files.

468

"""

469

# abandon query parameters

470

path = urlparse.urlparse(path)[2]

471

path = posixpath.normpath(urllib.unquote(path))

472

path = path.decode('utf-8')

473

words = path.split('/')

474

words = filter(None, words)

475

path = os.getcwdu()

476

for word in words:

477

drive, word = os.path.splitdrive(word)

478

head, word = os.path.split(word)

479

if word in (os.curdir, os.pardir): continue

480

path = os.path.join(path, word)

481

return path

482

483

484

343

class TestingHTTPServer(BaseHTTPServer.HTTPServer):

485

344

def __init__(self, server_address, RequestHandlerClass, test_case):

486

345

BaseHTTPServer.HTTPServer.__init__(self, server_address,

491

350

class HttpServer(Server):

492

351

"""A test server for http transports."""

493

352

494

# used to form the url that connects to this server

495

_url_protocol = 'http'

353

_HTTP_PORTS = range(13000, 0x8000)

496

354

497

355

def _http_start(self):

498

356

httpd = None

499

httpd = TestingHTTPServer(('localhost', 0),

500

TestingHTTPRequestHandler,

501

self)

502

host, port = httpd.socket.getsockname()

503

self._http_base_url = '%s://localhost:%s/' % (self._url_protocol, port)

357

for port in self._HTTP_PORTS:

358

try:

359

httpd = TestingHTTPServer(('localhost', port),

360

TestingHTTPRequestHandler,

361

self)

362

except socket.error, e:

363

if e.args[0] == errno.EADDRINUSE:

364

continue

365

print >>sys.stderr, "Cannot run webserver :-("

366

raise

367

else:

368

break

369

370

if httpd is None:

371

raise WebserverNotAvailable("Cannot run webserver :-( "

372

"no free ports in range %s..%s" %

373

(_HTTP_PORTS[0], _HTTP_PORTS[-1]))

374

375

self._http_base_url = 'http://localhost:%s/' % port

504

376

self._http_starting.release()

505

377

httpd.socket.settimeout(0.1)

506

378

524

396

self._http_starting.release()

525

397

return self._http_base_url + remote_path

526

398

527

def log(self, format, *args):

399

def log(self, *args, **kwargs):

528

400

"""Capture Server log output."""

529

self.logs.append(format % args)

401

self.logs.append(args[3])

530

402

531

403

def setUp(self):

532

404

"""See bzrlib.transport.Server.setUp."""

558

430

559

431

def get_bogus_url(self):

560

432

"""See bzrlib.transport.Server.get_bogus_url."""

561

# this is chosen to try to prevent trouble with proxies, weird dns,

562

# etc

563

return 'http://127.0.0.1:1/'

564

433

return 'http://jasldkjsalkdjalksjdkljasd'

434

435

436

def get_test_permutations():

437

"""Return the permutations to be used in testing."""

438

warn("There are no HTTPS transport provider tests yet.")

439

return [(HttpTransport, HttpServer),

440

]

Older »