~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Robert Collins
Date: 2005-10-02 22:47:02 UTC
mto: This revision was merged to the branch mainline in revision 1397.
Revision ID: robertc@robertcollins.net-20051002224701-8a8b20b90de559a6

support ghosts in commits

files added:
bzrlib/clone.py

bzrlib/mdiff.py

bzrlib/merge_core.py

bzrlib/revfile.py

bzrlib/store/compressed_text.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

files removed:
BRANCH.TODO

COPYING.txt

INSTALL

bzr.ico

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/gpg.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/option.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/sign_my_commits.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_command.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/version.py

bzrlib/versionedfile.py

bzrlib/weave_commands.py

bzrlib/win32console.py

doc/README.1st

doc/configuration.txt

doc/default.css

doc/index.txt

doc/plugins.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/using_aliases.txt

generate_docs.py

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/riodemo.py

tools/rst2html.py

tools/trace-revisions

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/ostools.py

tools/win32/start_bzr.bat

files renamed:
tools/doc_generate/autodoc_man.py => bzr-man.py

bzrlib/bundle/__init__.py => bzrlib/changeset.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/branch_implementations/test_parent.py => bzrlib/selftest/test_parent.py

bzrlib/tests/blackbox/test_revision_info.py => bzrlib/selftest/test_revision_info.py

bzrlib/tests/branch_implementations/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_fetch.py => bzrlib/selftest/testfetch.py

bzrlib/tests/test_graph.py => bzrlib/selftest/testgraph.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge.py => bzrlib/selftest/testmerge.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/blackbox/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/test_store.py => bzrlib/selftest/teststore.py

bzrlib/tests/test_transport.py => bzrlib/selftest/testtransport.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/versioned/__init__.py => bzrlib/store/weave.py

bzrlib/transport/http/__init__.py => bzrlib/transport/http.py

bzrlib/ui/__init__.py => bzrlib/ui.py

bzrlib/xml_serializer.py => bzrlib/xml.py

doc/tutorial.txt => tutorial.txt

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/newinventory.py

contrib/pwk

contrib/zsh/_bzr

setup.py *

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Base implementation of Transport over http.

There are separate implementation modules for each http client implementation.

"""Implementation of Transport over http.

"""

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

NonRelativePath, TransportError)

import os, errno

from cStringIO import StringIO

import errno

import mimetools

import os

import posixpath

import re

import sys

import urllib2

import urlparse

import urllib

from warnings import warn

# TODO: load these only when running http tests

import BaseHTTPServer, SimpleHTTPServer, socket, time

import threading

from bzrlib import errors

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError, InvalidURL)

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

from bzrlib.transport import Transport, register_transport, Server

from bzrlib.transport.http.response import (HttpMultipartRangeResponse,

HttpRangeResponse)

from bzrlib.ui import ui_factory

def extract_auth(url, password_manager):

"""Extract auth parameters from an HTTP/HTTPS url and add them to the given

password manager. Return the url, minus those auth parameters (which

confuse urllib2).

"""

assert re.match(r'^(https?)(\+\w+)?://', url), \

'invalid absolute url %r' % url

scheme, netloc, path, query, fragment = urlparse.urlsplit(url)

# velocitynet.com.au transparently proxies connections and thereby

# breaks keep-alive -- sucks!

def get_url(url):

import urllib2

mutter("get_url %s" % url)

url_f = urllib2.urlopen(url)

return url_f

class HttpTransportError(TransportError):

pass

class HttpTransport(Transport):

"""This is the transport agent for http:// access.

if '@' in netloc:

auth, netloc = netloc.split('@', 1)

if ':' in auth:

username, password = auth.split(':', 1)

else:

username, password = auth, None

if ':' in netloc:

host = netloc.split(':', 1)[0]

else:

host = netloc

username = urllib.unquote(username)

if password is not None:

password = urllib.unquote(password)

else:

password = ui_factory.get_password(prompt='HTTP %(user)@%(host) password',

user=username, host=host)

password_manager.add_password(None, host, username, password)

url = urlparse.urlunsplit((scheme, netloc, path, query, fragment))

return url

def _extract_headers(header_text, url):

"""Extract the mapping for an rfc2822 header

This is a helper function for the test suite and for _pycurl.

(urllib already parses the headers for us)

In the case that there are multiple headers inside the file,

the last one is returned.

:param header_text: A string of header information.

This expects that the first line of a header will always be HTTP ...

:param url: The url we are parsing, so we can raise nice errors

:return: mimetools.Message object, which basically acts like a case

insensitive dictionary.

"""

first_header = True

remaining = header_text

if not remaining:

raise errors.InvalidHttpResponse(url, 'Empty headers')

while remaining:

100

header_file = StringIO(remaining)

101

first_line = header_file.readline()

102

if not first_line.startswith('HTTP'):

103

if first_header: # The first header *must* start with HTTP

104

raise errors.InvalidHttpResponse(url,

105

'Opening header line did not start with HTTP: %s'

106

% (first_line,))

107

assert False, 'Opening header line was not HTTP'

108

else:

109

break # We are done parsing

110

first_header = False

111

m = mimetools.Message(header_file)

112

113

# mimetools.Message parses the first header up to a blank line

114

# So while there is remaining data, it probably means there is

115

# another header to be parsed.

116

# Get rid of any preceding whitespace, which if it is all whitespace

117

# will get rid of everything.

118

remaining = header_file.read().lstrip()

119

return m

120

121

122

class HttpTransportBase(Transport):

123

"""Base class for http implementations.

124

125

Does URL parsing, etc, but not any network IO.

126

127

The protocol can be given as e.g. http+urllib://host/ to use a particular

128

implementation.

129

"""

130

131

# _proto: "http" or "https"

132

# _qualified_proto: may have "+pycurl", etc

TODO: Implement pipelined versions of all of the *_multi() functions.

"""

133

134

def __init__(self, base):

135

"""Set the base path where files will be stored."""

136

proto_match = re.match(r'^(https?)(\+\w+)?://', base)

137

if not proto_match:

138

raise AssertionError("not a http url: %r" % base)

139

self._proto = proto_match.group(1)

140

impl_name = proto_match.group(2)

141

if impl_name:

142

impl_name = impl_name[1:]

143

self._impl_name = impl_name

144

if base[-1] != '/':

145

base = base + '/'

146

super(HttpTransportBase, self).__init__(base)

assert base.startswith('http://') or base.startswith('https://')

super(HttpTransport, self).__init__(base)

147

# In the future we might actually connect to the remote host

148

# rather than using get_url

149

# self._connection = None

150

(apparent_proto, self._host,

(self._proto, self._host,

151

self._path, self._parameters,

152

self._query, self._fragment) = urlparse.urlparse(self.base)

153

self._qualified_proto = apparent_proto

def should_cache(self):

"""Return True if the data pulled across should be cached locally.

"""

return True

def clone(self, offset=None):

"""Return a new HttpTransport with root at self.base + offset

For now HttpTransport does not actually connect, so just return

a new HttpTransport object.

"""

if offset is None:

return HttpTransport(self.base)

else:

return HttpTransport(self.abspath(offset))

154

155

def abspath(self, relpath):

156

"""Return the full url to the given relative path.

157

158

This can be supplied with a string or a list.

159

160

The URL returned always has the protocol scheme originally used to

161

construct the transport, even if that includes an explicit

162

implementation qualifier.

This can be supplied with a string or a list

163

"""

164

assert isinstance(relpath, basestring)

165

if isinstance(relpath, unicode):

166

raise InvalidURL(relpath, 'paths must not be unicode.')

167

if isinstance(relpath, basestring):

168

relpath_parts = relpath.split('/')

169

else:

170

# TODO: Don't call this with an array - no magic interfaces

171

relpath_parts = relpath[:]

172

if len(relpath_parts) > 1:

173

if relpath_parts[0] == '':

174

raise ValueError("path %r within branch %r seems to be absolute"

175

% (relpath, self._path))

176

if relpath_parts[-1] == '':

177

raise ValueError("path %r within branch %r seems to be a directory"

178

% (relpath, self._path))

relpath = [relpath]

179

basepath = self._path.split('/')

180

if len(basepath) > 0 and basepath[-1] == '':

181

basepath = basepath[:-1]

182

for p in relpath_parts:

for p in relpath:

183

if p == '..':

184

if len(basepath) == 0:

if len(basepath) < 0:

185

# In most filesystems, a request for the parent

186

# of root, just returns root.

187

continue

188

basepath.pop()

189

elif p == '.' or p == '':

elif p == '.':

190

continue # No-op

191

else:

192

basepath.append(p)

193

# Possibly, we could use urlparse.urljoin() here, but

194

# I'm concerned about when it chooses to strip the last

195

100

# portion of the path, and when it doesn't.

196

101

path = '/'.join(basepath)

197

if path == '':

198

path = '/'

199

result = urlparse.urlunparse((self._qualified_proto,

200

self._host, path, '', '', ''))

201

return result

102

return urlparse.urlunparse((self._proto,

103

self._host, path, '', '', ''))

202

104

203

def _real_abspath(self, relpath):

204

"""Produce absolute path, adjusting protocol if needed"""

205

abspath = self.abspath(relpath)

206

qp = self._qualified_proto

207

rp = self._proto

208

if self._qualified_proto != self._proto:

209

abspath = rp + abspath[len(qp):]

210

if not isinstance(abspath, str):

211

# escaping must be done at a higher level

212

abspath = abspath.encode('ascii')

213

return abspath

105

def relpath(self, abspath):

106

if not abspath.startswith(self.base):

107

raise NonRelativePath('path %r is not under base URL %r'

108

% (abspath, self.base))

109

pl = len(self.base)

110

return abspath[pl:].lstrip('/')

214

111

215

112

def has(self, relpath):

216

raise NotImplementedError("has() is abstract on %r" % self)

217

218

def get(self, relpath):

113

"""Does the target location exist?

114

115

TODO: HttpTransport.has() should use a HEAD request,

116

not a full GET request.

117

118

TODO: This should be changed so that we don't use

119

urllib2 and get an exception, the code path would be

120

cleaner if we just do an http HEAD request, and parse

121

the return code.

122

"""

123

try:

124

f = get_url(self.abspath(relpath))

125

# Without the read and then close()

126

# we tend to have busy sockets.

127

f.read()

128

f.close()

129

return True

130

except BzrError:

131

return False

132

except urllib2.URLError:

133

return False

134

except IOError, e:

135

if e.errno == errno.ENOENT:

136

return False

137

raise HttpTransportError(orig_error=e)

138

139

def get(self, relpath, decode=False):

219

140

"""Get the file at the given relative path.

220

141

221

142

:param relpath: The relative path to the file

222

143

"""

223

code, response_file = self._get(relpath, None)

224

return response_file

225

226

def _get(self, relpath, ranges):

227

"""Get a file, or part of a file.

228

229

:param relpath: Path relative to transport base URL

230

:param ranges: None to get the whole file;

231

or [(start,end)] to fetch parts of a file.

232

233

:returns: (http_code, result_file)

234

235

Note that the current http implementations can only fetch one range at

236

a time through this call.

237

"""

238

raise NotImplementedError(self._get)

239

240

def readv(self, relpath, offsets):

241

"""Get parts of the file at the given relative path.

242

243

:param offsets: A list of (offset, size) tuples.

244

:return: A list or generator of (offset, data) tuples

245

"""

246

ranges = self.offsets_to_ranges(offsets)

247

mutter('http readv of %s collapsed %s offsets => %s',

248

relpath, len(offsets), ranges)

249

code, f = self._get(relpath, ranges)

250

for start, size in offsets:

251

f.seek(start, (start < 0) and 2 or 0)

252

start = f.tell()

253

data = f.read(size)

254

assert len(data) == size

255

yield start, data

256

257

@staticmethod

258

def offsets_to_ranges(offsets):

259

"""Turn a list of offsets and sizes into a list of byte ranges.

260

261

:param offsets: A list of tuples of (start, size). An empty list

262

is not accepted.

263

:return: a list of inclusive byte ranges (start, end)

264

Adjacent ranges will be combined.

265

"""

266

# Make sure we process sorted offsets

267

offsets = sorted(offsets)

268

269

prev_end = None

270

combined = []

271

272

for start, size in offsets:

273

end = start + size - 1

274

if prev_end is None:

275

combined.append([start, end])

276

elif start <= prev_end + 1:

277

combined[-1][1] = end

278

else:

279

combined.append([start, end])

280

prev_end = end

281

282

return combined

283

284

def put(self, relpath, f, mode=None):

144

try:

145

return get_url(self.abspath(relpath))

146

except (BzrError, urllib2.URLError, IOError), e:

147

raise NoSuchFile(orig_error=e)

148

except Exception,e:

149

raise HttpTransportError(orig_error=e)

150

151

def get_partial(self, relpath, start, length=None):

152

"""Get just part of a file.

153

154

:param relpath: Path to the file, relative to base

155

:param start: The starting position to read from

156

:param length: The length to read. A length of None indicates

157

read to the end of the file.

158

:return: A file-like object containing at least the specified bytes.

159

Some implementations may return objects which can be read

160

past this length, but this is not guaranteed.

161

"""

162

# TODO: You can make specialized http requests for just

163

# a portion of the file. Figure out how to do that.

164

# For now, urllib2 returns files that cannot seek() so

165

# we just read bytes off the beginning, until we

166

# get to the point that we care about.

167

f = self.get(relpath)

168

# TODO: read in smaller chunks, in case things are

169

# buffered internally.

170

f.read(start)

171

return f

172

173

def put(self, relpath, f):

285

174

"""Copy the file-like or string object into the location.

286

175

287

176

:param relpath: Location to put the contents, relative to base.

289

178

"""

290

179

raise TransportNotPossible('http PUT not supported')

291

180

292

def mkdir(self, relpath, mode=None):

181

def mkdir(self, relpath):

293

182

"""Create a directory at the given path."""

294

183

raise TransportNotPossible('http does not support mkdir()')

295

184

296

def rmdir(self, relpath):

297

"""See Transport.rmdir."""

298

raise TransportNotPossible('http does not support rmdir()')

299

300

185

def append(self, relpath, f):

301

186

"""Append the text in the file-like object into the final

302

187

location.

307

192

"""Copy the item at rel_from to the location at rel_to"""

308

193

raise TransportNotPossible('http does not support copy()')

309

194

310

def copy_to(self, relpaths, other, mode=None, pb=None):

195

def copy_to(self, relpaths, other, pb=None):

311

196

"""Copy a set of entries from self into another Transport.

312

197

313

198

:param relpaths: A list/generator of entries to be copied.

318

203

# At this point HttpTransport might be able to check and see if

319

204

# the remote location is the same, and rather than download, and

320

205

# then upload, it could just issue a remote copy_this command.

321

if isinstance(other, HttpTransportBase):

206

if isinstance(other, HttpTransport):

322

207

raise TransportNotPossible('http cannot be the target of copy_to()')

323

208

else:

324

return super(HttpTransportBase, self).\

325

copy_to(relpaths, other, mode=mode, pb=pb)

209

return super(HttpTransport, self).copy_to(relpaths, other, pb=pb)

326

210

327

211

def move(self, rel_from, rel_to):

328

212

"""Move the item at rel_from to the location at rel_to"""

332

216

"""Delete the item at relpath"""

333

217

raise TransportNotPossible('http does not support delete()')

334

218

335

def is_readonly(self):
    """Report this transport as read-only (see Transport.is_readonly).

    :return: Always True.
    """
    return True

338

339

def listable(self):
    """Report that this transport cannot list directories.

    See Transport.listable.

    :return: Always False.
    """
    return False

219

def list_dir(self, relpath):
    """Refuse to list the files at the given location.

    WARNING: many transports do not support listing, so try to avoid
    relying on it if at all possible.

    :param relpath: Location to list; unused, since this method
        unconditionally raises.
    :raises TransportNotPossible: always.
    """
    raise TransportNotPossible('http does not support list_dir()')

342

225

343

226

def stat(self, relpath):

344

227

"""Return the stat information for a file.

366

249

"""

367

250

raise TransportNotPossible('http does not support lock_write()')

368

251

369

def clone(self, offset=None):
    """Return a new transport of the same class, optionally re-rooted.

    The new object is built with self.__class__, so a subclass clones
    to its own type.  Nothing but the constructor is called here.

    :param offset: Path passed to self.abspath() to compute the new
        root.  When None, the clone is rooted at self.base.
    :return: A new instance of self.__class__.
    """
    if offset is not None:
        new_base = self.abspath(offset)
    else:
        new_base = self.base
    return self.__class__(new_base)

378

379

@staticmethod

380

def range_header(ranges, tail_amount):

381

"""Turn a list of bytes ranges into a HTTP Range header value.

382

383

:param offsets: A list of byte ranges, (start, end). An empty list

384

is not accepted.

385

386

:return: HTTP range header string.

387

"""

388

strings = []

389

for start, end in ranges:

390

strings.append('%d-%d' % (start, end))

391

392

if tail_amount:

393

strings.append('-%d' % tail_amount)

394

395

return ','.join(strings)

396

397

398

#---------------- test server facilities ----------------

399

# TODO: load these only when running tests

400

401

402

class WebserverNotAvailable(Exception):
    """Exception type declared for the test server facilities.

    NOTE(review): presumably meant to signal that no web server could
    be started; nothing in the visible code raises it -- confirm.
    """

404

405

406

class BadWebserverPath(ValueError):
    """A path that does not lie inside the directory being served.

    Must be constructed with exactly two arguments, (path, directory);
    __str__ interpolates both into its message.
    """

    def __str__(self):
        template = 'path %s is not in %s'
        return template % self.args

409

410

411

class TestingHTTPRequestHandler(SimpleHTTPServer.SimpleHTTPRequestHandler):

412

413

def log_message(self, format, *args):

414

self.server.test_case.log('webserver - %s - - [%s] %s "%s" "%s"',

415

self.address_string(),

416

self.log_date_time_string(),

417

format % args,

418

self.headers.get('referer', '-'),

419

self.headers.get('user-agent', '-'))

420

421

def handle_one_request(self):

422

"""Handle a single HTTP request.

423

424

You normally don't need to override this method; see the class

425

__doc__ string for information on how to handle specific HTTP

426

commands such as GET and POST.

427

428

"""

429

for i in xrange(1,11): # Don't try more than 10 times

430

try:

431

self.raw_requestline = self.rfile.readline()

432

except socket.error, e:

433

if e.args[0] in (errno.EAGAIN, errno.EWOULDBLOCK):

434

# omitted for now because some tests look at the log of

435

# the server and expect to see no errors. see recent

436

# email thread. -- mbp 20051021.

437

## self.log_message('EAGAIN (%d) while reading from raw_requestline' % i)

438

time.sleep(0.01)

439

continue

440

raise

441

else:

442

break

443

if not self.raw_requestline:

444

self.close_connection = 1

445

return

446

if not self.parse_request(): # An error code has been sent, just exit

447

return

448

mname = 'do_' + self.command

449

if not hasattr(self, mname):

450

self.send_error(501, "Unsupported method (%r)" % self.command)

451

return

452

method = getattr(self, mname)

453

method()

454

455

if sys.platform == 'win32':

456

# On win32 you cannot access non-ascii filenames without

457

# decoding them into unicode first.

458

# However, under Linux, you can access bytestream paths

459

# without any problems. If this function was always active

460

# it would probably break tests when LANG=C was set

461

def translate_path(self, path):

462

"""Translate a /-separated PATH to the local filename syntax.

463

464

For bzr, all url paths are considered to be utf8 paths.

465

On Linux, you can access these paths directly over the bytestream

466

request, but on win32, you must decode them, and access them

467

as Unicode files.

468

"""

469

# abandon query parameters

470

path = urlparse.urlparse(path)[2]

471

path = posixpath.normpath(urllib.unquote(path))

472

path = path.decode('utf-8')

473

words = path.split('/')

474

words = filter(None, words)

475

path = os.getcwdu()

476

for word in words:

477

drive, word = os.path.splitdrive(word)

478

head, word = os.path.split(word)

479

if word in (os.curdir, os.pardir): continue

480

path = os.path.join(path, word)

481

return path

482

483

484

class TestingHTTPServer(BaseHTTPServer.HTTPServer):
    """HTTPServer that remembers the object it is serving for.

    Request handlers reach that object as self.server.test_case.
    """

    def __init__(self, server_address, RequestHandlerClass, test_case):
        """Set up the underlying HTTPServer, then record test_case.

        :param server_address: Passed through to HTTPServer.
        :param RequestHandlerClass: Passed through to HTTPServer.
        :param test_case: Object stored as self.test_case.
        """
        BaseHTTPServer.HTTPServer.__init__(
            self, server_address, RequestHandlerClass)
        self.test_case = test_case

489

490

491

class HttpServer(Server):
    """A test server for http transports."""

    # used to form the url that connects to this server
    _url_protocol = 'http'

    def _http_start(self):
        """Thread body: start the web server and serve until told to stop.

        Binds a TestingHTTPServer to a free port on localhost, publishes
        the resulting base url, releases the _http_starting lock so that
        _get_remote_url() can proceed, then handles requests until
        _http_running becomes false.
        """
        httpd = TestingHTTPServer(('localhost', 0),
                                  TestingHTTPRequestHandler,
                                  self)
        port = httpd.socket.getsockname()[1]
        self._http_base_url = '%s://localhost:%s/' % (self._url_protocol, port)
        self._http_starting.release()
        # A short timeout lets the loop re-check _http_running regularly.
        httpd.socket.settimeout(0.1)

        while self._http_running:
            try:
                httpd.handle_request()
            except socket.timeout:
                pass

    def _get_remote_url(self, path):
        """Return the url under which a local path is served.

        :param path: Local path.  An absolute path must lie under the
            directory recorded by setUp(); a relative path is used as is.
        :return: self._http_base_url followed by the '/'-joined path.
        :raises BadWebserverPath: if path is absolute but not under the
            served directory.
        """
        path_parts = path.split(os.path.sep)
        if os.path.isabs(path):
            if path_parts[:len(self._local_path_parts)] != \
                   self._local_path_parts:
                # Report the directory the comparison was made against.
                raise BadWebserverPath(path, self._home_dir)
            remote_path = '/'.join(path_parts[len(self._local_path_parts):])
        else:
            remote_path = '/'.join(path_parts)

        # Block until _http_start() has published _http_base_url.
        self._http_starting.acquire()
        self._http_starting.release()
        return self._http_base_url + remote_path

    def log(self, format, *args):
        """Capture Server log output."""
        self.logs.append(format % args)

    def setUp(self):
        """See bzrlib.transport.Server.setUp."""
        self._home_dir = os.getcwdu()
        self._local_path_parts = self._home_dir.split(os.path.sep)
        # Held until the server thread has published its url.
        self._http_starting = threading.Lock()
        self._http_starting.acquire()
        self._http_running = True
        self._http_base_url = None
        self._http_thread = threading.Thread(target=self._http_start)
        self._http_thread.setDaemon(True)
        self._http_thread.start()
        # Remove any http_proxy setting for the lifetime of the server;
        # tearDown() puts it back.
        self._http_proxy = os.environ.get("http_proxy")
        if self._http_proxy is not None:
            del os.environ["http_proxy"]
        self.logs = []

    def tearDown(self):
        """See bzrlib.transport.Server.tearDown."""
        self._http_running = False
        self._http_thread.join()
        if self._http_proxy is not None:
            os.environ["http_proxy"] = self._http_proxy

    def get_url(self):
        """See bzrlib.transport.Server.get_url."""
        return self._get_remote_url(self._home_dir)

    def get_bogus_url(self):
        """See bzrlib.transport.Server.get_bogus_url."""
        # this is chosen to try to prevent trouble with proxies, weird dns,
        # etc
        return 'http://127.0.0.1:1/'

564

252

register_transport('http://', HttpTransport)

253

register_transport('https://', HttpTransport)

Older »