~bzr-pqm/bzr/bzr.dev

4763.2.4 by John Arbash Meinel
merge bzr.2.1 in preparation for NEWS entry.
1
# Copyright (C) 2006-2010 Canonical Ltd
1540.3.18 by Martin Pool
Style review fixes (thanks robertc)
2
#
1540.3.3 by Martin Pool
Review updates of pycurl transport
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
1540.3.18 by Martin Pool
Style review fixes (thanks robertc)
7
#
1540.3.3 by Martin Pool
Review updates of pycurl transport
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
1540.3.18 by Martin Pool
Style review fixes (thanks robertc)
12
#
1540.3.3 by Martin Pool
Review updates of pycurl transport
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
4183.7.1 by Sabin Iacob
update FSF mailing address
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
1540.3.3 by Martin Pool
Review updates of pycurl transport
16
2004.1.2 by vila
Implements a BasicAuthManager.
17
from cStringIO import StringIO
2363.4.9 by Vincent Ladeuil
Catch first succesful authentification to avoid further 401
18
import urllib
19
import urlparse
1540.3.3 by Martin Pool
Review updates of pycurl transport
20
2485.8.41 by Vincent Ladeuil
Finish http refactoring. Test suite passing.
21
from bzrlib import (
22
    errors,
3052.3.3 by Vincent Ladeuil
Add -Dhttp support.
23
    trace,
2485.8.41 by Vincent Ladeuil
Finish http refactoring. Test suite passing.
24
    urlutils,
25
    )
3052.3.3 by Vincent Ladeuil
Add -Dhttp support.
26
from bzrlib.transport import http
3059.2.2 by Vincent Ladeuil
Read http responses on demand without buffering the whole body
27
# TODO: handle_response should be integrated into the http/__init__.py
2004.2.1 by John Arbash Meinel
Cleanup of urllib functions
28
from bzrlib.transport.http.response import handle_response
2004.1.1 by vila
Connection sharing, with redirection. without authentification.
29
from bzrlib.transport.http._urllib2_wrappers import (
2004.2.1 by John Arbash Meinel
Cleanup of urllib functions
30
    Opener,
2004.1.1 by vila
Connection sharing, with redirection. without authentification.
31
    Request,
2004.2.1 by John Arbash Meinel
Cleanup of urllib functions
32
    )
33
1540.3.3 by Martin Pool
Review updates of pycurl transport
34
3052.3.3 by Vincent Ladeuil
Add -Dhttp support.
35
class HttpTransport_urllib(http.HttpTransportBase):
    """Python urllib transport for http and https."""

    # In order to debug we have to issue our traces in sync with
    # httplib, which uses print :(
    _debuglevel = 0

    # Factory used to build the opener when none is inherited from another
    # transport (see __init__).
    _opener_class = Opener

    def __init__(self, base, _from_transport=None):
        """Create the transport, reusing the opener of _from_transport if any.

        :param base: Passed through to the base class constructor.
        :param _from_transport: Optional transport whose ``_opener`` is
            shared with this one. When None, a new opener is built from
            ``_opener_class``.
        """
        super(HttpTransport_urllib, self).__init__(
            base, 'urllib', _from_transport=_from_transport)
        if _from_transport is not None:
            self._opener = _from_transport._opener
        else:
            self._opener = self._opener_class(
                report_activity=self._report_activity)

    def _perform(self, request):
        """Send the request to the server and handles common errors.

        :param request: The Request to send. Its ``connection``, ``auth`` and
            ``proxy_auth`` attributes are set here before it is opened.
        :returns: urllib2 Response object
        :raises errors.RedirectRequested: if the request does not follow
            redirections and the response code is 301, 302, 303 or 307.
        """
        connection = self._get_connection()
        if connection is not None:
            # Give back shared info
            request.connection = connection
            (auth, proxy_auth) = self._get_credentials()
            # Clean the httplib.HTTPConnection pipeline in case the previous
            # request couldn't do it
            connection.cleanup_pipe()
        else:
            # First request, initialize credentials.
            # scheme and realm will be set by the _urllib2_wrappers.AuthHandler
            auth = self._create_auth()
            # Proxy initialization will be done by the first proxied request
            proxy_auth = dict()
        # Ensure authentication info is provided
        request.auth = auth
        request.proxy_auth = proxy_auth

        if self._debuglevel > 0:
            # Single parenthesized argument: prints the same text whether
            # print is a statement or a function.
            print('perform: %s base: %s, url: %s' % (request.method, self.base,
                                                     request.get_full_url()))
        response = self._opener.open(request)
        if self._get_connection() is not request.connection:
            # First connection or reconnection
            self._set_connection(request.connection,
                                 (request.auth, request.proxy_auth))
        else:
            # http may change the credentials while keeping the
            # connection opened
            self._update_credentials((request.auth, request.proxy_auth))

        code = response.code
        if (request.follow_redirections is False
            and code in (301, 302, 303, 307)):
            raise errors.RedirectRequested(request.get_full_url(),
                                           request.redirected_to,
                                           is_permanent=(code == 301))

        if request.redirected_to is not None:
            # Let mutter do the formatting instead of building the string
            # up front.
            trace.mutter('redirected from: %s to: %s',
                         request.get_full_url(), request.redirected_to)

        return response

    def disconnect(self):
        """Close the current connection, if there is one."""
        connection = self._get_connection()
        if connection is not None:
            connection.close()

    def _get(self, relpath, offsets, tail_amount=0):
        """See HttpTransport._get

        :param relpath: Path resolved through ``_remote_path``.
        :param offsets: Offsets handed to ``_attempted_range_header``.
        :param tail_amount: Tail size handed to ``_attempted_range_header``.
        :returns: A (code, data) tuple where data is the result of
            ``handle_response``.
        :raises errors.NoSuchFile: on a 404 response.
        :raises errors.InvalidHttpRange: on a 400 or 416 response.
        """
        abspath = self._remote_path(relpath)
        headers = {}
        accepted_errors = [200, 404]
        # Always bound so the 400/416 branch below can never hit an
        # unbound local, whatever path led there.
        range_header = None
        if offsets or tail_amount:
            range_header = self._attempted_range_header(offsets, tail_amount)
            if range_header is not None:
                # Range-related codes are only acceptable when a Range
                # header is actually sent.
                accepted_errors.extend([206, 400, 416])
                headers = {'Range': 'bytes=' + range_header}

        request = Request('GET', abspath, None, headers,
                          accepted_errors=accepted_errors)
        response = self._perform(request)

        code = response.code
        if code == 404: # not found
            raise errors.NoSuchFile(abspath)
        elif code in (400, 416):
            # We don't know which, but one of the ranges we specified was
            # wrong.
            raise errors.InvalidHttpRange(abspath, range_header,
                                          'Server return code %d' % code)

        data = handle_response(abspath, code, response.info(), response)
        return code, data

    def _post(self, body_bytes):
        """POST body_bytes to the '.bzr/smart' path.

        :param body_bytes: The request body.
        :returns: A (code, data) tuple where data is the result of
            ``handle_response``.
        """
        abspath = self._remote_path('.bzr/smart')
        # We include 403 in accepted_errors so that send_http_smart_request can
        # handle a 403.  Otherwise a 403 causes an unhandled TransportError.
        response = self._perform(
            Request('POST', abspath, body_bytes,
                    {'Content-Type': 'application/octet-stream'},
                    accepted_errors=[200, 403]))
        code = response.code
        data = handle_response(abspath, code, response.info(), response)
        return code, data

    def _head(self, relpath):
        """Request the HEAD of a file.

        Performs the request and leaves callers handle the results.

        :param relpath: Path resolved through ``_remote_path``.
        :returns: The response object returned by ``_perform``.
        """
        abspath = self._remote_path(relpath)
        request = Request('HEAD', abspath,
                          accepted_errors=[200, 404])
        return self._perform(request)

    def has(self, relpath):
        """Does the target location exist?

        :returns: True if a HEAD request answers 200, False otherwise.
        """
        response = self._head(relpath)
        return response.code == 200
1540.3.25 by Martin Pool
New 'http+urllib' scheme
171
172
1540.3.6 by Martin Pool
[merge] update from bzr.dev
173
def get_test_permutations():
    """Return the (transport class, server class) pairs used in testing.

    The http pair is always included; the https pair is added only when
    ``features.HTTPSServerFeature.available()`` is true.
    """
    # Test modules are imported inside the function, not at module level.
    from bzrlib.tests import features, http_server

    pairs = [(HttpTransport_urllib, http_server.HttpServer_urllib)]
    if not features.HTTPSServerFeature.available():
        return pairs

    from bzrlib.tests import https_server
    pairs.append((HttpTransport_urllib, https_server.HTTPSServer_urllib))
    return pairs