~bzr-pqm/bzr/bzr.dev

2004.1.40 by v.ladeuil+lp at free
Fix the race condition again and correct some small typos to be in
1
# Copyright (C) 2006 Canonical Ltd
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
17
import BaseHTTPServer
18
import errno
19
import os
20
from SimpleHTTPServer import SimpleHTTPRequestHandler
21
import socket
2146.1.1 by Alexander Belchenko
fixes for test suite: forgotten imports in HttpServer.py
22
import posixpath
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
23
import random
24
import re
25
import sys
26
import threading
27
import time
2146.1.1 by Alexander Belchenko
fixes for test suite: forgotten imports in HttpServer.py
28
import urllib
29
import urlparse
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
30
31
from bzrlib.transport import Server
2381.1.2 by Robert Collins
Fixup the test changes made for hpss to be clean and self contained.
32
from bzrlib.transport.local import LocalURLServer
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
33
34
35
class WebserverNotAvailable(Exception):
36
    pass
37
38
39
class BadWebserverPath(ValueError):
40
    def __str__(self):
41
        return 'path %s is not in %s' % self.args
42
43
44
class TestingHTTPRequestHandler(SimpleHTTPRequestHandler):
45
46
    def log_message(self, format, *args):
2164.2.28 by Vincent Ladeuil
TestingHTTPServer.test_case_server renamed from test_case to avoid confusions.
47
        tcs = self.server.test_case_server
48
        tcs.log('webserver - %s - - [%s] %s "%s" "%s"',
49
                self.address_string(),
50
                self.log_date_time_string(),
51
                format % args,
52
                self.headers.get('referer', '-'),
53
                self.headers.get('user-agent', '-'))
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
54
55
    def handle_one_request(self):
56
        """Handle a single HTTP request.
57
58
        You normally don't need to override this method; see the class
59
        __doc__ string for information on how to handle specific HTTP
60
        commands such as GET and POST.
61
62
        """
63
        for i in xrange(1,11): # Don't try more than 10 times
64
            try:
65
                self.raw_requestline = self.rfile.readline()
66
            except socket.error, e:
67
                if e.args[0] in (errno.EAGAIN, errno.EWOULDBLOCK):
68
                    # omitted for now because some tests look at the log of
69
                    # the server and expect to see no errors.  see recent
70
                    # email thread. -- mbp 20051021. 
71
                    ## self.log_message('EAGAIN (%d) while reading from raw_requestline' % i)
72
                    time.sleep(0.01)
73
                    continue
74
                raise
75
            else:
76
                break
77
        if not self.raw_requestline:
78
            self.close_connection = 1
79
            return
80
        if not self.parse_request(): # An error code has been sent, just exit
81
            return
82
        mname = 'do_' + self.command
83
        if getattr(self, mname, None) is None:
84
            self.send_error(501, "Unsupported method (%r)" % self.command)
85
            return
86
        method = getattr(self, mname)
87
        method()
88
89
    _range_regexp = re.compile(r'^(?P<start>\d+)-(?P<end>\d+)$')
90
    _tail_regexp = re.compile(r'^-(?P<tail>\d+)$')
91
92
    def parse_ranges(self, ranges_header):
2182.2.1 by v.ladeuil+lp at free
Aaron was right. Thanks to him, the http server RFC2616 compliance
93
        """Parse the range header value and returns ranges and tail.
94
95
        RFC2616 14.35 says that syntactically invalid range
96
        specifiers MUST be ignored. In that case, we return 0 for
97
        tail and [] for ranges.
98
        """
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
99
        tail = 0
100
        ranges = []
2182.2.1 by v.ladeuil+lp at free
Aaron was right. Thanks to him, the http server RFC2616 compliance
101
        if not ranges_header.startswith('bytes='):
102
            # Syntactically invalid header
103
            return 0, []
104
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
105
        ranges_header = ranges_header[len('bytes='):]
106
        for range_str in ranges_header.split(','):
2182.2.1 by v.ladeuil+lp at free
Aaron was right. Thanks to him, the http server RFC2616 compliance
107
            # FIXME: RFC2616 says end is optional and default to file_size
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
108
            range_match = self._range_regexp.match(range_str)
109
            if range_match is not None:
2182.2.2 by v.ladeuil+lp at free
Thanks again to Aaron, the http server RFC2616 compliance
110
                start = int(range_match.group('start'))
111
                end = int(range_match.group('end'))
112
                if start > end:
113
                    # Syntactically invalid range
114
                    return 0, []
115
                ranges.append((start, end))
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
116
            else:
117
                tail_match = self._tail_regexp.match(range_str)
118
                if tail_match is not None:
119
                    tail = int(tail_match.group('tail'))
2182.2.1 by v.ladeuil+lp at free
Aaron was right. Thanks to him, the http server RFC2616 compliance
120
                else:
121
                    # Syntactically invalid range
122
                    return 0, []
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
123
        return tail, ranges
124
125
    def send_range_content(self, file, start, length):
126
        file.seek(start)
127
        self.wfile.write(file.read(length))
128
129
    def get_single_range(self, file, file_size, start, end):
130
        self.send_response(206)
131
        length = end - start + 1
132
        self.send_header('Accept-Ranges', 'bytes')
133
        self.send_header("Content-Length", "%d" % length)
134
135
        self.send_header("Content-Type", 'application/octet-stream')
136
        self.send_header("Content-Range", "bytes %d-%d/%d" % (start,
137
                                                              end,
138
                                                              file_size))
139
        self.end_headers()
140
        self.send_range_content(file, start, length)
141
142
    def get_multiple_ranges(self, file, file_size, ranges):
143
        self.send_response(206)
144
        self.send_header('Accept-Ranges', 'bytes')
145
        boundary = "%d" % random.randint(0,0x7FFFFFFF)
146
        self.send_header("Content-Type",
147
                         "multipart/byteranges; boundary=%s" % boundary)
148
        self.end_headers()
149
        for (start, end) in ranges:
150
            self.wfile.write("--%s\r\n" % boundary)
151
            self.send_header("Content-type", 'application/octet-stream')
152
            self.send_header("Content-Range", "bytes %d-%d/%d" % (start,
153
                                                                  end,
154
                                                                  file_size))
155
            self.end_headers()
156
            self.send_range_content(file, start, end - start + 1)
157
            self.wfile.write("--%s\r\n" % boundary)
158
159
    def do_GET(self):
160
        """Serve a GET request.
161
162
        Handles the Range header.
163
        """
164
165
        path = self.translate_path(self.path)
166
        ranges_header_value = self.headers.get('Range')
167
        if ranges_header_value is None or os.path.isdir(path):
168
            # Let the mother class handle most cases
169
            return SimpleHTTPRequestHandler.do_GET(self)
170
171
        try:
172
            # Always read in binary mode. Opening files in text
173
            # mode may cause newline translations, making the
174
            # actual size of the content transmitted *less* than
175
            # the content-length!
176
            file = open(path, 'rb')
177
        except IOError:
178
            self.send_error(404, "File not found")
2000.3.9 by v.ladeuil+lp at free
The tests that would have help avoid bug #73948 and all that mess :)
179
            return
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
180
181
        file_size = os.fstat(file.fileno())[6]
182
        tail, ranges = self.parse_ranges(ranges_header_value)
183
        # Normalize tail into ranges
184
        if tail != 0:
185
            ranges.append((file_size - tail, file_size))
186
2182.2.2 by v.ladeuil+lp at free
Thanks again to Aaron, the http server RFC2616 compliance
187
        self._satisfiable_ranges = True
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
188
        if len(ranges) == 0:
2182.2.2 by v.ladeuil+lp at free
Thanks again to Aaron, the http server RFC2616 compliance
189
            self._satisfiable_ranges = False
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
190
        else:
2182.2.1 by v.ladeuil+lp at free
Aaron was right. Thanks to him, the http server RFC2616 compliance
191
            def check_range(range_specifier):
192
                start, end = range_specifier
2182.2.2 by v.ladeuil+lp at free
Thanks again to Aaron, the http server RFC2616 compliance
193
                # RFC2616 14.35, ranges are invalid if start >= file_size
194
                if start >= file_size:
195
                    self._satisfiable_ranges = False # Side-effect !
2182.2.1 by v.ladeuil+lp at free
Aaron was right. Thanks to him, the http server RFC2616 compliance
196
                    return 0, 0
197
                # RFC2616 14.35, end values should be truncated
198
                # to file_size -1 if they exceed it
199
                end = min(end, file_size - 1)
200
                return start, end
201
202
            ranges = map(check_range, ranges)
203
2182.2.2 by v.ladeuil+lp at free
Thanks again to Aaron, the http server RFC2616 compliance
204
        if not self._satisfiable_ranges:
2182.2.1 by v.ladeuil+lp at free
Aaron was right. Thanks to him, the http server RFC2616 compliance
205
            # RFC2616 14.16 and 14.35 says that when a server
206
            # encounters unsatisfiable range specifiers, it
207
            # SHOULD return a 416.
2000.3.9 by v.ladeuil+lp at free
The tests that would have help avoid bug #73948 and all that mess :)
208
            file.close()
2182.2.1 by v.ladeuil+lp at free
Aaron was right. Thanks to him, the http server RFC2616 compliance
209
            # FIXME: We SHOULD send a Content-Range header too,
210
            # but the implementation of send_error does not
211
            # allows that. So far.
2000.3.9 by v.ladeuil+lp at free
The tests that would have help avoid bug #73948 and all that mess :)
212
            self.send_error(416, "Requested range not satisfiable")
213
            return
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
214
215
        if len(ranges) == 1:
216
            (start, end) = ranges[0]
217
            self.get_single_range(file, file_size, start, end)
218
        else:
219
            self.get_multiple_ranges(file, file_size, ranges)
220
        file.close()
221
222
    if sys.platform == 'win32':
223
        # On win32 you cannot access non-ascii filenames without
224
        # decoding them into unicode first.
225
        # However, under Linux, you can access bytestream paths
226
        # without any problems. If this function was always active
227
        # it would probably break tests when LANG=C was set
228
        def translate_path(self, path):
229
            """Translate a /-separated PATH to the local filename syntax.
230
231
            For bzr, all url paths are considered to be utf8 paths.
232
            On Linux, you can access these paths directly over the bytestream
233
            request, but on win32, you must decode them, and access them
234
            as Unicode files.
235
            """
236
            # abandon query parameters
237
            path = urlparse.urlparse(path)[2]
238
            path = posixpath.normpath(urllib.unquote(path))
239
            path = path.decode('utf-8')
240
            words = path.split('/')
241
            words = filter(None, words)
242
            path = os.getcwdu()
243
            for word in words:
244
                drive, word = os.path.splitdrive(word)
245
                head, word = os.path.split(word)
246
                if word in (os.curdir, os.pardir): continue
247
                path = os.path.join(path, word)
248
            return path
249
250
251
class TestingHTTPServer(BaseHTTPServer.HTTPServer):
2164.2.28 by Vincent Ladeuil
TestingHTTPServer.test_case_server renamed from test_case to avoid confusions.
252
253
    def __init__(self, server_address, RequestHandlerClass,
254
                 test_case_server):
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
255
        BaseHTTPServer.HTTPServer.__init__(self, server_address,
2164.2.28 by Vincent Ladeuil
TestingHTTPServer.test_case_server renamed from test_case to avoid confusions.
256
                                           RequestHandlerClass)
257
        # test_case_server can be used to communicate between the
2164.2.29 by Vincent Ladeuil
Test the http redirection at the request level even if it's not
258
        # tests and the server (or the request handler and the
259
        # server), allowing dynamic behaviors to be defined from
260
        # the tests cases.
2164.2.28 by Vincent Ladeuil
TestingHTTPServer.test_case_server renamed from test_case to avoid confusions.
261
        self.test_case_server = test_case_server
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
262
263
264
class HttpServer(Server):
265
    """A test server for http transports.
266
267
    Subclasses can provide a specific request handler.
268
    """
269
270
    # used to form the url that connects to this server
271
    _url_protocol = 'http'
272
273
    # Subclasses can provide a specific request handler
274
    def __init__(self, request_handler=TestingHTTPRequestHandler):
275
        Server.__init__(self)
276
        self.request_handler = request_handler
2164.2.13 by v.ladeuil+lp at free
Add tests for redirection. Preserve transport decorations.
277
        self.host = 'localhost'
278
        self.port = 0
279
        self._httpd = None
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
280
2004.1.28 by v.ladeuil+lp at free
Merge bzr.dev. Including http modifications by "smart" related code
281
    def _get_httpd(self):
2164.2.13 by v.ladeuil+lp at free
Add tests for redirection. Preserve transport decorations.
282
        if self._httpd is None:
283
            self._httpd = TestingHTTPServer((self.host, self.port),
284
                                            self.request_handler,
285
                                            self)
286
            host, self.port = self._httpd.socket.getsockname()
287
        return self._httpd
2004.1.28 by v.ladeuil+lp at free
Merge bzr.dev. Including http modifications by "smart" related code
288
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
289
    def _http_start(self):
2004.1.28 by v.ladeuil+lp at free
Merge bzr.dev. Including http modifications by "smart" related code
290
        httpd = self._get_httpd()
2164.2.13 by v.ladeuil+lp at free
Add tests for redirection. Preserve transport decorations.
291
        self._http_base_url = '%s://%s:%s/' % (self._url_protocol,
292
                                               self.host,
293
                                               self.port)
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
294
        self._http_starting.release()
295
        httpd.socket.settimeout(0.1)
296
297
        while self._http_running:
298
            try:
299
                httpd.handle_request()
300
            except socket.timeout:
301
                pass
302
303
    def _get_remote_url(self, path):
304
        path_parts = path.split(os.path.sep)
305
        if os.path.isabs(path):
306
            if path_parts[:len(self._local_path_parts)] != \
307
                   self._local_path_parts:
308
                raise BadWebserverPath(path, self.test_dir)
309
            remote_path = '/'.join(path_parts[len(self._local_path_parts):])
310
        else:
311
            remote_path = '/'.join(path_parts)
312
313
        return self._http_base_url + remote_path
314
315
    def log(self, format, *args):
316
        """Capture Server log output."""
317
        self.logs.append(format % args)
318
2381.1.2 by Robert Collins
Fixup the test changes made for hpss to be clean and self contained.
319
    def setUp(self, backing_transport_server=None):
2381.1.1 by Robert Collins
Split out hpss test fixes which dont depend on new or altered API's.
320
        """See bzrlib.transport.Server.setUp.
321
        
2381.1.2 by Robert Collins
Fixup the test changes made for hpss to be clean and self contained.
322
        :param backing_transport_server: The transport that requests over this
2381.1.1 by Robert Collins
Split out hpss test fixes which dont depend on new or altered API's.
323
            protocol should be forwarded to. Note that this is currently not
2381.1.2 by Robert Collins
Fixup the test changes made for hpss to be clean and self contained.
324
            supported for HTTP.
2381.1.1 by Robert Collins
Split out hpss test fixes which dont depend on new or altered API's.
325
        """
2381.1.2 by Robert Collins
Fixup the test changes made for hpss to be clean and self contained.
326
        # XXX: TODO: make the server back onto vfs_server rather than local
327
        # disk.
328
        assert backing_transport_server is None or \
329
            isinstance(backing_transport_server, LocalURLServer), \
330
            "HTTPServer currently assumes local transport, got %s" % \
331
            backing_transport_server
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
332
        self._home_dir = os.getcwdu()
333
        self._local_path_parts = self._home_dir.split(os.path.sep)
334
        self._http_starting = threading.Lock()
335
        self._http_starting.acquire()
336
        self._http_running = True
337
        self._http_base_url = None
338
        self._http_thread = threading.Thread(target=self._http_start)
339
        self._http_thread.setDaemon(True)
2167.3.5 by v.ladeuil+lp at free
Tests for proxies, covering #74759.
340
        self._http_thread.start()
2167.3.6 by v.ladeuil+lp at free
Take John's comments into account and add more tests.
341
        # Wait for the server thread to start (i.e release the lock)
342
        self._http_starting.acquire()
343
        self._http_starting.release()
2004.1.25 by v.ladeuil+lp at free
Shuffle http related test code. Hopefully it ends up at the right place :)
344
        self.logs = []
345
346
    def tearDown(self):
347
        """See bzrlib.transport.Server.tearDown."""
348
        self._http_running = False
349
        self._http_thread.join()
350
351
    def get_url(self):
352
        """See bzrlib.transport.Server.get_url."""
353
        return self._get_remote_url(self._home_dir)
354
355
    def get_bogus_url(self):
356
        """See bzrlib.transport.Server.get_bogus_url."""
357
        # this is chosen to try to prevent trouble with proxies, weird dns,
358
        # etc
359
        return 'http://127.0.0.1:1/'
360
361
362
class HttpServer_urllib(HttpServer):
363
    """Subclass of HttpServer that gives http+urllib urls.
364
365
    This is for use in testing: connections to this server will always go
366
    through urllib where possible.
367
    """
368
369
    # urls returned by this server should require the urllib client impl
370
    _url_protocol = 'http+urllib'
371
372
373
class HttpServer_PyCurl(HttpServer):
374
    """Subclass of HttpServer that gives http+pycurl urls.
375
376
    This is for use in testing: connections to this server will always go
377
    through pycurl where possible.
378
    """
379
380
    # We don't care about checking the pycurl availability as
381
    # this server will be required only when pycurl is present
382
383
    # urls returned by this server should require the pycurl client impl
384
    _url_protocol = 'http+pycurl'