13
13
# You should have received a copy of the GNU General Public License
14
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17
"""Tests for HTTP response parsing.
19
The handle_response method reads the response body of a GET request and returns
20
the corresponding RangeFile.
22
There are four different kinds of RangeFile:
23
- a whole file whose size is unknown, seen as a simple byte stream,
24
- a whole file whose size is known, we can't read past its end,
25
- a single range file, a part of a file with a start and a size,
26
- a multiple range file, several consecutive parts with known start offset
29
Some properties are common to all kinds:
30
- seek can only be forward (it's really a socket underneath),
31
- read can't cross ranges,
32
- successive ranges are taken into account transparently,
34
- the expected pattern of use is either seek(offset)+read(size) or a single
35
read with no size specified. For multiple range files, multiple read() will
36
return the corresponding ranges, trying to read further will raise
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17
"""Tests for HTTP response parsing."""
19
from cStringIO import StringIO
22
from bzrlib import errors
23
from bzrlib.transport import http
24
from bzrlib.transport.http import response
25
from bzrlib.tests import TestCase
28
class TestResponseRange(TestCase):
29
"""Test the ResponseRange class."""
32
RR = response.ResponseRange
35
self.assertTrue(r1 < r2)
36
self.assertFalse(r1 > r2)
37
self.assertTrue(r1 < 5)
38
self.assertFalse(r2 < 5)
40
self.assertEqual(RR(0, 10, 5), RR(0, 10, 5))
41
self.assertNotEqual(RR(0, 10, 5), RR(0, 8, 5))
42
self.assertNotEqual(RR(0, 10, 5), RR(0, 10, 6))
44
def test_sort_list(self):
45
"""Ensure longer ranges are sorted after shorter ones"""
46
RR = response.ResponseRange
47
lst = [RR(3, 8, 0), 5, RR(3, 7, 0), 6]
49
self.assertEqual([RR(3,7,0), RR(3,8,0), 5, 6], lst)
52
class TestRangeFile(TestCase):
56
content = "abcdefghijklmnopqrstuvwxyz"
57
self.fp = response.RangeFile('foo', StringIO(content))
58
self.fp._add_range(0, 9, 0)
59
self.fp._add_range(20, 29, 10)
60
self.fp._add_range(30, 39, 15)
62
def test_valid_accesses(self):
63
"""Test so that valid accesses work to the file."""
65
self.assertEquals(self.fp.read(3), 'abc')
66
self.assertEquals(self.fp.read(3), 'def')
67
self.assertEquals(self.fp.tell(), 6)
69
self.assertEquals(self.fp.read(3), 'klm')
70
self.assertEquals(self.fp.read(2), 'no')
71
self.assertEquals(self.fp.tell(), 25)
72
# should wrap over to 30-39 entity
73
self.assertEquals(self.fp.read(3), 'pqr')
75
self.assertEquals(self.fp.read(3), 'def')
76
self.assertEquals(self.fp.tell(), 6)
78
def test_invalid_accesses(self):
79
"""Test so that invalid accesses trigger errors."""
81
self.assertRaises(errors.InvalidRange, self.fp.read, 2)
83
self.assertRaises(errors.InvalidRange, self.fp.read, 2)
85
self.assertRaises(errors.InvalidRange, self.fp.read, 2)
87
def test__finish_ranges(self):
    """Test that after RangeFile._finish_ranges the list is sorted."""
    # Add ranges out of order on top of whatever self.fp already holds
    self.fp._add_range(1, 2, 3)
    self.fp._add_range(8, 9, 10)
    self.fp._add_range(3, 4, 5)

    # TODO: jam 20060706 If we switch to inserting
    #       in sorted order, remove this test
    self.assertNotEqual(self.fp._ranges, sorted(self.fp._ranges))

    self.fp._finish_ranges()
    self.assertEqual(self.fp._ranges, sorted(self.fp._ranges))
100
def test_seek_and_tell(self):
101
# Check for seeking before start
103
self.assertEqual(0, self.fp.tell())
106
self.assertEqual(5, self.fp.tell())
109
self.assertEqual(3, self.fp.tell())
111
# TODO: jam 20060706 following tests will fail if this
112
# is not true, and would be difficult to debug
113
# but it is a layering violation
114
self.assertEqual(39, self.fp._len)
117
self.assertEqual(39, self.fp.tell())
120
self.assertEqual(29, self.fp.tell())
122
self.assertRaises(ValueError, self.fp.seek, 0, 4)
123
self.assertRaises(ValueError, self.fp.seek, 0, -1)
126
class TestRegexes(TestCase):
128
def assertRegexMatches(self, groups, text):
    """Check that the regex matches and returns the right values.

    :param groups: the tuple expected from the match's ``groups()``.
    :param text: the string matched against ``self.regex``.
    """
    m = self.regex.match(text)
    # Check for a match first so that a non-matching text is reported with
    # the offending text rather than failing on m.groups() below.
    self.assertNotEqual(None, m, "text %s did not match regex" % (text,))

    self.assertEqual(groups, m.groups())
135
def test_range_re(self):
136
"""Test that we match valid ranges."""
137
self.regex = response.HttpRangeResponse._CONTENT_RANGE_RE
138
self.assertRegexMatches(('bytes', '1', '10', '11'),
140
self.assertRegexMatches(('bytes', '1', '10', '11'),
142
self.assertRegexMatches(('bytes', '2123', '4242', '1231'),
143
'\tbytes 2123-4242/1231 ')
144
self.assertRegexMatches(('chars', '1', '2', '3'),
147
def test_content_type_re(self):
    """Test that the Content-Type regex captures the boundary value."""
    self.regex = response.HttpMultipartRangeResponse._CONTENT_TYPE_RE
    self.assertRegexMatches(('xxyyzz',),
                            'multipart/byteranges; boundary = xxyyzz')
    self.assertRegexMatches(('xxyyzz',),
                            'multipart/byteranges;boundary=xxyyzz')
    # Whitespace around the value is not part of the captured group, but
    # whitespace inside it is.
    self.assertRegexMatches(('xx yy zz',),
                            ' multipart/byteranges ; boundary= xx yy zz ')
    # A media type written without the '/' must not match
    self.assertEqual(None,
                     self.regex.match('multipart byteranges;boundary=xx'))
162
Content-range: bytes 1-10/20\r
166
Content-Range: bytes 21-30/20\r
171
content-range: bytes 41-50/20\r
175
content-range: bytes 51-60/20\r
40
from cStringIO import StringIO
47
from bzrlib.transport.http import (
51
from bzrlib.tests.file_utils import (
56
class ReadSocket(object):
57
"""A socket-like object that can be given a predefined content."""
59
def __init__(self, data):
60
self.readfile = StringIO(data)
62
def makefile(self, mode='r', bufsize=None):
66
class FakeHTTPConnection(_urllib2_wrappers.HTTPConnection):
68
def __init__(self, sock):
69
_urllib2_wrappers.HTTPConnection.__init__(self, 'localhost')
70
# Set the socket to bypass the connection
74
"""Ignores the writes on the socket."""
78
class TestResponseFileIter(tests.TestCase):
    """Test iterating over a ResponseFile."""

    def test_iter_empty(self):
        """Iterating a ResponseFile built on an empty stream yields nothing."""
        f = response.ResponseFile('empty', StringIO())
        self.assertEqual([], list(f))

    def test_iter_many(self):
        """Iteration yields the lines one by one, line endings included."""
        f = response.ResponseFile('many', StringIO('0\n1\nboo!\n'))
        self.assertEqual(['0\n', '1\n', 'boo!\n'], list(f))
89
class TestHTTPConnection(tests.TestCase):
91
def test_cleanup_pipe(self):
92
sock = ReadSocket("""HTTP/1.1 200 OK\r
93
Content-Type: text/plain; charset=UTF-8\r
98
conn = FakeHTTPConnection(sock)
99
# Simulate the request sending so that the connection will be able to
101
conn.putrequest('GET', 'http://localhost/fictious')
103
# Now, get the response
104
resp = conn.getresponse()
105
# Read part of the response
106
self.assertEqual('0123456789\n', resp.read(11))
107
# Override the threshold to force the warning emission
108
conn._range_warning_thresold = 6 # There are 7 bytes pending
110
self.assertContainsRe(self.get_log(), 'Got a 200 response when asking')
113
class TestRangeFileMixin(object):
114
"""Tests for accessing the first range in a RangeFile."""
116
# A simple string used to represent a file part (also called a range), in
117
# which offsets are easy to calculate for test writers. It's used as a
118
# building block with slight variations but basically 'a' is the first char
119
# of the range and 'z' is the last.
120
alpha = 'abcdefghijklmnopqrstuvwxyz'
122
def test_can_read_at_first_access(self):
    """Test that the just created file can be read."""
    # An unbounded read() on the fresh file must return exactly self.alpha
    self.assertEqual(self.alpha, self._file.read())
126
def test_seek_read(self):
127
"""Test seek/read inside the range."""
129
start = self.first_range_start
130
# Before any use, tell() should be at the range start
131
self.assertEqual(start, f.tell())
132
cur = start # For an overall offset assertion
135
self.assertEqual('def', f.read(3))
139
self.assertEqual('klmn', f.read(4))
141
# read(0) in the middle of a range
142
self.assertEqual('', f.read(0))
146
self.assertEqual(here, f.tell())
147
self.assertEqual(cur, f.tell())
149
def test_read_zero(self):
151
self.assertEqual('', f.read(0))
153
self.assertEqual('', f.read(0))
155
def test_seek_at_range_end(self):
159
def test_read_at_range_end(self):
160
"""Test read behaviour at range end."""
162
self.assertEqual(self.alpha, f.read())
163
self.assertEqual('', f.read(0))
164
self.assertRaises(errors.InvalidRange, f.read, 1)
166
def test_unbounded_read_after_seek(self):
169
# Should not cross ranges
170
self.assertEqual('yz', f.read())
172
def test_seek_backwards(self):
174
start = self.first_range_start
177
self.assertRaises(errors.InvalidRange, f.seek, start + 5)
179
def test_seek_outside_single_range(self):
181
if f._size == -1 or f._boundary is not None:
182
raise tests.TestNotApplicable('Needs a fully defined range')
183
# Will seek past the range and then errors out
184
self.assertRaises(errors.InvalidRange,
185
f.seek, self.first_range_start + 27)
187
def test_read_past_end_of_range(self):
190
raise tests.TestNotApplicable("Can't check an unknown size")
191
start = self.first_range_start
193
self.assertRaises(errors.InvalidRange, f.read, 10)
195
def test_seek_from_end(self):
196
"""Test seeking from the end of the file.
198
The semantic is unclear in case of multiple ranges. Seeking from end
199
exists only for the http transports, cannot be used if the file size is
200
unknown and is not used in bzrlib itself. This test must be (and is)
201
overridden by daughter classes.
203
Reading from end makes sense only when a range has been requested from
204
the end of the file (see HttpTransportBase._get() when using the
205
'tail_amount' parameter). The HTTP response can only be a whole file or
210
self.assertEqual('yz', f.read())
213
class TestRangeFileSizeUnknown(tests.TestCase, TestRangeFileMixin):
214
"""Test a RangeFile for a whole file whose size is not known."""
217
super(TestRangeFileSizeUnknown, self).setUp()
218
self._file = response.RangeFile('Whole_file_size_known',
219
StringIO(self.alpha))
220
# We define no range, relying on RangeFile to provide default values
221
self.first_range_start = 0 # It's the whole file
223
def test_seek_from_end(self):
224
"""See TestRangeFileMixin.test_seek_from_end.
226
The end of the file can't be determined since the size is unknown.
228
self.assertRaises(errors.InvalidRange, self._file.seek, -1, 2)
230
def test_read_at_range_end(self):
231
"""Test read behaviour at range end."""
233
self.assertEqual(self.alpha, f.read())
234
self.assertEqual('', f.read(0))
235
self.assertEqual('', f.read(1))
238
class TestRangeFileSizeKnown(tests.TestCase, TestRangeFileMixin):
239
"""Test a RangeFile for a whole file whose size is known."""
242
super(TestRangeFileSizeKnown, self).setUp()
243
self._file = response.RangeFile('Whole_file_size_known',
244
StringIO(self.alpha))
245
self._file.set_range(0, len(self.alpha))
246
self.first_range_start = 0 # It's the whole file
249
class TestRangeFileSingleRange(tests.TestCase, TestRangeFileMixin):
250
"""Test a RangeFile for a single range."""
253
super(TestRangeFileSingleRange, self).setUp()
254
self._file = response.RangeFile('Single_range_file',
255
StringIO(self.alpha))
256
self.first_range_start = 15
257
self._file.set_range(self.first_range_start, len(self.alpha))
260
def test_read_before_range(self):
261
# This can't occur under normal circumstances, we have to force it
263
f._pos = 0 # Force an invalid pos
181
class TestHelpers(TestCase):
182
"""Test the helper functions"""
184
def test__parse_range(self):
185
"""Test that _parse_range acts reasonably."""
186
content = StringIO('')
187
parse_range = response.HttpRangeResponse._parse_range
188
self.assertEqual((1,2), parse_range('bytes 1-2/3'))
189
self.assertEqual((10,20), parse_range('bytes 10-20/2'))
191
self.assertRaises(errors.InvalidHttpRange, parse_range, 'char 1-3/2')
192
self.assertRaises(errors.InvalidHttpRange, parse_range, 'bytes a-3/2')
195
parse_range('bytes x-10/3', path='http://foo/bar')
196
except errors.InvalidHttpRange, e:
197
self.assertContainsRe(str(e), 'http://foo/bar')
198
self.assertContainsRe(str(e), 'bytes x-10/3')
200
self.fail('Did not raise InvalidHttpRange')
202
def test__parse_boundary_simple(self):
    """Test that _parse_boundary handles Content-type properly"""
    parse_boundary = response.HttpMultipartRangeResponse._parse_boundary
    m = parse_boundary(' multipart/byteranges; boundary=xxyyzz')
    self.assertNotEqual(None, m)
    # Check that the returned regex is capable of splitting simple_data
    matches = list(m.finditer(simple_data))
    self.assertEqual(4, len(matches))

    # match.group() should be the content-range entry
    # and match.end() should be the start of the content
    self.assertEqual(' bytes 1-10/20', matches[0].group(1))
    self.assertEqual(simple_data.find('1234567890'), matches[0].end())
    self.assertEqual(' bytes 21-30/20', matches[1].group(1))
    self.assertEqual(simple_data.find('abcdefghij'), matches[1].end())
    self.assertEqual(' bytes 41-50/20', matches[2].group(1))
    self.assertEqual(simple_data.find('zyxwvutsrq'), matches[2].end())
    self.assertEqual(' bytes 51-60/20', matches[3].group(1))
    self.assertEqual(simple_data.find('xxyyzz fbd'), matches[3].end())
222
def test__parse_boundary_invalid(self):
223
parse_boundary = response.HttpMultipartRangeResponse._parse_boundary
225
parse_boundary(' multipart/bytes;boundary=xxyyzz',
226
path='http://foo/bar')
227
except errors.InvalidHttpContentType, e:
228
self.assertContainsRe(str(e), 'http://foo/bar')
229
self.assertContainsRe(str(e), 'multipart/bytes;boundary=xxyyzz')
231
self.fail('Did not raise InvalidHttpContentType')
234
class TestHttpRangeResponse(TestCase):
236
def test_smoketest(self):
237
"""A basic test that HttpRangeResponse is reasonable."""
238
content = StringIO('0123456789')
239
f = response.HttpRangeResponse('http://foo', 'bytes 1-10/9', content)
240
self.assertEqual([response.ResponseRange(1,10,0)], f._ranges)
264
243
self.assertRaises(errors.InvalidRange, f.read, 2)
267
class TestRangeFileMultipleRanges(tests.TestCase, TestRangeFileMixin):
268
"""Test a RangeFile for multiple ranges.
270
The RangeFile used for the tests contains three ranges:
272
- at offset 25: alpha
273
- at offset 100: alpha
274
- at offset 126: alpha.upper()
276
The two last ranges are contiguous. This only rarely occurs (should not in
277
fact) in real uses but may lead to hard to track bugs.
280
# The following is used to represent the boundary parameter defined
281
# in HTTP response headers and the boundary lines that separate
284
boundary = "separation"
287
super(TestRangeFileMultipleRanges, self).setUp()
289
boundary = self.boundary
292
self.first_range_start = 25
293
file_size = 200 # big enough to encompass all ranges
294
for (start, part) in [(self.first_range_start, self.alpha),
295
# Two contiguous ranges
297
(126, self.alpha.upper())]:
298
content += self._multipart_byterange(part, start, boundary,
301
content += self._boundary_line()
303
self._file = response.RangeFile('Multiple_ranges_file',
305
self.set_file_boundary()
307
def _boundary_line(self):
308
"""Helper to build the formatted boundary line."""
309
return '--' + self.boundary + '\r\n'
311
def set_file_boundary(self):
    """Give the boundary string to the file under test."""
    # Ranges are set by decoding the range headers, the RangeFile user is
    # supposed to call the following before using seek or read since it
    # requires knowing the *response* headers (in that case the boundary
    # which is part of the Content-Type header).
    self._file.set_boundary(self.boundary)
318
def _multipart_byterange(self, data, offset, boundary, file_size='*'):
319
"""Encode a part of a file as a multipart/byterange MIME type.
321
When a range request is issued, the HTTP response body can be
322
decomposed in parts, each one representing a range (start, size) in a
325
:param data: The payload.
326
:param offset: where data starts in the file
327
:param boundary: used to separate the parts
328
:param file_size: the size of the file containing the range (default to
331
:return: a string containing the data encoded as it will appear in the
334
bline = self._boundary_line()
335
# Each range begins with a boundary line
337
# A range is described by a set of headers, but only 'Content-Range' is
338
# required for our implementation (TestHandleResponse below will
339
# exercise ranges with multiple or missing headers')
340
range += 'Content-Range: bytes %d-%d/%d\r\n' % (offset,
344
# Finally the raw bytes
348
def test_read_all_ranges(self):
350
self.assertEqual(self.alpha, f.read()) # Read first range
351
f.seek(100) # Trigger the second range recognition
352
self.assertEqual(self.alpha, f.read()) # Read second range
353
self.assertEqual(126, f.tell())
354
f.seek(126) # Start of third range which is also the current pos !
355
self.assertEqual('A', f.read(1))
357
self.assertEqual('LMN', f.read(3))
359
def test_seek_from_end(self):
360
"""See TestRangeFileMixin.test_seek_from_end."""
361
# The actual implementation will seek from end for the first range only
362
# and then fail. Since seeking from end is intended to be used for a
363
# single range only anyway, this test just documents the actual
367
self.assertEqual('yz', f.read())
368
self.assertRaises(errors.InvalidRange, f.seek, -2, 2)
370
def test_seek_into_void(self):
372
start = self.first_range_start
374
# Seeking to a point between two ranges is possible (only once) but
375
# reading there is forbidden
377
# We crossed a range boundary, so now the file is positioned at the
378
# start of the new range (i.e. trying to seek below 100 will error out)
382
def test_seek_across_ranges(self):
384
f.seek(126) # skip the two first ranges
385
self.assertEqual('AB', f.read(2))
387
def test_checked_read_dont_overflow_buffers(self):
389
# We force a very low value to exercise all code paths in _checked_read
390
f._discarded_buf_size = 8
391
f.seek(126) # skip the two first ranges
392
self.assertEqual('AB', f.read(2))
394
def test_seek_twice_between_ranges(self):
396
start = self.first_range_start
397
f.seek(start + 40) # Past the first range but before the second
398
# Now the file is positioned at the second range start (100)
399
self.assertRaises(errors.InvalidRange, f.seek, start + 41)
401
def test_seek_at_range_end(self):
402
"""Test seek behavior at range end."""
408
def test_read_at_range_end(self):
410
self.assertEqual(self.alpha, f.read())
411
self.assertEqual(self.alpha, f.read())
412
self.assertEqual(self.alpha.upper(), f.read())
413
self.assertRaises(errors.InvalidHttpResponse, f.read, 1)
416
class TestRangeFileMultipleRangesQuotedBoundaries(TestRangeFileMultipleRanges):
417
"""Perform the same tests as TestRangeFileMultipleRanges, but uses
418
an angle-bracket quoted boundary string like IIS 6.0 and 7.0
419
(but not IIS 5, which breaks the RFC in a different way
420
by using square brackets, not angle brackets)
422
This reveals a bug caused by
424
- The bad implementation of RFC 822 unquoting in Python (angles are not
425
quotes), coupled with
427
- The bad implementation of RFC 2046 in IIS (angles are not permitted chars
431
# The boundary as it appears in boundary lines
432
# IIS 6 and 7 use this value
433
_boundary_trimmed = "q1w2e3r4t5y6u7i8o9p0zaxscdvfbgnhmjklkl"
434
boundary = '<' + _boundary_trimmed + '>'
436
def set_file_boundary(self):
    """Give the file the boundary stripped of its angle brackets."""
    # Emulate broken rfc822.unquote() here by removing angles
    self._file.set_boundary(self._boundary_trimmed)
441
class TestRangeFileVarious(tests.TestCase):
442
"""Tests RangeFile aspects not covered elsewhere."""
444
def test_seek_whence(self):
445
"""Test the seek whence parameter values."""
446
f = response.RangeFile('foo', StringIO('abc'))
451
self.assertRaises(ValueError, f.seek, 0, 14)
453
def test_range_syntax(self):
454
"""Test the Content-Range scanning."""
456
f = response.RangeFile('foo', StringIO())
458
def ok(expected, header_value):
459
f.set_range_from_header(header_value)
460
# Slightly peek under the covers to get the size
461
self.assertEqual(expected, (f.tell(), f._size))
463
ok((1, 10), 'bytes 1-10/11')
464
ok((1, 10), 'bytes 1-10/*')
465
ok((12, 2), '\tbytes 12-13/*')
466
ok((28, 1), ' bytes 28-28/*')
467
ok((2123, 2120), 'bytes 2123-4242/12310')
468
ok((1, 10), 'bytes 1-10/ttt') # We don't check total (ttt)
470
def nok(header_value):
471
self.assertRaises(errors.InvalidHttpRange,
472
f.set_range_from_header, header_value)
476
nok('bytes xx-yyy/zzz')
477
nok('bytes xx-12/zzz')
478
nok('bytes 11-yy/zzz')
245
self.assertEqual('012345', f.read(6))
247
def test_invalid(self):
249
f = response.HttpRangeResponse('http://foo', 'bytes x-10/9',
250
StringIO('0123456789'))
251
except errors.InvalidHttpRange, e:
252
self.assertContainsRe(str(e), 'http://foo')
253
self.assertContainsRe(str(e), 'bytes x-10/9')
255
self.fail('Failed to raise InvalidHttpRange')
258
class TestHttpMultipartRangeResponse(TestCase):
259
"""Test the handling of multipart range responses"""
261
def test_simple(self):
262
content = StringIO(simple_data)
263
multi = response.HttpMultipartRangeResponse('http://foo',
264
'multipart/byteranges; boundary = xxyyzz', content)
266
self.assertEqual(4, len(multi._ranges))
269
self.assertEqual('1234567890', multi.read(10))
271
self.assertEqual('abcdefghij', multi.read(10))
273
self.assertEqual('zyxwvutsrq', multi.read(10))
275
self.assertEqual('xxyyzz fbd', multi.read(10))
276
# TODO: jam 20060706 Currently RangeFile does not support
277
# reading across ranges. Consider adding it.
279
# self.assertEqual('zyxwvutsrqxxyyzz fbd', multi.read(20))
280
self.assertRaises(errors.InvalidRange, multi.read, 20)
283
self.assertRaises(errors.InvalidRange, multi.read, 11)
285
self.assertRaises(errors.InvalidRange, multi.read, 10)
287
def test_invalid(self):
288
content = StringIO('')
290
response.HttpMultipartRangeResponse('http://foo',
291
'multipart/byte;boundary=invalid', content)
292
except errors.InvalidHttpContentType, e:
293
self.assertContainsRe(str(e), 'http://foo')
294
self.assertContainsRe(str(e), 'multipart/byte;')
482
297
# Taken from real request responses
678
_multipart_no_content_range = (206, """HTTP/1.0 206 Partial Content\r
679
Content-Type: multipart/byteranges; boundary=THIS_SEPARATES\r
680
Content-Length: 598\r
685
Content-Type: text/plain\r
692
_multipart_no_boundary = (206, """HTTP/1.0 206 Partial Content\r
693
Content-Type: multipart/byteranges; boundary=THIS_SEPARATES\r
694
Content-Length: 598\r
699
Content-Type: text/plain\r
700
Content-Range: bytes 0-18/18672\r
704
The range ended at the line above, this text is garbage instead of a boundary
709
class TestHandleResponse(tests.TestCase):
711
def _build_HTTPMessage(self, raw_headers):
712
status_and_headers = StringIO(raw_headers)
713
# Get rid of the status line
714
status_and_headers.readline()
715
msg = httplib.HTTPMessage(status_and_headers)
440
# This should be in test_http.py, but the headers we
441
# want to parse are here
442
class TestExtractHeader(TestCase):
    """Test http._extract_headers against the canned responses.

    The response fixtures are (code, headers text, body) tuples; only the
    headers text (item 1) is handed to http._extract_headers here.
    """

    def use_response(self, response):
        """Parse the headers text of response and keep it in self.headers."""
        self.headers = http._extract_headers(response[1], 'http://foo')

    def check_header(self, header, value):
        """Assert that the parsed headers hold value under the key header."""
        self.assertEqual(value, self.headers[header])

    def test_full_text(self):
        self.use_response(_full_text_response)

        # Some headers are looked up under two different capitalisations
        self.check_header('Date', 'Tue, 11 Jul 2006 04:32:56 GMT')
        self.check_header('date', 'Tue, 11 Jul 2006 04:32:56 GMT')
        self.check_header('Content-Length', '35')
        self.check_header('Content-Type', 'text/plain; charset=UTF-8')
        self.check_header('content-type', 'text/plain; charset=UTF-8')

    def test_missing_response(self):
        self.use_response(_missing_response)

        self.check_header('Content-Length', '336')
        self.check_header('Content-Type', 'text/html; charset=iso-8859-1')

    def test_single_range(self):
        self.use_response(_single_range_response)

        self.check_header('Content-Length', '100')
        self.check_header('Content-Range', 'bytes 100-199/93890')
        self.check_header('Content-Type', 'text/plain; charset=UTF-8')

    def test_multi_range(self):
        self.use_response(_multipart_range_response)

        self.check_header('Content-Length', '1534')
        self.check_header('Content-Type',
                          'multipart/byteranges; boundary=418470f848b63279b')

    def test_redirect(self):
        """We default to returning the last group of headers in the file."""
        self.use_response(_redirect_response)
        self.check_header('Content-Range', 'bytes 8623075-8623499/8623500')
        self.check_header('Content-Type', 'text/plain; charset=UTF-8')

    def test_empty(self):
        self.assertRaises(errors.InvalidHttpResponse,
                          http._extract_headers, '', 'bad url')

    def test_no_opening_http(self):
        # Remove the HTTP line from the header
        first, txt = _full_text_response[1].split('\r\n', 1)
        self.assertRaises(errors.InvalidHttpResponse,
                          http._extract_headers, txt, 'missing HTTTP')

    def test_trailing_whitespace(self):
        # Test that we ignore bogus whitespace on the end
        code, txt, body = _full_text_response
        txt += '\r\n\n\n\n\n'
        self.use_response((code, txt, body))

        self.check_header('Date', 'Tue, 11 Jul 2006 04:32:56 GMT')
        self.check_header('Content-Length', '35')
        self.check_header('Content-Type', 'text/plain; charset=UTF-8')

    def test_trailing_non_http(self):
        # Test that we ignore bogus stuff on the end
        code, txt, body = _full_text_response
        txt = txt + 'Foo: Bar\r\nBaz: Bling\r\n\r\n'
        self.use_response((code, txt, body))

        self.check_header('Date', 'Tue, 11 Jul 2006 04:32:56 GMT')
        self.check_header('Content-Length', '35')
        self.check_header('Content-Type', 'text/plain; charset=UTF-8')
        # The trailing pseudo-headers must not show up in the result
        self.assertRaises(KeyError, self.headers.__getitem__, 'Foo')

    def test_extra_whitespace(self):
        # Test that we read an HTTP response, even with extra whitespace
        code, txt, body = _redirect_response
        # Find the second HTTP location
        loc = txt.find('HTTP', 5)
        txt = txt[:loc] + '\r\n\n' + txt[loc:]
        self.use_response((code, txt, body))
        self.check_header('Content-Range', 'bytes 8623075-8623499/8623500')
        self.check_header('Content-Type', 'text/plain; charset=UTF-8')
527
class TestHandleResponse(TestCase):
718
529
def get_response(self, a_response):
719
530
"""Process a supplied response, and return the result."""
720
code, raw_headers, body = a_response
721
msg = self._build_HTTPMessage(raw_headers)
722
return response.handle_response('http://foo', code, msg,
531
headers = http._extract_headers(a_response[1], 'http://foo')
532
return response.handle_response('http://foo', a_response[0], headers,
723
533
StringIO(a_response[2]))
725
535
def test_full_text(self):
757
def test_multi_squid_range(self):
758
out = self.get_response(_multipart_squid_range_response)
760
# Just make sure we can read the right contents
767
564
def test_invalid_response(self):
768
565
self.assertRaises(errors.InvalidHttpResponse,
769
self.get_response, _invalid_response)
566
self.get_response, _invalid_response)
771
568
def test_full_text_no_content_type(self):
772
569
# We should not require Content-Type for a full response
773
code, raw_headers, body = _full_text_response_no_content_type
774
msg = self._build_HTTPMessage(raw_headers)
775
out = response.handle_response('http://foo', code, msg, StringIO(body))
776
self.assertEqual(body, out.read())
778
def test_full_text_no_content_length(self):
779
code, raw_headers, body = _full_text_response_no_content_length
780
msg = self._build_HTTPMessage(raw_headers)
781
out = response.handle_response('http://foo', code, msg, StringIO(body))
782
self.assertEqual(body, out.read())
570
a_response = _full_text_response
571
headers = http._extract_headers(a_response[1], 'http://foo')
572
del headers['Content-Type']
573
out = response.handle_response('http://foo', a_response[0], headers,
574
StringIO(a_response[2]))
575
self.assertEqual(_full_text_response[2], out.read())
577
def test_missing_no_content_type(self):
578
# Without Content-Type we should still raise NoSuchFile on a 404
579
a_response = _missing_response
580
headers = http._extract_headers(a_response[1], 'http://missing')
581
del headers['Content-Type']
582
self.assertRaises(errors.NoSuchFile,
583
response.handle_response, 'http://missing', a_response[0], headers,
584
StringIO(a_response[2]))
586
def test_missing_content_type(self):
587
a_response = _single_range_response
588
headers = http._extract_headers(a_response[1], 'http://nocontent')
589
del headers['Content-Type']
590
self.assertRaises(errors.InvalidHttpContentType,
591
response.handle_response, 'http://nocontent', a_response[0],
592
headers, StringIO(a_response[2]))
784
594
def test_missing_content_range(self):
785
code, raw_headers, body = _single_range_no_content_range
786
msg = self._build_HTTPMessage(raw_headers)
787
self.assertRaises(errors.InvalidHttpResponse,
788
response.handle_response,
789
'http://bogus', code, msg, StringIO(body))
791
def test_multipart_no_content_range(self):
    """handle_response must reject the _multipart_no_content_range fixture."""
    code, raw_headers, body = _multipart_no_content_range
    msg = self._build_HTTPMessage(raw_headers)
    self.assertRaises(errors.InvalidHttpResponse,
                      response.handle_response,
                      'http://bogus', code, msg, StringIO(body))
798
def test_multipart_no_boundary(self):
    """Seeking past a range not followed by a boundary line must fail."""
    out = self.get_response(_multipart_no_boundary)
    out.read()  # Read the whole range
    # Fail to find the boundary line
    self.assertRaises(errors.InvalidHttpResponse, out.seek, 1, 1)
805
class TestRangeFileSizeReadLimited(tests.TestCase):
806
"""Test RangeFile _max_read_size functionality which limits the size of
807
read blocks to prevent MemoryError messages in socket.recv.
811
super(TestRangeFileSizeReadLimited, self).setUp()
812
# create a test datablock larger than _max_read_size.
813
chunk_size = response.RangeFile._max_read_size
814
test_pattern = '0123456789ABCDEF'
815
self.test_data = test_pattern * (3 * chunk_size / len(test_pattern))
816
self.test_data_len = len(self.test_data)
818
def test_max_read_size(self):
819
"""Read data in blocks and verify that the reads are not larger than
820
the maximum read size.
822
# retrieve data in large blocks from response.RangeFile object
823
mock_read_file = FakeReadFile(self.test_data)
824
range_file = response.RangeFile('test_max_read_size', mock_read_file)
825
response_data = range_file.read(self.test_data_len)
827
# verify read size was equal to the maximum read size
828
self.assertTrue(mock_read_file.get_max_read_size() > 0)
829
self.assertEqual(mock_read_file.get_max_read_size(),
830
response.RangeFile._max_read_size)
831
self.assertEqual(mock_read_file.get_read_count(), 3)
833
# report error if the data wasn't equal (we only report the size due
834
# to the length of the data)
835
if response_data != self.test_data:
836
message = "Data not equal. Expected %d bytes, received %d."
837
self.fail(message % (len(response_data), self.test_data_len))
595
a_response = _single_range_response
596
headers = http._extract_headers(a_response[1], 'http://nocontent')
597
del headers['Content-Range']
598
self.assertRaises(errors.InvalidHttpResponse,
599
response.handle_response, 'http://nocontent', a_response[0],
600
headers, StringIO(a_response[2]))