1
# Copyright (C) 2006, 2007 Canonical Ltd
1
# Copyright (C) 2006-2011 Canonical Ltd
3
3
# This program is free software; you can redistribute it and/or modify
4
4
# it under the terms of the GNU General Public License as published by
24
from __future__ import absolute_import
26
28
from cStringIO import StringIO
29
31
from bzrlib import (
37
class ResponseFile(object):
38
"""A wrapper around the http socket containing the result of a GET request.
40
Only read() and seek() (forward) are supported.
43
def __init__(self, path, infile):
46
:param path: File url, for error reports.
48
:param infile: File-like socket set at body start.
57
Dummy implementation for consistency with the 'file' API.
60
def read(self, size=-1):
61
"""Read size bytes from the current position in the file.
63
:param size: The number of bytes to read. Leave unspecified or pass
66
data = self._file.read(size)
67
self._pos += len(data)
71
data = self._file.readline()
72
self._pos += len(data)
77
line = self.readline()
85
def seek(self, offset, whence=os.SEEK_SET):
86
if whence == os.SEEK_SET:
87
if offset < self._pos:
89
"Can't seek backwards, pos: %s, offset: %s"
90
% (self._pos, offset))
91
to_discard = offset - self._pos
92
elif whence == os.SEEK_CUR:
95
raise AssertionError("Can't seek backwards")
97
# Just discard the unwanted bytes
36
100
# A RangeFile expects the following grammar (simplified to outline the
37
101
# assumptions we rely upon).
41
104
# | multiple_range
43
# whole_file: [content_length_header] data
45
106
# single_range: content_range_header data
47
108
# multiple_range: boundary_header boundary (content_range_header data boundary)+
49
class RangeFile(object):
110
class RangeFile(ResponseFile):
50
111
"""File-like object that allows access to partially available data.
52
113
All accesses should happen sequentially since the acquisition occurs during
73
134
:param path: File url, for error reports.
74
136
:param infile: File-like socket set at body start.
138
super(RangeFile, self).__init__(path, infile)
78
139
self._boundary = None
79
140
# When using multi parts response, this will be set with the headers
80
141
# associated with the range currently read.
109
170
# To be on the safe side we allow it before any boundary line
110
171
boundary_line = self._file.readline()
173
if boundary_line == '':
174
# A timeout in the proxy server caused the response to end early.
175
# See launchpad bug 198646.
176
raise errors.HttpBoundaryMissing(
112
180
if boundary_line != '--' + self._boundary + '\r\n':
113
181
# rfc822.unquote() incorrectly unquotes strings enclosed in <>
114
182
# IIS 6 and 7 incorrectly wrap boundary strings in <>
221
289
% (size, self._start, self._size))
223
291
# read data from file
226
294
if self._size > 0:
227
295
# Don't read past the range definition
228
296
limited = self._start + self._size - self._pos
230
298
limited = min(limited, size)
231
osutils.pumpfile(self._file, buffer, limited, self._max_read_size)
232
data = buffer.getvalue()
299
osutils.pumpfile(self._file, buf, limited, self._max_read_size)
300
data = buf.getvalue()
234
302
# Update _pos respecting the data effectively read
235
303
self._pos += len(data)
291
359
:return: A file-like object that can seek()+read() the
292
360
ranges indicated by the headers.
294
rfile = RangeFile(url, data)
297
size = msg.getheader('content-length', None)
302
rfile.set_range(0, size)
364
rfile = ResponseFile(url, data)
303
365
elif code == 206:
366
rfile = RangeFile(url, data)
304
367
content_type = msg.getheader('content-type', None)
305
368
if content_type is None:
306
369
# When there is no content-type header we treat the response as