~bzr-pqm/bzr/bzr.dev

5752.3.8 by John Arbash Meinel
Merge bzr.dev 5764 to resolve release-notes (aka NEWS) conflicts
1
# Copyright (C) 2006-2011 Canonical Ltd
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
4183.7.1 by Sabin Iacob
update FSF mailing address
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
16
2018.5.19 by Andrew Bennetts
Add docstrings to all the new modules, and a few other places.
17
"""The 'medium' layer for the smart servers and clients.
18
19
"Medium" here is the noun meaning "a means of transmission", not the adjective
20
for "the quality between big and small."
21
22
Media carry the bytes of the requests somehow (e.g. via TCP, wrapped in HTTP, or
23
over SSH), and pass them to and from the protocol logic.  See the overview in
24
bzrlib/transport/smart/__init__.py.
25
"""
26
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
27
import os
2018.5.162 by Andrew Bennetts
Add some missing _ensure_real calls, and a missing import.
28
import sys
3431.3.11 by Andrew Bennetts
Push remote_path_from_transport logic into SmartClientMedium, removing special-casing of bzr+http from _SmartClient.
29
import urllib
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
30
5222.2.9 by Robert Collins
Write up some doc about bzrlib.initialize.
31
import bzrlib
3530.1.1 by John Arbash Meinel
Make bzrlib.smart use lazy imports.
32
from bzrlib.lazy_import import lazy_import
33
lazy_import(globals(), """
5011.3.11 by Andrew Bennetts
Consolidate changes, try to minimise unnecessary changes and tidy up those that kept.
34
import socket
4913.1.1 by John Arbash Meinel
Switch to using thread.get_ident() which is available on all python versions.
35
import thread
3731.2.4 by Andrew Bennetts
Minor tweaks.
36
import weakref
4889.2.2 by John Arbash Meinel
Add a -Dhpssthread debug flag to include thread.ident info.
37
1551.18.17 by Aaron Bentley
Introduce bzr_remote_path configuration variable
38
from bzrlib import (
3731.2.1 by Andrew Bennetts
Show total HPSS calls (if any) on stderr when -Dhpss is active.
39
    debug,
1551.18.17 by Aaron Bentley
Introduce bzr_remote_path configuration variable
40
    errors,
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
41
    trace,
3958.1.1 by Andrew Bennetts
Report traffic on smart media as transport activity.
42
    ui,
3431.3.11 by Andrew Bennetts
Push remote_path_from_transport logic into SmartClientMedium, removing special-casing of bzr+http from _SmartClient.
43
    urlutils,
1551.18.17 by Aaron Bentley
Introduce bzr_remote_path configuration variable
44
    )
6138.3.4 by Jonathan Riddell
add gettext() to uses of trace.note()
45
from bzrlib.i18n import gettext
4326.2.1 by Jonathan Lange
Show the number of VFS calls in -Dhpss output.
46
from bzrlib.smart import client, protocol, request, vfs
3066.2.1 by John Arbash Meinel
We don't require paramiko for bzr+ssh.
47
from bzrlib.transport import ssh
3530.1.1 by John Arbash Meinel
Make bzrlib.smart use lazy imports.
48
""")
4332.3.17 by Robert Collins
Check revisions as we cross check the revision index, rather than in a separate pass.
49
from bzrlib import osutils
2018.5.17 by Andrew Bennetts
Paramaterise the commands handled by SmartServerRequestHandler.
50
5011.3.3 by Martin
Reintroduce EINTR handling only for socket object functions and general cleanup
51
# Throughout this module buffer size parameters are either limited to be at
5011.3.11 by Andrew Bennetts
Consolidate changes, try to minimise unnecessary changes and tidy up those that kept.
52
# most _MAX_READ_SIZE, or are ignored and _MAX_READ_SIZE is used instead.
53
# For this module's purposes, MAX_SOCKET_CHUNK is a reasonable size for reads
54
# from non-sockets as well.
55
_MAX_READ_SIZE = osutils.MAX_SOCKET_CHUNK
3565.1.3 by Andrew Bennetts
Define a _MAX_READ_SIZE constant as suggested by John's review.
56
3245.4.16 by Andrew Bennetts
Remove duplication of request version identification logic in wsgi.py
57
def _get_protocol_factory_for_bytes(bytes):
    """Pick the server protocol factory matching the start of a request.

    The protocol version is recognised by the marker that 'bytes' starts
    with.  'bytes' should contain at least one newline byte (i.e. be a whole
    line); otherwise a request may be wrongly identified as version 1.

    Typical use would be::

         factory, unused_bytes = _get_protocol_factory_for_bytes(bytes)
         server_protocol = factory(transport, write_func, root_client_path)
         server_protocol.accept_bytes(unused_bytes)

    :param bytes: a str of bytes of the start of the request.
    :returns: 2-tuple of (protocol_factory, unused_bytes).  protocol_factory is
        a callable that takes three args: transport, write_func,
        root_client_path.  unused_bytes are any bytes that were not part of a
        protocol version marker.
    """
    # Version three is checked first, then version two.
    v3_marker = protocol.MESSAGE_VERSION_THREE
    if bytes.startswith(v3_marker):
        return protocol.build_server_protocol_three, bytes[len(v3_marker):]
    v2_marker = protocol.REQUEST_VERSION_TWO
    if bytes.startswith(v2_marker):
        return protocol.SmartServerRequestProtocolTwo, bytes[len(v2_marker):]
    # No recognised marker: treat as version one and hand back every byte.
    return protocol.SmartServerRequestProtocolOne, bytes
87
88
3606.4.1 by Andrew Bennetts
Fix NotImplementedError when probing for smart protocol via HTTP.
89
def _get_line(read_bytes_func):
90
    """Read bytes using read_bytes_func until a newline byte.
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
91
3606.4.1 by Andrew Bennetts
Fix NotImplementedError when probing for smart protocol via HTTP.
92
    This isn't particularly efficient, so should only be used when the
93
    expected size of the line is quite short.
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
94
3606.4.1 by Andrew Bennetts
Fix NotImplementedError when probing for smart protocol via HTTP.
95
    :returns: a tuple of two strs: (line, excess)
96
    """
97
    newline_pos = -1
98
    bytes = ''
99
    while newline_pos == -1:
100
        new_bytes = read_bytes_func(1)
101
        bytes += new_bytes
102
        if new_bytes == '':
103
            # Ran out of bytes before receiving a complete line.
104
            return bytes, ''
105
        newline_pos = bytes.find('\n')
106
    line = bytes[:newline_pos+1]
107
    excess = bytes[newline_pos+1:]
108
    return line, excess
109
110
3565.1.1 by Andrew Bennetts
Read no more then 64k at a time in the smart protocol code.
111
class SmartMedium(object):
    """Common base for smart protocol media, client-side and server-side.

    One chunk of bytes that was read but not used can be handed back with
    _push_back; the next read_bytes call returns that chunk before anything
    new is read via _read_bytes.
    """

    def __init__(self):
        # None means nothing has been pushed back.  The empty string is never
        # stored here, because '' is what readers interpret as EOF.
        self._push_back_buffer = None

    def _push_back(self, bytes):
        """Give unused bytes back to the medium; they belong to the next
        request(s).

        The given bytes become the _push_back_buffer.  An empty string is
        ignored.

        :raises AssertionError: if a previous push-back is still pending.
        """
        pending = self._push_back_buffer
        if pending is not None:
            raise AssertionError(
                "_push_back called when self._push_back_buffer is %r"
                % (pending,))
        if bytes != '':
            self._push_back_buffer = bytes

    def _get_push_back_buffer(self):
        """Return the pushed-back bytes (or None) and clear the buffer.

        :raises AssertionError: if the buffer holds the empty string.
        """
        pending = self._push_back_buffer
        if pending == '':
            raise AssertionError(
                '%s._push_back_buffer should never be the empty string, '
                'which can be confused with EOF' % (self,))
        self._push_back_buffer = None
        return pending

    def read_bytes(self, desired_count):
        """Read some bytes from this medium.

        Pushed-back bytes, if any, are returned whole and first.  Otherwise
        the request is capped at _MAX_READ_SIZE and passed to _read_bytes.

        :returns: some bytes, possibly more or less than the number requested
            in 'desired_count' depending on the medium.
        """
        if self._push_back_buffer is None:
            capped_count = min(desired_count, _MAX_READ_SIZE)
            return self._read_bytes(capped_count)
        return self._get_push_back_buffer()

    def _read_bytes(self, count):
        """Do the actual read; must be provided by subclasses."""
        raise NotImplementedError(self._read_bytes)

    def _get_line(self):
        """Read bytes from this request's response until a newline byte.

        Bytes read beyond the newline are pushed back onto the medium.

        This isn't particularly efficient, so should only be used when the
        expected size of the line is quite short.

        :returns: a string of bytes ending in a newline (byte 0x0A).
        """
        first_line, leftover = _get_line(self.read_bytes)
        self._push_back(leftover)
        return first_line

    def _report_activity(self, bytes, direction):
        """Notify that this medium has activity.

        Implementations should call this from all methods that actually do IO.
        Be careful that it's not called twice, if one method is implemented on
        top of another.

        :param bytes: Number of bytes read or written.
        :param direction: 'read' or 'write' or None.
        """
        report = ui.ui_factory.report_transport_activity
        report(self, bytes, direction)
177
3565.1.1 by Andrew Bennetts
Read no more then 64k at a time in the smart protocol code.
178
179
class SmartServerStreamMedium(SmartMedium):
    """Handles smart commands coming over a stream.

    The stream may be a pipe connected to sshd, or a tcp socket, or an
    in-process fifo for testing.

    One instance is created for each connected client; it can serve multiple
    requests in the lifetime of the connection.

    The server passes requests through to an underlying backing transport,
    which will typically be a LocalTransport looking at the server's filesystem.

    This class calls self._serve_one_request_unguarded and self._write_out
    but does not define them; concrete subclasses are expected to supply
    both, along with _read_bytes and terminate_due_to_error.

    :ivar _push_back_buffer: a str of bytes that have been read from the stream
        but not used yet, or None if there are no buffered bytes.  Subclasses
        should make sure to exhaust this buffer before reading more bytes from
        the stream.  See also the _push_back method.
    """

    def __init__(self, backing_transport, root_client_path='/'):
        """Construct new server.

        :param backing_transport: Transport for the directory served.
        :param root_client_path: stored on the instance and handed to the
            protocol factory by _build_protocol.
        """
        # backing_transport could be passed to serve instead of __init__
        self.backing_transport = backing_transport
        self.root_client_path = root_client_path
        # Set to True by subclasses when the client disconnects or an error
        # terminates the connection; serve() loops until then.
        self.finished = False
        SmartMedium.__init__(self)

    def serve(self):
        """Serve requests until the client disconnects.

        Any exception escaping the loop is reported on stderr and re-raised.
        """
        # Keep a reference to stderr because the sys module's globals get set to
        # None during interpreter shutdown.
        from sys import stderr
        try:
            while not self.finished:
                server_protocol = self._build_protocol()
                self._serve_one_request(server_protocol)
        except Exception as e:
            stderr.write("%s terminating on exception %s\n" % (self, e))
            raise

    def _build_protocol(self):
        """Identifies the version of the incoming request, and returns a
        protocol object that can interpret it.

        If more bytes than the version prefix of the request are read, they will
        be fed into the protocol before it is returned.

        :returns: a SmartServerRequestProtocol.
        """
        bytes = self._get_line()
        protocol_factory, unused_bytes = _get_protocol_factory_for_bytes(bytes)
        protocol = protocol_factory(
            self.backing_transport, self._write_out, self.root_client_path)
        protocol.accept_bytes(unused_bytes)
        return protocol

    def _serve_one_request(self, protocol):
        """Read one request from input, process, send back a response.

        KeyboardInterrupt propagates; any other Exception is swallowed after
        calling terminate_due_to_error().

        :param protocol: a SmartServerRequestProtocol.
        """
        try:
            self._serve_one_request_unguarded(protocol)
        except KeyboardInterrupt:
            raise
        except Exception:
            self.terminate_due_to_error()

    def terminate_due_to_error(self):
        """Called when an unhandled exception from the protocol occurs."""
        raise NotImplementedError(self.terminate_due_to_error)

    def _read_bytes(self, desired_count):
        """Get some bytes from the medium.

        :param desired_count: number of bytes we want to read.
        """
        raise NotImplementedError(self._read_bytes)
2432.2.2 by Andrew Bennetts
Smart server mediums now detect which protocol version a request is and dispatch accordingly.
259
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
260
261
class SmartServerSocketStreamMedium(SmartServerStreamMedium):
    """Server-side stream medium whose requests arrive on a socket."""

    def __init__(self, sock, backing_transport, root_client_path='/'):
        """Constructor.

        :param sock: the socket the server will read from.  It will be put
            into blocking mode.
        :param backing_transport: passed to SmartServerStreamMedium.__init__.
        :param root_client_path: passed to SmartServerStreamMedium.__init__.
        """
        SmartServerStreamMedium.__init__(
            self, backing_transport, root_client_path=root_client_path)
        sock.setblocking(True)
        self.socket = sock

    def _serve_one_request_unguarded(self, protocol):
        """Feed socket data to 'protocol' until it wants no more bytes.

        An empty read marks the medium as finished and returns immediately.
        Otherwise, once the protocol is satisfied, its unused_data is pushed
        back for the next request.
        """
        while protocol.next_read_size():
            # We can safely try to read large chunks.  If there is less data
            # than MAX_SOCKET_CHUNK ready, the socket will just return a
            # short read immediately rather than block.
            chunk = self.read_bytes(osutils.MAX_SOCKET_CHUNK)
            if chunk != '':
                protocol.accept_bytes(chunk)
                continue
            self.finished = True
            return

        self._push_back(protocol.unused_data)

    def _read_bytes(self, desired_count):
        """Read from the socket; desired_count is not used here."""
        reader = osutils.read_bytes_from_socket
        return reader(self.socket, self._report_activity)

    def terminate_due_to_error(self):
        """Close the socket and mark this medium as finished."""
        # TODO: This should log to a server log file, but no such thing
        # exists yet.  Andrew Bennetts 2006-09-29.
        self.socket.close()
        self.finished = True

    def _write_out(self, bytes):
        """Send 'bytes' over the socket.

        When the 'hpss' debug flag is set, the byte count, thread id and
        elapsed time are written with trace.mutter.
        """
        started = osutils.timer_func()
        osutils.send_all(self.socket, bytes, self._report_activity)
        if 'hpss' not in debug.debug_flags:
            return
        writer_thread = thread.get_ident()
        trace.mutter('%12s: [%s] %d bytes to the socket in %.3fs'
                     % ('wrote', writer_thread, len(bytes),
                        osutils.timer_func() - started))
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
305
306
307
class SmartServerPipeStreamMedium(SmartServerStreamMedium):
    """Server-side stream medium reading from and writing to file objects."""

    def __init__(self, in_file, out_file, backing_transport):
        """Construct new server.

        :param in_file: Python file from which requests can be read.
        :param out_file: Python file to write responses.
        :param backing_transport: Transport for the directory served.
        """
        SmartServerStreamMedium.__init__(self, backing_transport)
        if sys.platform == 'win32':
            # force binary mode for files
            import msvcrt
            for stream in (in_file, out_file):
                get_descriptor = getattr(stream, 'fileno', None)
                if not get_descriptor:
                    # Object has no usable fileno; leave its mode alone.
                    continue
                msvcrt.setmode(get_descriptor(), os.O_BINARY)
        self._in = in_file
        self._out = out_file

    def _serve_one_request_unguarded(self, protocol):
        """Feed input to 'protocol' until the request is complete or EOF.

        The output file is flushed before returning in either case.  On EOF
        the medium is also marked as finished.
        """
        # We need to be careful not to read past the end of the current
        # request, or else the read from the pipe will block, so we use
        # protocol.next_read_size().
        wanted = protocol.next_read_size()
        while wanted != 0:
            chunk = self.read_bytes(wanted)
            if chunk == '':
                # Connection has been closed.
                self.finished = True
                break
            protocol.accept_bytes(chunk)
            wanted = protocol.next_read_size()
        # Reached both when the request has been served and on EOF.
        self._out.flush()

    def _read_bytes(self, desired_count):
        """Read up to desired_count bytes from the input file."""
        source = self._in
        return source.read(desired_count)

    def terminate_due_to_error(self):
        """Close the output file and mark this medium as finished."""
        # TODO: This should log to a server log file, but no such thing
        # exists yet.  Andrew Bennetts 2006-09-29.
        self._out.close()
        self.finished = True

    def _write_out(self, bytes):
        """Write 'bytes' to the output file (without flushing)."""
        sink = self._out
        sink.write(bytes)
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
356
357
3565.1.2 by Andrew Bennetts
Delete some more code, fix some bugs, add more comments.
358
class SmartClientMediumRequest(object):
    """A request on a SmartClientMedium.

    Bytes are supplied to a request via accept_bytes, after which the
    response bytes are fetched via read_bytes.

    For instance:
    request.accept_bytes('123')
    request.finished_writing()
    result = request.read_bytes(3)
    request.finished_reading()

    It is up to the individual SmartClientMedium whether multiple concurrent
    requests can exist. See SmartClientMedium.get_request to obtain instances
    of SmartClientMediumRequest, and the concrete Medium you are using for
    details on concurrency and pipelining.
    """

    def __init__(self, medium):
        """Construct a SmartClientMediumRequest for the medium medium."""
        self._medium = medium
        # we track state by constants - we may want to use the same
        # pattern as BodyReader if it gets more complex.
        # valid states are: "writing", "reading", "done"
        self._state = "writing"

    def _require_reading_state(self):
        """Raise unless this request is currently in the "reading" state.

        :raises errors.WritingNotComplete: while still in "writing".
        :raises errors.ReadingCompleted: in any other non-"reading" state.
        """
        current = self._state
        if current == "writing":
            raise errors.WritingNotComplete(self)
        if current != "reading":
            raise errors.ReadingCompleted(self)

    def accept_bytes(self, bytes):
        """Accept bytes for inclusion in this request.

        This method may not be called after finished_writing() has been
        called.  It depends upon the Medium whether or not the bytes will be
        immediately transmitted. Message based Mediums will tend to buffer the
        bytes until finished_writing() is called.

        :param bytes: A bytestring.
        :raises errors.WritingCompleted: if the request is no longer in the
            "writing" state.
        """
        if self._state == "writing":
            self._accept_bytes(bytes)
            return
        raise errors.WritingCompleted(self)

    def _accept_bytes(self, bytes):
        """Helper for accept_bytes.

        accept_bytes checks the state of the request to determine if bytes
        should be accepted. After that it hands off to _accept_bytes to do the
        actual acceptance.
        """
        raise NotImplementedError(self._accept_bytes)

    def finished_reading(self):
        """Inform the request that all desired data has been read.

        This will remove the request from the pipeline for its medium (if the
        medium supports pipelining) and any further calls to methods on the
        request will raise ReadingCompleted.
        """
        self._require_reading_state()
        self._state = "done"
        self._finished_reading()

    def _finished_reading(self):
        """Helper for finished_reading.

        finished_reading checks the state of the request to determine if
        finished_reading is allowed, and if it is hands off to _finished_reading
        to perform the action.
        """
        raise NotImplementedError(self._finished_reading)

    def finished_writing(self):
        """Finish the writing phase of this request.

        This will flush all pending data for this request along the medium.
        After calling finished_writing, you may not call accept_bytes anymore.

        :raises errors.WritingCompleted: if the request is not in the
            "writing" state.
        """
        if self._state == "writing":
            self._state = "reading"
            self._finished_writing()
            return
        raise errors.WritingCompleted(self)

    def _finished_writing(self):
        """Helper for finished_writing.

        finished_writing checks the state of the request to determine if
        finished_writing is allowed, and if it is hands off to _finished_writing
        to perform the action.
        """
        raise NotImplementedError(self._finished_writing)

    def read_bytes(self, count):
        """Read bytes from this request's response.

        This method will block and wait for count bytes to be read. It may not
        be invoked until finished_writing() has been called - this is to ensure
        a message-based approach to requests, for compatibility with message
        based mediums like HTTP.
        """
        self._require_reading_state()
        return self._read_bytes(count)

    def _read_bytes(self, count):
        """Helper for SmartClientMediumRequest.read_bytes.

        read_bytes checks the state of the request to determine if bytes
        should be read. After that it hands off to _read_bytes to do the
        actual read.

        By default this forwards to self._medium.read_bytes because we are
        operating on the medium's stream.
        """
        medium = self._medium
        return medium.read_bytes(count)

    def read_line(self):
        """Read one line of the response.

        :returns: the line, which ends in a newline.
        :raises errors.ConnectionReset: if the line read does not end in a
            newline.
        """
        line = self._read_line()
        if line.endswith('\n'):
            return line
        # end of file encountered reading from server
        raise errors.ConnectionReset(
            "Unexpected end of message. Please check connectivity "
            "and permissions, and report a bug if problems persist.")

    def _read_line(self):
        """Helper for SmartClientMediumRequest.read_line.

        By default this forwards to self._medium._get_line because we are
        operating on the medium's stream.
        """
        medium = self._medium
        return medium._get_line()
492
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
493
6060.7.1 by Jelmer Vernooij
Add vfs refuser.
494
class _VfsRefuser(object):
    """Hook object that refuses every VFS request.

    Creating an instance installs check_vfs on client._SmartClient.hooks as
    a 'call' hook named 'vfs refuser'.
    """

    def __init__(self):
        hooks = client._SmartClient.hooks
        hooks.install_named_hook('call', self.check_vfs, 'vfs refuser')

    def check_vfs(self, params):
        """Raise if params names a method handled by a VfsRequest subclass.

        :param params: The hook parameters; the method and args attributes
            are read.
        :raises errors.HpssVfsRequestNotAllowed: if the handler registered
            for params.method is a subclass of vfs.VfsRequest.
        """
        try:
            handler = request.request_handlers.get(params.method)
        except KeyError:
            # A method we don't know about doesn't count as a VFS method.
            return
        if not issubclass(handler, vfs.VfsRequest):
            return
        raise errors.HpssVfsRequestNotAllowed(params.method, params.args)
6060.7.1 by Jelmer Vernooij
Add vfs refuser.
511
512
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
513
class _DebugCounter(object):
514
    """An object that counts the HPSS calls made to each client medium.
515
5222.2.9 by Robert Collins
Write up some doc about bzrlib.initialize.
516
    When a medium is garbage-collected, or failing that when
517
    bzrlib.global_state exits, the total number of calls made on that medium
518
    are reported via trace.note.
3731.2.1 by Andrew Bennetts
Show total HPSS calls (if any) on stderr when -Dhpss is active.
519
    """
520
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
521
    def __init__(self):
522
        self.counts = weakref.WeakKeyDictionary()
523
        client._SmartClient.hooks.install_named_hook(
524
            'call', self.increment_call_count, 'hpss call counter')
5310.1.1 by Vincent Ladeuil
Fix typo but we may want to use addCleanup instead indeed.
525
        bzrlib.global_state.cleanups.add_cleanup(self.flush_all)
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
526
527
    def track(self, medium):
528
        """Start tracking calls made to a medium.
529
530
        This only keeps a weakref to the medium, so shouldn't affect the
531
        medium's lifetime.
532
        """
533
        medium_repr = repr(medium)
534
        # Add this medium to the WeakKeyDictionary
4326.2.3 by Jonathan Lange
Use as a dict.
535
        self.counts[medium] = dict(count=0, vfs_count=0,
536
                                   medium_repr=medium_repr)
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
537
        # Weakref callbacks are fired in reverse order of their association
538
        # with the referenced object.  So we add a weakref *after* adding to
539
        # the WeakKeyDict so that we can report the value from it before the
540
        # entry is removed by the WeakKeyDict's own callback.
541
        ref = weakref.ref(medium, self.done)
542
543
    def increment_call_count(self, params):
544
        # Increment the count in the WeakKeyDictionary
545
        value = self.counts[params.medium]
4326.2.3 by Jonathan Lange
Use as a dict.
546
        value['count'] += 1
4476.3.15 by Andrew Bennetts
Partially working fallback for pre-1.17 servers.
547
        try:
548
            request_method = request.request_handlers.get(params.method)
549
        except KeyError:
4547.3.1 by Andrew Bennetts
Fix minor bug in -Dhpss that would cause a KeyError when issuing a request for a method not registered in request_handlers.
550
            # A method we don't know about doesn't count as a VFS method.
4476.3.15 by Andrew Bennetts
Partially working fallback for pre-1.17 servers.
551
            return
4326.2.1 by Jonathan Lange
Show the number of VFS calls in -Dhpss output.
552
        if issubclass(request_method, vfs.VfsRequest):
4326.2.3 by Jonathan Lange
Use as a dict.
553
            value['vfs_count'] += 1
3731.2.1 by Andrew Bennetts
Show total HPSS calls (if any) on stderr when -Dhpss is active.
554
555
    def done(self, ref):
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
556
        value = self.counts[ref]
4326.2.3 by Jonathan Lange
Use as a dict.
557
        count, vfs_count, medium_repr = (
558
            value['count'], value['vfs_count'], value['medium_repr'])
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
559
        # In case this callback is invoked for the same ref twice (by the
560
        # weakref callback and by the atexit function), set the call count back
561
        # to 0 so this item won't be reported twice.
4326.2.3 by Jonathan Lange
Use as a dict.
562
        value['count'] = 0
563
        value['vfs_count'] = 0
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
564
        if count != 0:
6138.3.4 by Jonathan Riddell
add gettext() to uses of trace.note()
565
            trace.note(gettext('HPSS calls: {0} ({1} vfs) {2}').format(
566
                       count, vfs_count, medium_repr))
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
567
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
568
    def flush_all(self):
569
        for ref in list(self.counts.keys()):
570
            self.done(ref)
571
572
# Lazily-created module singletons.  SmartClientMedium.__init__ instantiates
# them the first time it sees the matching flag in debug.debug_flags:
# 'hpss' for _debug_counter, 'hpss_client_no_vfs' for _vfs_refuser.
_debug_counter = None
_vfs_refuser = None
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
574
575
3565.1.1 by Andrew Bennetts
Read no more then 64k at a time in the smart protocol code.
576
class SmartClientMedium(SmartMedium):
    """Smart client is a medium for sending smart protocol requests over."""

    def __init__(self, base):
        """Create a client medium.

        :param base: Stored as self.base; remote_path_from_transport makes
            transport URLs relative to the root of this URL.
        """
        global _debug_counter, _vfs_refuser
        super(SmartClientMedium, self).__init__()
        self.base = base
        self._protocol_version_error = None
        self._protocol_version = None
        self._done_hello = False
        # Be optimistic: we assume the remote end can accept new remote
        # requests until we get an error saying otherwise.
        # _remote_version_is_before tracks the bzr version the remote side
        # can be based on what we've seen so far.
        self._remote_version_is_before = None
        # Install debug hook function if debug flag is set.
        if 'hpss' in debug.debug_flags:
            if _debug_counter is None:
                _debug_counter = _DebugCounter()
            _debug_counter.track(self)
        if 'hpss_client_no_vfs' in debug.debug_flags:
            if _vfs_refuser is None:
                _vfs_refuser = _VfsRefuser()

    def _is_remote_before(self, version_tuple):
        """Is it possible the remote side supports RPCs for a given version?

        Typical use::

            needed_version = (1, 2)
            if medium._is_remote_before(needed_version):
                fallback_to_pre_1_2_rpc()
            else:
                try:
                    do_1_2_rpc()
                except UnknownSmartMethod:
                    medium._remember_remote_is_before(needed_version)
                    fallback_to_pre_1_2_rpc()

        :param version_tuple: The version that introduced the RPC.
        :return: True if the remote side is already known to be older than
            version_tuple, False otherwise.
        :seealso: _remember_remote_is_before
        """
        if self._remote_version_is_before is None:
            # So far, the remote side seems to support everything
            return False
        return version_tuple >= self._remote_version_is_before

    def _remember_remote_is_before(self, version_tuple):
        """Tell this medium that the remote side is older than the given
        version.

        If a lower version was already recorded, the call is logged (and a
        warning shown when the 'hpss' debug flag is set) and the recorded
        version is left unchanged.

        :seealso: _is_remote_before
        """
        if (self._remote_version_is_before is not None and
            version_tuple > self._remote_version_is_before):
            # We have been told that the remote side is older than some version
            # which is newer than a previously supplied older-than version.
            # This indicates that some smart verb call is not guarded
            # appropriately (it should simply not have been tried).
            trace.mutter(
                "_remember_remote_is_before(%r) called, but "
                "_remember_remote_is_before(%r) was called previously."
                , version_tuple, self._remote_version_is_before)
            if 'hpss' in debug.debug_flags:
                ui.ui_factory.show_warning(
                    "_remember_remote_is_before(%r) called, but "
                    "_remember_remote_is_before(%r) was called previously."
                    % (version_tuple, self._remote_version_is_before))
            return
        self._remote_version_is_before = version_tuple

    def protocol_version(self):
        """Find out if 'hello' smart request works.

        The 'hello' request is not sent again once it has succeeded.  A
        SmartProtocolError raised by it is cached and raised again by every
        later call.

        :return: '2'
        :raises errors.SmartProtocolError: if the 'hello' request failed
            with that error, now or on an earlier call.
        """
        if self._protocol_version_error is not None:
            raise self._protocol_version_error
        if not self._done_hello:
            try:
                medium_request = self.get_request()
                # Send a 'hello' request in protocol version one, for maximum
                # backwards compatibility.
                client_protocol = protocol.SmartClientRequestProtocolOne(
                    medium_request)
                client_protocol.query_version()
                self._done_hello = True
            except errors.SmartProtocolError as e:
                # Cache the error, just like we would cache a successful
                # result.
                self._protocol_version_error = e
                raise
        return '2'

    def should_probe(self):
        """Should RemoteBzrDirFormat.probe_transport send a smart request on
        this medium?

        Some transports are unambiguously smart-only; there's no need to check
        if the transport is able to carry smart requests, because that's all
        it is for.  In those cases, this method should return False.

        But some HTTP transports can sometimes fail to carry smart requests,
        but still be usable for accessing remote bzrdirs via plain file
        accesses.  So for those transports, their media should return True here
        so that RemoteBzrDirFormat can determine if it is appropriate for that
        transport.
        """
        return False

    def disconnect(self):
        """If this medium maintains a persistent connection, close it.

        The default implementation does nothing.
        """

    def remote_path_from_transport(self, transport):
        """Convert transport into a path suitable for using in a request.

        Note that the resulting remote path doesn't encode the host name or
        anything but path, so it is only safe to use it in requests sent over
        the medium from the matching transport.

        :param transport: A transport; only its base attribute is read.
        :return: transport.base relative to the root of self.base, with URL
            quoting removed.
        """
        medium_base = urlutils.join(self.base, '/')
        rel_url = urlutils.relative_url(medium_base, transport.base)
        return urllib.unquote(rel_url)
697
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
698
699
class SmartClientStreamMedium(SmartClientMedium):
    """Common base class for stream based media.

    A SmartClientStreamMedium operates on a stream.  Every subclass shares
    SmartClientStreamMediumRequest as its request type, and is expected to
    provide _accept_bytes and _read_bytes so that those request objects can
    send and receive bytes.
    """

    def __init__(self, base):
        SmartClientMedium.__init__(self, base)
        self._current_request = None

    def __del__(self):
        """Close the stream once this medium is finished with.

        The SmartClientStreamMedium knows how to do that: it calls
        disconnect().
        """
        self.disconnect()

    def get_request(self):
        """See SmartClientMedium.get_request().

        For a SmartClientStreamMedium the request is always a
        SmartClientStreamMediumRequest.
        """
        medium_request = SmartClientStreamMediumRequest(self)
        return medium_request

    def accept_bytes(self, bytes):
        """Hand bytes to the subclass's _accept_bytes."""
        self._accept_bytes(bytes)

    def _flush(self):
        """Flush the output stream.

        SmartClientStreamMediumRequest uses this to make sure that all data
        for a request is sent, to avoid long timeouts or deadlocks.  This
        base implementation always raises NotImplementedError.
        """
        raise NotImplementedError(self._flush)
736
737
738
class SmartSimplePipesClientMedium(SmartClientStreamMedium):
    """A client medium that talks over a pair of simple pipes.

    The pipes are not managed by this client: it assumes they will always
    be open.
    """

    def __init__(self, readable_pipe, writeable_pipe, base):
        SmartClientStreamMedium.__init__(self, base)
        self._writeable_pipe = writeable_pipe
        self._readable_pipe = readable_pipe

    def _read_bytes(self, count):
        """See SmartClientStreamMedium._read_bytes.

        At most _MAX_READ_SIZE bytes are requested from the pipe per call.
        """
        chunk = self._readable_pipe.read(min(count, _MAX_READ_SIZE))
        self._report_activity(len(chunk), 'read')
        return chunk

    def _accept_bytes(self, bytes):
        """See SmartClientStreamMedium.accept_bytes."""
        pipe = self._writeable_pipe
        pipe.write(bytes)
        self._report_activity(len(bytes), 'write')

    def _flush(self):
        """See SmartClientStreamMedium._flush()."""
        pipe = self._writeable_pipe
        pipe.flush()
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
764
765
5284.5.1 by Andrew Bennetts
Use socketpairs (rather than pipes) for SSH subprocesses where possible, and formalise some internal APIs a little more.
766
class SSHParams(object):
    """A set of parameters for starting a remote bzr via SSH.

    Every constructor argument is stored unchanged as an attribute of the
    same name.
    """

    def __init__(self, host, port=None, username=None, password=None,
                 bzr_remote_path='bzr'):
        # Where to connect.
        self.host, self.port = host, port
        # Who to connect as.
        self.username, self.password = username, password
        # The bzr executable to run on the remote side.
        self.bzr_remote_path = bzr_remote_path
776
777
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
778
class SmartSSHClientMedium(SmartClientStreamMedium):
    """A client medium using SSH.

    It delegates IO to a SmartSimplePipesClientMedium or
    SmartClientAlreadyConnectedSocketMedium (depending on what the SSH
    connection's get_sock_or_pipes() reports).
    """

    def __init__(self, base, ssh_params, vendor=None):
        """Creates a client that will connect on the first use.

        :param base: Passed on to SmartClientStreamMedium.__init__.
        :param ssh_params: A SSHParams instance.
        :param vendor: An optional override for the ssh vendor to use. See
            bzrlib.transport.ssh for details on ssh vendors.
        """
        # Every attribute read by __repr__ or disconnect() is set before the
        # base-class init runs: SmartClientStreamMedium stores the repr of
        # this object in its _DebugCounter, and __del__ calls disconnect()
        # even when the base-class init raised.
        self._real_medium = None
        self._ssh_connection = None
        self._ssh_params = ssh_params
        self._vendor = vendor
        # for the benefit of progress making a short description of this
        # transport
        self._scheme = 'bzr+ssh'
        SmartClientStreamMedium.__init__(self, base)

    def __repr__(self):
        params = self._ssh_params
        # Leave out the parts that were not given, rather than rendering
        # them as the text 'None'.
        if params.username is None:
            maybe_user = ''
        else:
            maybe_user = '%s@' % params.username
        if params.port is None:
            maybe_port = ''
        else:
            maybe_port = ':%s' % params.port
        return "%s(%s://%s%s%s/)" % (
            self.__class__.__name__,
            self._scheme,
            maybe_user,
            params.host,
            maybe_port)

    def _accept_bytes(self, bytes):
        """See SmartClientStreamMedium.accept_bytes."""
        self._ensure_connection()
        self._real_medium.accept_bytes(bytes)

    def disconnect(self):
        """See SmartClientMedium.disconnect()."""
        if self._real_medium is not None:
            self._real_medium.disconnect()
            self._real_medium = None
        if self._ssh_connection is not None:
            self._ssh_connection.close()
            self._ssh_connection = None

    def _ensure_connection(self):
        """Connect this medium if not already connected.

        Starts 'bzr serve --inet' on the remote side through the ssh vendor
        and wraps the resulting socket or pipes in the medium that the IO is
        delegated to.

        :raises AssertionError: if the connection reports an IO kind other
            than 'socket' or 'pipes'.
        """
        if self._real_medium is not None:
            return
        if self._vendor is None:
            vendor = ssh._get_ssh_vendor()
        else:
            vendor = self._vendor
        self._ssh_connection = vendor.connect_ssh(self._ssh_params.username,
                self._ssh_params.password, self._ssh_params.host,
                self._ssh_params.port,
                command=[self._ssh_params.bzr_remote_path, 'serve', '--inet',
                         '--directory=/', '--allow-writes'])
        io_kind, io_object = self._ssh_connection.get_sock_or_pipes()
        if io_kind == 'socket':
            self._real_medium = SmartClientAlreadyConnectedSocketMedium(
                self.base, io_object)
        elif io_kind == 'pipes':
            read_from, write_to = io_object
            self._real_medium = SmartSimplePipesClientMedium(
                read_from, write_to, self.base)
        else:
            raise AssertionError(
                "Unexpected io_kind %r from %r"
                % (io_kind, self._ssh_connection))

    def _flush(self):
        """See SmartClientStreamMedium._flush()."""
        self._real_medium._flush()

    def _read_bytes(self, count):
        """See SmartClientStreamMedium.read_bytes.

        :raises errors.MediumNotConnected: if no connection has been made.
        """
        if self._real_medium is None:
            raise errors.MediumNotConnected(self)
        return self._real_medium.read_bytes(count)
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
865
866
3004.2.1 by Vincent Ladeuil
Fix 150860 by leaving port as user specified it.
867
# NOTE(review): presumably None means "no specific interface"; this part of
# the file does not use the value, so confirm against its consumers.
BZR_DEFAULT_INTERFACE = None
# Port 4155 is the default port for bzr://, registered with IANA.
BZR_DEFAULT_PORT = 4155
870
871
5284.5.1 by Andrew Bennetts
Use socketpairs (rather than pipes) for SSH subprocesses where possible, and formalise some internal APIs a little more.
872
class SmartClientSocketMedium(SmartClientStreamMedium):
    """A client medium that talks over a socket.

    This class isn't usable directly.  Use one of its subclasses instead;
    they have to supply _ensure_connection.
    """

    def __init__(self, base):
        SmartClientStreamMedium.__init__(self, base)
        self._connected = False
        self._socket = None

    def _ensure_connection(self):
        """Connect this medium if not already connected."""
        raise NotImplementedError(self._ensure_connection)

    def _accept_bytes(self, bytes):
        """See SmartClientMedium.accept_bytes."""
        self._ensure_connection()
        sock = self._socket
        osutils.send_all(sock, bytes, self._report_activity)

    def _read_bytes(self, count):
        """See SmartClientMedium.read_bytes.

        count is not passed on to osutils.read_bytes_from_socket.
        """
        if self._connected:
            return osutils.read_bytes_from_socket(
                self._socket, self._report_activity)
        raise errors.MediumNotConnected(self)

    def _flush(self):
        """See SmartClientStreamMedium._flush().

        Nothing is flushed for sockets.  For TCP sockets we may want to turn
        off TCP_NODELAY and add a means to do a flush, but that can be done
        in the future.
        """

    def disconnect(self):
        """See SmartClientMedium.disconnect()."""
        if self._connected:
            self._socket.close()
            self._socket = None
            self._connected = False
914
5284.5.1 by Andrew Bennetts
Use socketpairs (rather than pipes) for SSH subprocesses where possible, and formalise some internal APIs a little more.
915
916
class SmartTCPClientMedium(SmartClientSocketMedium):
5284.5.6 by Andrew Bennetts
Tweaks prompted by Robert's review.
917
    """A client medium that creates a TCP connection."""
5284.5.1 by Andrew Bennetts
Use socketpairs (rather than pipes) for SSH subprocesses where possible, and formalise some internal APIs a little more.
918
919
    def __init__(self, host, port, base):
920
        """Creates a client that will connect on the first use."""
921
        SmartClientSocketMedium.__init__(self, base)
922
        self._host = host
923
        self._port = port
924
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
925
    def _ensure_connection(self):
926
        """Connect this medium if not already connected."""
927
        if self._connected:
928
            return
3004.2.1 by Vincent Ladeuil
Fix 150860 by leaving port as user specified it.
929
        if self._port is None:
930
            port = BZR_DEFAULT_PORT
931
        else:
932
            port = int(self._port)
3711.2.2 by Jelmer Vernooij
Avoid using AI_ADDRCONFIG since it's not portable.
933
        try:
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
934
            sockaddrs = socket.getaddrinfo(self._host, port, socket.AF_UNSPEC,
3711.2.2 by Jelmer Vernooij
Avoid using AI_ADDRCONFIG since it's not portable.
935
                socket.SOCK_STREAM, 0, 0)
936
        except socket.gaierror, (err_num, err_msg):
937
            raise errors.ConnectionError("failed to lookup %s:%d: %s" %
938
                    (self._host, port, err_msg))
3711.2.3 by Jelmer Vernooij
Add comment.
939
        # Initialize err in case there are no addresses returned:
3665.4.2 by Jelmer Vernooij
Fall through to next available address if previous fails.
940
        err = socket.error("no address found for %s" % self._host)
3665.4.1 by Jelmer Vernooij
Support IPv6 in the smart server.
941
        for (family, socktype, proto, canonname, sockaddr) in sockaddrs:
942
            try:
3665.4.2 by Jelmer Vernooij
Fall through to next available address if previous fails.
943
                self._socket = socket.socket(family, socktype, proto)
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
944
                self._socket.setsockopt(socket.IPPROTO_TCP,
3665.4.2 by Jelmer Vernooij
Fall through to next available address if previous fails.
945
                                        socket.TCP_NODELAY, 1)
3665.4.1 by Jelmer Vernooij
Support IPv6 in the smart server.
946
                self._socket.connect(sockaddr)
947
            except socket.error, err:
3665.4.2 by Jelmer Vernooij
Fall through to next available address if previous fails.
948
                if self._socket is not None:
949
                    self._socket.close()
950
                self._socket = None
951
                continue
952
            break
953
        if self._socket is None:
954
            # socket errors either have a (string) or (errno, string) as their
955
            # args.
956
            if type(err.args) is str:
957
                err_msg = err.args
958
            else:
959
                err_msg = err.args[1]
960
            raise errors.ConnectionError("failed to connect to %s:%d: %s" %
961
                    (self._host, port, err_msg))
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
962
        self._connected = True
963
5284.5.1 by Andrew Bennetts
Use socketpairs (rather than pipes) for SSH subprocesses where possible, and formalise some internal APIs a little more.
964
965
class SmartClientAlreadyConnectedSocketMedium(SmartClientSocketMedium):
    """A client medium wrapping a socket that is already connected.

    This class assumes it "owns" the socket it is given, so the socket is
    closed when the medium's disconnect method is called.
    """

    def __init__(self, base, sock):
        """Wrap sock, an already connected socket, as a medium for base."""
        SmartClientSocketMedium.__init__(self, base)
        self._connected = True
        self._socket = sock

    def _ensure_connection(self):
        """Do nothing: the medium is connected from construction."""
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
980
981
982
class SmartClientStreamMediumRequest(SmartClientMediumRequest):
983
    """A SmartClientMediumRequest that works with a SmartClientStreamMedium."""
984
985
    def __init__(self, medium):
        """Create a request on medium and register it as the current one.

        :raises errors.TooManyConcurrentRequests: if the medium already has
            a current request.
        """
        SmartClientMediumRequest.__init__(self, medium)
        # Concurrency safety check.  If some streams start allowing
        # concurrent requests (e.g. via multiplexing) this check, and the
        # setting/unsetting of _current_request, should move to
        # SmartClientStreamMedium.get_request; for now that would be
        # unneeded overhead. RBC 20060922
        stream_medium = self._medium
        if stream_medium._current_request is None:
            stream_medium._current_request = self
        else:
            raise errors.TooManyConcurrentRequests(stream_medium)
995
996
    def _accept_bytes(self, bytes):
        """See SmartClientMediumRequest._accept_bytes.

        The bytes are handed straight to self._medium._accept_bytes, because
        this request operates on the medium's stream.
        """
        stream_medium = self._medium
        stream_medium._accept_bytes(bytes)
1003
1004
    def _finished_reading(self):
        """See SmartClientMediumRequest._finished_reading.

        Resets _current_request on self._medium so that a new request can be
        created.

        :raises AssertionError: if this request is not the medium's current
            request.
        """
        if self._medium._current_request is self:
            self._medium._current_request = None
        else:
            raise AssertionError()
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
1013
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
1014
    def _finished_writing(self):
        """See SmartClientMediumRequest._finished_writing.

        Calls self._medium._flush so that all bytes are transmitted.
        """
        flush = self._medium._flush
        flush()
1020
4382.4.2 by Andrew Bennetts
Refactor duplicated SmartServerSocketStreamMedium._read_bytes and SmartTCPClientMedium._read_bytes to share a common implementation with the best parts of both. Includes Robert's review feedback.
1021