~bzr-pqm/bzr/bzr.dev

4763.2.4 by John Arbash Meinel
merge bzr.2.1 in preparation for NEWS entry.
1
# Copyright (C) 2006-2010 Canonical Ltd
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
4183.7.1 by Sabin Iacob
update FSF mailing address
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
16
2018.5.19 by Andrew Bennetts
Add docstrings to all the new modules, and a few other places.
17
"""The 'medium' layer for the smart servers and clients.
18
19
"Medium" here is the noun meaning "a means of transmission", not the adjective
20
for "the quality between big and small."
21
22
Media carry the bytes of the requests somehow (e.g. via TCP, wrapped in HTTP, or
23
over SSH), and pass them to and from the protocol logic.  See the overview in
24
bzrlib/transport/smart/__init__.py.
25
"""
26
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
27
import os
2018.5.162 by Andrew Bennetts
Add some missing _ensure_real calls, and a missing import.
28
import sys
3431.3.11 by Andrew Bennetts
Push remote_path_from_transport logic into SmartClientMedium, removing special-casing of bzr+http from _SmartClient.
29
import urllib
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
30
3530.1.1 by John Arbash Meinel
Make bzrlib.smart use lazy imports.
31
from bzrlib.lazy_import import lazy_import
32
lazy_import(globals(), """
3731.2.4 by Andrew Bennetts
Minor tweaks.
33
import atexit
5011.3.11 by Andrew Bennetts
Consolidate changes, try to minimise unnecessary changes and tidy up those that kept.
34
import socket
4913.1.1 by John Arbash Meinel
Switch to using thread.get_ident() which is available on all python versions.
35
import thread
3731.2.4 by Andrew Bennetts
Minor tweaks.
36
import weakref
4889.2.2 by John Arbash Meinel
Add a -Dhpssthread debug flag to include thread.ident info.
37
1551.18.17 by Aaron Bentley
Introduce bzr_remote_path configuration variable
38
from bzrlib import (
3731.2.1 by Andrew Bennetts
Show total HPSS calls (if any) on stderr when -Dhpss is active.
39
    debug,
1551.18.17 by Aaron Bentley
Introduce bzr_remote_path configuration variable
40
    errors,
41
    symbol_versioning,
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
42
    trace,
3958.1.1 by Andrew Bennetts
Report traffic on smart media as transport activity.
43
    ui,
3431.3.11 by Andrew Bennetts
Push remote_path_from_transport logic into SmartClientMedium, removing special-casing of bzr+http from _SmartClient.
44
    urlutils,
1551.18.17 by Aaron Bentley
Introduce bzr_remote_path configuration variable
45
    )
4326.2.1 by Jonathan Lange
Show the number of VFS calls in -Dhpss output.
46
from bzrlib.smart import client, protocol, request, vfs
3066.2.1 by John Arbash Meinel
We don't require paramiko for bzr+ssh.
47
from bzrlib.transport import ssh
3530.1.1 by John Arbash Meinel
Make bzrlib.smart use lazy imports.
48
""")
4332.3.17 by Robert Collins
Check revisions as we cross check the revision index, rather than in a separate pass.
49
from bzrlib import osutils
2018.5.17 by Andrew Bennetts
Paramaterise the commands handled by SmartServerRequestHandler.
50
5011.3.3 by Martin
Reintroduce EINTR handling only for socket object functions and general cleanup
51
# Throughout this module buffer size parameters are either limited to be at
5011.3.11 by Andrew Bennetts
Consolidate changes, try to minimise unnecessary changes and tidy up those that kept.
52
# most _MAX_READ_SIZE, or are ignored and _MAX_READ_SIZE is used instead.
53
# For this module's purposes, MAX_SOCKET_CHUNK is a reasonable size for reads
54
# from non-sockets as well.
55
_MAX_READ_SIZE = osutils.MAX_SOCKET_CHUNK
3565.1.3 by Andrew Bennetts
Define a _MAX_READ_SIZE constant as suggested by John's review.
56
3245.4.16 by Andrew Bennetts
Remove duplication of request version identification logic in wsgi.py
57
def _get_protocol_factory_for_bytes(bytes):
    """Pick the server protocol factory matching the start of a request.

    The version is recognised from the marker that 'bytes' starts with:
    the version three message marker, the version two request marker, or
    (when neither is present) version one.  Callers should pass at least one
    whole line (i.e. bytes containing a newline); with less than that a
    request may be mistaken for version one.

    Typical use would be::

         factory, unused_bytes = _get_protocol_factory_for_bytes(bytes)
         server_protocol = factory(transport, write_func, root_client_path)
         server_protocol.accept_bytes(unused_bytes)

    :param bytes: a str holding the first bytes of the request.
    :returns: 2-tuple of (protocol_factory, unused_bytes).  protocol_factory
        is a callable taking three args: transport, write_func,
        root_client_path.  unused_bytes is 'bytes' with any recognised
        version marker stripped from the front.
    """
    v3_marker = protocol.MESSAGE_VERSION_THREE
    if bytes.startswith(v3_marker):
        return protocol.build_server_protocol_three, bytes[len(v3_marker):]
    v2_marker = protocol.REQUEST_VERSION_TWO
    if bytes.startswith(v2_marker):
        return protocol.SmartServerRequestProtocolTwo, bytes[len(v2_marker):]
    # No marker at all: version one, and every byte belongs to the request.
    return protocol.SmartServerRequestProtocolOne, bytes
87
88
3606.4.1 by Andrew Bennetts
Fix NotImplementedError when probing for smart protocol via HTTP.
89
def _get_line(read_bytes_func):
90
    """Read bytes using read_bytes_func until a newline byte.
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
91
3606.4.1 by Andrew Bennetts
Fix NotImplementedError when probing for smart protocol via HTTP.
92
    This isn't particularly efficient, so should only be used when the
93
    expected size of the line is quite short.
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
94
3606.4.1 by Andrew Bennetts
Fix NotImplementedError when probing for smart protocol via HTTP.
95
    :returns: a tuple of two strs: (line, excess)
96
    """
97
    newline_pos = -1
98
    bytes = ''
99
    while newline_pos == -1:
100
        new_bytes = read_bytes_func(1)
101
        bytes += new_bytes
102
        if new_bytes == '':
103
            # Ran out of bytes before receiving a complete line.
104
            return bytes, ''
105
        newline_pos = bytes.find('\n')
106
    line = bytes[:newline_pos+1]
107
    excess = bytes[newline_pos+1:]
108
    return line, excess
109
110
3565.1.1 by Andrew Bennetts
Read no more then 64k at a time in the smart protocol code.
111
class SmartMedium(object):
    """Behaviour common to client-side and server-side smart media.

    :ivar _push_back_buffer: a str of bytes that were read but not consumed,
        or None when nothing is buffered.  It is never the empty string.
    """

    def __init__(self):
        self._push_back_buffer = None

    def _push_back(self, bytes):
        """Hand bytes back to the medium so the next read returns them.

        Used for bytes that were read but belong to the next request(s).
        Pushing back the empty string is a no-op.

        :param bytes: the str to store as the push-back buffer.
        :raises AssertionError: if a push-back buffer is already present.
        """
        pending = self._push_back_buffer
        if pending is not None:
            raise AssertionError(
                "_push_back called when self._push_back_buffer is %r"
                % (pending,))
        if bytes != '':
            self._push_back_buffer = bytes

    def _get_push_back_buffer(self):
        """Return the push-back buffer and reset it to None.

        :raises AssertionError: if the buffer is the empty string, which
            would be indistinguishable from EOF.
        """
        buffered = self._push_back_buffer
        if buffered == '':
            raise AssertionError(
                '%s._push_back_buffer should never be the empty string, '
                'which can be confused with EOF' % (self,))
        self._push_back_buffer = None
        return buffered

    def read_bytes(self, desired_count):
        """Read some bytes from this medium.

        Pushed-back bytes are returned first, in full and regardless of
        desired_count.  Otherwise the request is capped at _MAX_READ_SIZE and
        delegated to _read_bytes.

        :returns: some bytes, possibly more or less than the number requested
            in 'desired_count' depending on the medium.
        """
        if self._push_back_buffer is None:
            return self._read_bytes(min(desired_count, _MAX_READ_SIZE))
        return self._get_push_back_buffer()

    def _read_bytes(self, count):
        """Do the actual read; must be provided by subclasses."""
        raise NotImplementedError(self._read_bytes)

    def _get_line(self):
        """Read from this medium up to and including the next newline.

        This isn't particularly efficient, so should only be used when the
        expected size of the line is quite short.  Anything read beyond the
        newline is pushed back for the next read.

        :returns: the str returned as 'line' by the module-level _get_line
            helper.
        """
        line, leftover = _get_line(self.read_bytes)
        self._push_back(leftover)
        return line

    def _report_activity(self, bytes, direction):
        """Notify that this medium has activity.

        Implementations should call this from all methods that actually do IO.
        Be careful that it's not called twice, if one method is implemented on
        top of another.

        :param bytes: Number of bytes read or written.
        :param direction: 'read' or 'write' or None.
        """
        ui.ui_factory.report_transport_activity(self, bytes, direction)
177
3565.1.1 by Andrew Bennetts
Read no more then 64k at a time in the smart protocol code.
178
179
class SmartServerStreamMedium(SmartMedium):
    """Handles smart commands coming over a stream.

    The stream may be a pipe connected to sshd, or a tcp socket, or an
    in-process fifo for testing.

    One instance is created for each connected client; it can serve multiple
    requests in the lifetime of the connection.

    The server passes requests through to an underlying backing transport,
    which will typically be a LocalTransport looking at the server's filesystem.

    :ivar _push_back_buffer: a str of bytes that have been read from the stream
        but not used yet, or None if there are no buffered bytes.  Subclasses
        should make sure to exhaust this buffer before reading more bytes from
        the stream.  See also the _push_back method.
    """

    def __init__(self, backing_transport, root_client_path='/'):
        """Construct new server.

        :param backing_transport: Transport for the directory served.
        :param root_client_path: stored on the instance and handed to the
            protocol factory when a request's protocol object is built.
        """
        SmartMedium.__init__(self)
        # backing_transport could be passed to serve instead of __init__
        self.backing_transport = backing_transport
        self.root_client_path = root_client_path
        self.finished = False

    def serve(self):
        """Serve requests until the client disconnects.

        Any exception escaping the loop is reported on stderr and then
        re-raised.
        """
        # Take local references to what we need from sys, because the sys
        # module's globals get set to None during interpreter shutdown.
        from sys import exc_info, stderr
        try:
            while not self.finished:
                self._serve_one_request(self._build_protocol())
        except Exception:
            stderr.write("%s terminating on exception %s\n"
                         % (self, exc_info()[1]))
            raise

    def _build_protocol(self):
        """Identify the version of the incoming request, and return a
        protocol object that can interpret it.

        If more bytes than the version prefix of the request are read, they will
        be fed into the protocol before it is returned.

        :returns: a SmartServerRequestProtocol.
        """
        first_line = self._get_line()
        factory, leftover = _get_protocol_factory_for_bytes(first_line)
        server_protocol = factory(
            self.backing_transport, self._write_out, self.root_client_path)
        server_protocol.accept_bytes(leftover)
        return server_protocol

    def _serve_one_request(self, protocol):
        """Read one request from input, process, send back a response.

        KeyboardInterrupt is always propagated; any other Exception makes the
        medium call terminate_due_to_error instead of propagating.

        :param protocol: a SmartServerRequestProtocol.
        """
        try:
            self._serve_one_request_unguarded(protocol)
        except KeyboardInterrupt:
            raise
        except Exception:
            self.terminate_due_to_error()

    def terminate_due_to_error(self):
        """Called when an unhandled exception from the protocol occurs.

        Must be provided by subclasses.
        """
        raise NotImplementedError(self.terminate_due_to_error)

    def _read_bytes(self, desired_count):
        """Get some bytes from the medium.

        Must be provided by subclasses.

        :param desired_count: number of bytes we want to read.
        """
        raise NotImplementedError(self._read_bytes)
2432.2.2 by Andrew Bennetts
Smart server mediums now detect which protocol version a request is and dispatch accordingly.
259
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
260
261
class SmartServerSocketStreamMedium(SmartServerStreamMedium):
    """A server-side stream medium that talks over a socket."""

    def __init__(self, sock, backing_transport, root_client_path='/'):
        """Constructor.

        :param sock: the socket the server will read from.  It will be put
            into blocking mode.
        :param backing_transport: passed through to SmartServerStreamMedium.
        :param root_client_path: passed through to SmartServerStreamMedium.
        """
        SmartServerStreamMedium.__init__(
            self, backing_transport, root_client_path=root_client_path)
        sock.setblocking(True)
        self.socket = sock

    def _serve_one_request_unguarded(self, protocol):
        """Feed socket data to 'protocol' until it asks for no more.

        An empty read marks this medium as finished and returns immediately.
        Otherwise, once the protocol wants no more bytes, its unused data is
        pushed back for the next request.
        """
        while protocol.next_read_size():
            # We can safely try to read large chunks.  If there is less data
            # than MAX_SOCKET_CHUNK ready, the socket will just return a
            # short read immediately rather than block.
            chunk = self.read_bytes(osutils.MAX_SOCKET_CHUNK)
            if chunk != '':
                protocol.accept_bytes(chunk)
                continue
            self.finished = True
            return

        self._push_back(protocol.unused_data)

    def _read_bytes(self, desired_count):
        """Read from the socket via osutils.read_bytes_from_socket.

        desired_count is not forwarded to that helper.
        """
        return osutils.read_bytes_from_socket(
            self.socket, self._report_activity)

    def terminate_due_to_error(self):
        """Close the socket and mark this medium as finished."""
        # TODO: This should log to a server log file, but no such thing
        # exists yet.  Andrew Bennetts 2006-09-29.
        self.socket.close()
        self.finished = True

    def _write_out(self, bytes):
        """Send 'bytes' over the socket, logging timing under -Dhpss."""
        started = osutils.timer_func()
        osutils.send_all(self.socket, bytes, self._report_activity)
        if 'hpss' not in debug.debug_flags:
            return
        thread_id = thread.get_ident()
        message = ('%12s: [%s] %d bytes to the socket in %.3fs'
                   % ('wrote', thread_id, len(bytes),
                      osutils.timer_func() - started))
        trace.mutter(message)
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
305
306
307
class SmartServerPipeStreamMedium(SmartServerStreamMedium):
    """A server-side stream medium reading and writing a pair of files."""

    def __init__(self, in_file, out_file, backing_transport):
        """Construct new server.

        :param in_file: Python file from which requests can be read.
        :param out_file: Python file to write responses.
        :param backing_transport: Transport for the directory served.
        """
        SmartServerStreamMedium.__init__(self, backing_transport)
        if sys.platform == 'win32':
            # force binary mode for files
            import msvcrt
            for stream in (in_file, out_file):
                get_fileno = getattr(stream, 'fileno', None)
                if not get_fileno:
                    # Nothing to switch on objects without a fileno.
                    continue
                msvcrt.setmode(get_fileno(), os.O_BINARY)
        self._in = in_file
        self._out = out_file

    def _serve_one_request_unguarded(self, protocol):
        """Feed input to 'protocol' until the request is complete or EOF.

        The output file is flushed before returning in either case.  An empty
        read marks this medium as finished.
        """
        # We need to be careful not to read past the end of the current
        # request, or else the read from the pipe will block, so we use
        # protocol.next_read_size().
        wanted = protocol.next_read_size()
        while wanted != 0:
            chunk = self.read_bytes(wanted)
            if chunk == '':
                # Connection has been closed.
                self.finished = True
                break
            protocol.accept_bytes(chunk)
            wanted = protocol.next_read_size()
        # Reached both when the request is fully served and on EOF.
        self._out.flush()

    def _read_bytes(self, desired_count):
        """Read up to desired_count bytes from the input file."""
        return self._in.read(desired_count)

    def terminate_due_to_error(self):
        """Close the output file and mark this medium as finished."""
        # TODO: This should log to a server log file, but no such thing
        # exists yet.  Andrew Bennetts 2006-09-29.
        self._out.close()
        self.finished = True

    def _write_out(self, bytes):
        """Write 'bytes' to the output file."""
        self._out.write(bytes)
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
356
357
3565.1.2 by Andrew Bennetts
Delete some more code, fix some bugs, add more comments.
358
class SmartClientMediumRequest(object):
    """A request on a SmartClientMedium.

    Bytes are supplied to a request with accept_bytes, and afterwards the
    response bytes are fetched with read_bytes.

    For instance:
    request.accept_bytes('123')
    request.finished_writing()
    result = request.read_bytes(3)
    request.finished_reading()

    It is up to the individual SmartClientMedium whether multiple concurrent
    requests can exist. See SmartClientMedium.get_request to obtain instances
    of SmartClientMediumRequest, and the concrete Medium you are using for
    details on concurrency and pipelining.
    """

    def __init__(self, medium):
        """Construct a SmartClientMediumRequest for the medium medium."""
        self._medium = medium
        # we track state by constants - we may want to use the same
        # pattern as BodyReader if it gets more complex.
        # valid states are: "writing", "reading", "done"
        self._state = "writing"

    def accept_bytes(self, bytes):
        """Accept bytes for inclusion in this request.

        This method may not be called after finished_writing() has been
        called.  It depends upon the Medium whether or not the bytes will be
        immediately transmitted. Message based Mediums will tend to buffer the
        bytes until finished_writing() is called.

        :param bytes: A bytestring.
        :raises errors.WritingCompleted: if the request is no longer in the
            "writing" state.
        """
        if self._state == "writing":
            self._accept_bytes(bytes)
            return
        raise errors.WritingCompleted(self)

    def _accept_bytes(self, bytes):
        """Helper for accept_bytes.

        accept_bytes checks the state of the request to determine if bytes
        should be accepted. After that it hands off to _accept_bytes to do the
        actual acceptance.
        """
        raise NotImplementedError(self._accept_bytes)

    def finished_reading(self):
        """Inform the request that all desired data has been read.

        This will remove the request from the pipeline for its medium (if the
        medium supports pipelining) and any further calls to methods on the
        request will raise ReadingCompleted.

        :raises errors.WritingNotComplete: if still in the "writing" state.
        :raises errors.ReadingCompleted: if not in the "reading" state.
        """
        state = self._state
        if state == "writing":
            raise errors.WritingNotComplete(self)
        elif state != "reading":
            raise errors.ReadingCompleted(self)
        # The state is switched before the helper runs.
        self._state = "done"
        self._finished_reading()

    def _finished_reading(self):
        """Helper for finished_reading.

        finished_reading checks the state of the request to determine if
        finished_reading is allowed, and if it is hands off to _finished_reading
        to perform the action.
        """
        raise NotImplementedError(self._finished_reading)

    def finished_writing(self):
        """Finish the writing phase of this request.

        This will flush all pending data for this request along the medium.
        After calling finished_writing, you may not call accept_bytes anymore.

        :raises errors.WritingCompleted: if the request is no longer in the
            "writing" state.
        """
        if self._state != "writing":
            raise errors.WritingCompleted(self)
        # The state is switched before the helper runs.
        self._state = "reading"
        self._finished_writing()

    def _finished_writing(self):
        """Helper for finished_writing.

        finished_writing checks the state of the request to determine if
        finished_writing is allowed, and if it is hands off to _finished_writing
        to perform the action.
        """
        raise NotImplementedError(self._finished_writing)

    def read_bytes(self, count):
        """Read bytes from this request's response.

        This method will block and wait for count bytes to be read. It may not
        be invoked until finished_writing() has been called - this is to ensure
        a message-based approach to requests, for compatibility with message
        based mediums like HTTP.

        :raises errors.WritingNotComplete: if still in the "writing" state.
        :raises errors.ReadingCompleted: if not in the "reading" state.
        """
        state = self._state
        if state == "writing":
            raise errors.WritingNotComplete(self)
        elif state != "reading":
            raise errors.ReadingCompleted(self)
        return self._read_bytes(count)

    def _read_bytes(self, count):
        """Helper for SmartClientMediumRequest.read_bytes.

        read_bytes checks the state of the request to determine if bytes
        should be read. After that it hands off to _read_bytes to do the
        actual read.

        By default this forwards to self._medium.read_bytes because we are
        operating on the medium's stream.
        """
        return self._medium.read_bytes(count)

    def read_line(self):
        """Read one newline-terminated line of the response.

        :returns: the line, including its trailing newline.
        :raises errors.ConnectionReset: if the line read does not end in a
            newline.
        """
        line = self._read_line()
        if line.endswith('\n'):
            return line
        # end of file encountered reading from server
        raise errors.ConnectionReset(
            "Unexpected end of message. Please check connectivity "
            "and permissions, and report a bug if problems persist.")

    def _read_line(self):
        """Helper for SmartClientMediumRequest.read_line.

        By default this forwards to self._medium._get_line because we are
        operating on the medium's stream.
        """
        return self._medium._get_line()
492
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
493
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
494
class _DebugCounter(object):
    """An object that counts the HPSS calls made to each client medium.

    When a medium is garbage-collected, or failing that when atexit functions
    are run, the total number of calls made on that medium are reported via
    trace.note.
    """

    def __init__(self):
        # medium -> dict(count=..., vfs_count=..., medium_repr=...).  Keyed
        # weakly so that tracking never extends a medium's lifetime.
        self.counts = weakref.WeakKeyDictionary()
        # id(weakref) -> weakref, for the weakrefs created by track().  A
        # weakref's callback is only invoked while the weakref object itself
        # is still alive, so they have to be held somewhere.
        self._refs = {}
        client._SmartClient.hooks.install_named_hook(
            'call', self.increment_call_count, 'hpss call counter')
        atexit.register(self.flush_all)

    def track(self, medium):
        """Start tracking calls made to a medium.

        This only keeps a weakref to the medium, so shouldn't affect the
        medium's lifetime.

        :param medium: the client medium to count calls for.  Its repr is
            captured now, so that it can still be reported once the medium
            itself is gone.
        """
        medium_repr = repr(medium)
        value = dict(count=0, vfs_count=0, medium_repr=medium_repr)
        # Add this medium to the WeakKeyDictionary
        self.counts[medium] = value

        def medium_collected(ref):
            # Report from the captured tally rather than looking the medium
            # up again: by now the medium is dead, so the WeakKeyDictionary
            # can no longer be indexed with it.
            self._refs.pop(id(ref), None)
            self._report(value)

        ref = weakref.ref(medium, medium_collected)
        # Keep the weakref alive, otherwise its callback would be silently
        # dropped and nothing would be reported at garbage-collection time.
        self._refs[id(ref)] = ref

    def increment_call_count(self, params):
        """Hook function for the 'call' hook: count one more call.

        :param params: the hook parameters; its .medium and .method
            attributes are read.
        """
        # Increment the count in the WeakKeyDictionary
        value = self.counts[params.medium]
        value['count'] += 1
        try:
            request_method = request.request_handlers.get(params.method)
        except KeyError:
            # A method we don't know about doesn't count as a VFS method.
            return
        if issubclass(request_method, vfs.VfsRequest):
            value['vfs_count'] += 1

    def done(self, ref):
        """Report and reset the tally of a medium that is still tracked.

        :param ref: the medium itself (a key of self.counts), as passed by
            flush_all.
        """
        self._report(self.counts[ref])

    def _report(self, value):
        """Emit the totals held in a tally dict, then zero them."""
        count, vfs_count, medium_repr = (
            value['count'], value['vfs_count'], value['medium_repr'])
        # In case the same tally is reported twice (by the weakref callback
        # and by the atexit function), set the call count back to 0 so this
        # item won't be reported twice.
        value['count'] = 0
        value['vfs_count'] = 0
        if count != 0:
            trace.note('HPSS calls: %d (%d vfs) %s',
                       count, vfs_count, medium_repr)

    def flush_all(self):
        """Report the totals of every medium that is still alive."""
        # Copy the keys first: the dictionary may shrink while we iterate if
        # a medium is collected.
        for ref in list(self.counts.keys()):
            self.done(ref)
552
553
# The shared _DebugCounter instance.  It stays None until a SmartClientMedium
# is constructed while the 'hpss' debug flag is set, at which point
# SmartClientMedium.__init__ creates it.
_debug_counter = None
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
554
555
3565.1.1 by Andrew Bennetts
Read no more then 64k at a time in the smart protocol code.
556
class SmartClientMedium(SmartMedium):
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
557
    """Smart client is a medium for sending smart protocol requests over."""
558
3431.3.3 by Andrew Bennetts
Set 'base' in SmartClientMedium base class.
559
    def __init__(self, base):
3241.1.1 by Andrew Bennetts
Shift protocol version querying from RemoteBzrDirFormat into SmartClientMedium.
560
        super(SmartClientMedium, self).__init__()
3431.3.3 by Andrew Bennetts
Set 'base' in SmartClientMedium base class.
561
        self.base = base
3241.1.4 by Andrew Bennetts
Use get_smart_medium as suggested by Robert, and deal with the fallout.
562
        self._protocol_version_error = None
3241.1.1 by Andrew Bennetts
Shift protocol version querying from RemoteBzrDirFormat into SmartClientMedium.
563
        self._protocol_version = None
3245.4.47 by Andrew Bennetts
Don't automatically send 'hello' requests from RemoteBzrDirFormat.probe_transport unless we have to (i.e. the transport is HTTP).
564
        self._done_hello = False
3435.1.1 by Andrew Bennetts
Define _remote_is_at_least_1_2 on SmartClientMedium base class, rather than just SmartClientStreamMedium.
565
        # Be optimistic: we assume the remote end can accept new remote
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
566
        # requests until we get an error saying otherwise.
3453.4.10 by Andrew Bennetts
Change _is_remote_at_least to _is_remote_before.
567
        # _remote_version_is_before tracks the bzr version the remote side
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
568
        # can be based on what we've seen so far.
3453.4.10 by Andrew Bennetts
Change _is_remote_at_least to _is_remote_before.
569
        self._remote_version_is_before = None
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
570
        # Install debug hook function if debug flag is set.
3731.2.1 by Andrew Bennetts
Show total HPSS calls (if any) on stderr when -Dhpss is active.
571
        if 'hpss' in debug.debug_flags:
3731.2.5 by Andrew Bennetts
Rework hpss call counter.
572
            global _debug_counter
573
            if _debug_counter is None:
574
                _debug_counter = _DebugCounter()
575
            _debug_counter.track(self)
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
576
3453.4.10 by Andrew Bennetts
Change _is_remote_at_least to _is_remote_before.
577
    def _is_remote_before(self, version_tuple):
3502.1.1 by Matt Nordhoff
Fix a docstring typo, and a two-expression ``raise`` statement
578
        """Is it possible the remote side supports RPCs for a given version?
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
579
580
        Typical use::
581
582
            needed_version = (1, 2)
3453.4.10 by Andrew Bennetts
Change _is_remote_at_least to _is_remote_before.
583
            if medium._is_remote_before(needed_version):
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
584
                fallback_to_pre_1_2_rpc()
585
            else:
586
                try:
587
                    do_1_2_rpc()
588
                except UnknownSmartMethod:
3453.4.9 by Andrew Bennetts
Rename _remote_is_not to _remember_remote_is_before.
589
                    medium._remember_remote_is_before(needed_version)
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
590
                    fallback_to_pre_1_2_rpc()
591
3453.4.9 by Andrew Bennetts
Rename _remote_is_not to _remember_remote_is_before.
592
        :seealso: _remember_remote_is_before
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
593
        """
3453.4.10 by Andrew Bennetts
Change _is_remote_at_least to _is_remote_before.
594
        if self._remote_version_is_before is None:
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
595
            # So far, the remote side seems to support everything
3453.4.10 by Andrew Bennetts
Change _is_remote_at_least to _is_remote_before.
596
            return False
597
        return version_tuple >= self._remote_version_is_before
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
598
3453.4.9 by Andrew Bennetts
Rename _remote_is_not to _remember_remote_is_before.
599
    def _remember_remote_is_before(self, version_tuple):
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
600
        """Tell this medium that the remote side is older the given version.
601
3453.4.10 by Andrew Bennetts
Change _is_remote_at_least to _is_remote_before.
602
        :seealso: _is_remote_before
3453.4.1 by Andrew Bennetts
Better infrastructure on SmartClientMedium for tracking the remote version.
603
        """
3453.4.10 by Andrew Bennetts
Change _is_remote_at_least to _is_remote_before.
604
        if (self._remote_version_is_before is not None and
605
            version_tuple > self._remote_version_is_before):
4017.3.3 by Robert Collins
Review feedback - make RemoteRepository.initialize use helpers, and version-lock the new method to not attempt the method on older servers.
606
            # We have been told that the remote side is older than some version
607
            # which is newer than a previously supplied older-than version.
608
            # This indicates that some smart verb call is not guarded
609
            # appropriately (it should simply not have been tried).
4797.49.1 by Andrew Bennetts
First, fix _remember_remote_is_before to never raise AssertionError for what is a very minor bug.
610
            trace.mutter(
3453.4.9 by Andrew Bennetts
Rename _remote_is_not to _remember_remote_is_before.
611
                "_remember_remote_is_before(%r) called, but "
612
                "_remember_remote_is_before(%r) was called previously."
4797.49.1 by Andrew Bennetts
First, fix _remember_remote_is_before to never raise AssertionError for what is a very minor bug.
613
                , version_tuple, self._remote_version_is_before)
614
            if 'hpss' in debug.debug_flags:
615
                ui.ui_factory.show_warning(
616
                    "_remember_remote_is_before(%r) called, but "
617
                    "_remember_remote_is_before(%r) was called previously."
618
                    % (version_tuple, self._remote_version_is_before))
619
            return
3453.4.10 by Andrew Bennetts
Change _is_remote_at_least to _is_remote_before.
620
        self._remote_version_is_before = version_tuple
3241.1.1 by Andrew Bennetts
Shift protocol version querying from RemoteBzrDirFormat into SmartClientMedium.
621
622
    def protocol_version(self):
3245.4.47 by Andrew Bennetts
Don't automatically send 'hello' requests from RemoteBzrDirFormat.probe_transport unless we have to (i.e. the transport is HTTP).
623
        """Find out if 'hello' smart request works."""
3241.1.4 by Andrew Bennetts
Use get_smart_medium as suggested by Robert, and deal with the fallout.
624
        if self._protocol_version_error is not None:
625
            raise self._protocol_version_error
3245.4.47 by Andrew Bennetts
Don't automatically send 'hello' requests from RemoteBzrDirFormat.probe_transport unless we have to (i.e. the transport is HTTP).
626
        if not self._done_hello:
3241.1.4 by Andrew Bennetts
Use get_smart_medium as suggested by Robert, and deal with the fallout.
627
            try:
628
                medium_request = self.get_request()
629
                # Send a 'hello' request in protocol version one, for maximum
630
                # backwards compatibility.
3530.1.2 by John Arbash Meinel
missed one of the imports
631
                client_protocol = protocol.SmartClientRequestProtocolOne(medium_request)
3245.4.47 by Andrew Bennetts
Don't automatically send 'hello' requests from RemoteBzrDirFormat.probe_transport unless we have to (i.e. the transport is HTTP).
632
                client_protocol.query_version()
633
                self._done_hello = True
3241.1.4 by Andrew Bennetts
Use get_smart_medium as suggested by Robert, and deal with the fallout.
634
            except errors.SmartProtocolError, e:
635
                # Cache the error, just like we would cache a successful
636
                # result.
637
                self._protocol_version_error = e
638
                raise
3245.4.47 by Andrew Bennetts
Don't automatically send 'hello' requests from RemoteBzrDirFormat.probe_transport unless we have to (i.e. the transport is HTTP).
639
        return '2'
640
641
    def should_probe(self):
642
        """Should RemoteBzrDirFormat.probe_transport send a smart request on
643
        this medium?
644
645
        Some transports are unambiguously smart-only; there's no need to check
646
        if the transport is able to carry smart requests, because that's all
647
        it is for.  In those cases, this method should return False.
648
649
        But some HTTP transports can sometimes fail to carry smart requests,
650
        but still be usuable for accessing remote bzrdirs via plain file
651
        accesses.  So for those transports, their media should return True here
652
        so that RemoteBzrDirFormat can determine if it is appropriate for that
653
        transport.
654
        """
655
        return False
3241.1.1 by Andrew Bennetts
Shift protocol version querying from RemoteBzrDirFormat into SmartClientMedium.
656
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
657
    def disconnect(self):
658
        """If this medium maintains a persistent connection, close it.
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
659
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
660
        The default implementation does nothing.
661
        """
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
662
3431.3.11 by Andrew Bennetts
Push remote_path_from_transport logic into SmartClientMedium, removing special-casing of bzr+http from _SmartClient.
663
    def remote_path_from_transport(self, transport):
664
        """Convert transport into a path suitable for using in a request.
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
665
3431.3.11 by Andrew Bennetts
Push remote_path_from_transport logic into SmartClientMedium, removing special-casing of bzr+http from _SmartClient.
666
        Note that the resulting remote path doesn't encode the host name or
667
        anything but path, so it is only safe to use it in requests sent over
668
        the medium from the matching transport.
669
        """
670
        medium_base = urlutils.join(self.base, '/')
671
        rel_url = urlutils.relative_url(medium_base, transport.base)
672
        return urllib.unquote(rel_url)
673
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
674
675
class SmartClientStreamMedium(SmartClientMedium):
    """Common base class for the stream based media.

    A SmartClientStreamMedium operates on a stream.  Every subclass hands out
    the same SmartClientStreamMediumRequest type for its requests, and
    should implement _accept_bytes and _read_bytes so that those request
    objects can send and receive bytes.
    """

    def __init__(self, base):
        SmartClientMedium.__init__(self, base)
        # The request currently registered on this medium, or None.
        self._current_request = None

    def accept_bytes(self, bytes):
        """Send bytes by passing them on to self._accept_bytes."""
        self._accept_bytes(bytes)

    def __del__(self):
        """Close the stream when the medium goes away.

        The SmartClientStreamMedium knows how to close the stream when it is
        finished with it.
        """
        self.disconnect()

    def _flush(self):
        """Flush the output stream.

        SmartClientStreamMediumRequest relies on this to make sure all the
        data of a request has been sent, to avoid long timeouts or
        deadlocks.  Not implemented in this base class.
        """
        raise NotImplementedError(self._flush)

    def get_request(self):
        """See SmartClientMedium.get_request().

        A SmartClientStreamMedium always answers with a
        SmartClientStreamMediumRequest bound to itself.
        """
        return SmartClientStreamMediumRequest(self)
712
713
714
class SmartSimplePipesClientMedium(SmartClientStreamMedium):
    """A client medium using simple pipes.

    This client does not manage the pipes: it assumes they will always be
    open.

    Reads are retried when readable_pipe.read raises IOError or OSError with
    an errno of EINTR, so retrying the read must be safe.  Plain CPython
    fileobjects (such as used for sys.stdin) are safe.
    """

    def __init__(self, readable_pipe, writeable_pipe, base):
        """Create a medium over an existing pair of pipes.

        :param readable_pipe: file-like object responses are read from.
        :param writeable_pipe: file-like object requests are written to.
        :param base: passed on to SmartClientStreamMedium.
        """
        SmartClientStreamMedium.__init__(self, base)
        self._writeable_pipe = writeable_pipe
        self._readable_pipe = readable_pipe

    def _accept_bytes(self, bytes):
        """See SmartClientStreamMedium.accept_bytes."""
        self._writeable_pipe.write(bytes)
        sent = len(bytes)
        self._report_activity(sent, 'write')

    def _flush(self):
        """See SmartClientStreamMedium._flush()."""
        self._writeable_pipe.flush()

    def _read_bytes(self, count):
        """See SmartClientStreamMedium._read_bytes."""
        # until_no_eintr repeats the read if it is interrupted by EINTR.
        data = osutils.until_no_eintr(self._readable_pipe.read, count)
        self._report_activity(len(data), 'read')
        return data
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
743
744
745
class SmartSSHClientMedium(SmartClientStreamMedium):
    """A client medium using SSH."""

    def __init__(self, host, port=None, username=None, password=None,
            base=None, vendor=None, bzr_remote_path=None):
        """Creates a client that will connect on the first use.

        :param host: host to connect to.
        :param port: port to connect to, or None.
        :param username: user name handed to the ssh vendor, or None.
        :param password: password handed to the ssh vendor, or None.
        :param base: passed on to SmartClientStreamMedium.
        :param vendor: An optional override for the ssh vendor to use. See
            bzrlib.transport.ssh for details on ssh vendors.
        :param bzr_remote_path: the command run on the remote side to start
            the server (it is given the 'serve --inet ...' arguments).
        """
        self._connected = False
        self._host = host
        self._password = password
        self._port = port
        self._username = username
        # for the benefit of progress making a short description of this
        # transport
        self._scheme = 'bzr+ssh'
        # SmartClientStreamMedium stores the repr of this object in its
        # _DebugCounter so we have to store all the values used in our repr
        # method before calling the super init.
        SmartClientStreamMedium.__init__(self, base)
        self._read_from = None
        self._ssh_connection = None
        self._vendor = vendor
        self._write_to = None
        self._bzr_remote_path = bzr_remote_path

    def __repr__(self):
        """Return a short description such as
        SmartSSHClientMedium(bzr+ssh://user@host:port/).

        The 'user@' and ':port' parts are left out when the corresponding
        value is None, rather than rendering the text 'None'.
        """
        if self._port is None:
            maybe_port = ''
        else:
            maybe_port = ':%s' % self._port
        if self._username is None:
            maybe_user = ''
        else:
            maybe_user = '%s@' % self._username
        return "%s(%s://%s%s%s/)" % (
            self.__class__.__name__,
            self._scheme,
            maybe_user,
            self._host,
            maybe_port)

    def _accept_bytes(self, bytes):
        """See SmartClientStreamMedium.accept_bytes."""
        self._ensure_connection()
        self._write_to.write(bytes)
        self._report_activity(len(bytes), 'write')

    def disconnect(self):
        """See SmartClientMedium.disconnect().

        Every one of the two channels and the ssh connection gets its close()
        call even if an earlier close() raises, and the medium is always
        marked as disconnected afterwards.  The first error, if any, still
        propagates to the caller.
        """
        if not self._connected:
            return
        try:
            self._read_from.close()
        finally:
            try:
                self._write_to.close()
            finally:
                try:
                    self._ssh_connection.close()
                finally:
                    self._connected = False

    def _ensure_connection(self):
        """Connect this medium if not already connected."""
        if self._connected:
            return
        if self._vendor is None:
            vendor = ssh._get_ssh_vendor()
        else:
            vendor = self._vendor
        self._ssh_connection = vendor.connect_ssh(self._username,
                self._password, self._host, self._port,
                command=[self._bzr_remote_path, 'serve', '--inet',
                         '--directory=/', '--allow-writes'])
        self._read_from, self._write_to = \
            self._ssh_connection.get_filelike_channels()
        self._connected = True

    def _flush(self):
        """See SmartClientStreamMedium._flush()."""
        self._write_to.flush()

    def _read_bytes(self, count):
        """See SmartClientStreamMedium.read_bytes.

        :raises MediumNotConnected: if no connection has been made yet.
        """
        if not self._connected:
            raise errors.MediumNotConnected(self)
        # Never ask for more than _MAX_READ_SIZE in a single read.
        bytes_to_read = min(count, _MAX_READ_SIZE)
        bytes = self._read_from.read(bytes_to_read)
        self._report_activity(len(bytes), 'read')
        return bytes
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
828
829
3004.2.1 by Vincent Ladeuil
Fix 150860 by leaving port as user specified it.
830
# NOTE(review): BZR_DEFAULT_INTERFACE is not referenced in this part of the
# file; presumably it is the default interface for the bzr:// server, with
# None meaning that none is preselected -- confirm against its callers.
BZR_DEFAULT_INTERFACE = None
# Port 4155 is the default port for bzr://, registered with IANA.
# SmartTCPClientMedium connects to it when no port was given.
BZR_DEFAULT_PORT = 4155
833
834
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
835
class SmartTCPClientMedium(SmartClientStreamMedium):
836
    """A client medium using TCP."""
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
837
3431.3.1 by Andrew Bennetts
First rough cut of a fix for bug #230550, by adding .base to SmartClientMedia rather than relying on other objects to track this accurately while reusing client media.
838
    def __init__(self, host, port, base):
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
839
        """Creates a client that will connect on the first use."""
3431.3.3 by Andrew Bennetts
Set 'base' in SmartClientMedium base class.
840
        SmartClientStreamMedium.__init__(self, base)
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
841
        self._connected = False
842
        self._host = host
843
        self._port = port
844
        self._socket = None
845
846
    def _accept_bytes(self, bytes):
847
        """See SmartClientMedium.accept_bytes."""
848
        self._ensure_connection()
5011.3.9 by Andrew Bennetts
Remove _send_bytes_chunked.
849
        osutils.send_all(self._socket, bytes, self._report_activity)
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
850
851
    def disconnect(self):
852
        """See SmartClientMedium.disconnect()."""
853
        if not self._connected:
854
            return
5011.3.1 by Martin
Revert second-phase EINTR changes
855
        self._socket.close()
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
856
        self._socket = None
857
        self._connected = False
858
859
    def _ensure_connection(self):
860
        """Connect this medium if not already connected."""
861
        if self._connected:
862
            return
3004.2.1 by Vincent Ladeuil
Fix 150860 by leaving port as user specified it.
863
        if self._port is None:
864
            port = BZR_DEFAULT_PORT
865
        else:
866
            port = int(self._port)
3711.2.2 by Jelmer Vernooij
Avoid using AI_ADDRCONFIG since it's not portable.
867
        try:
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
868
            sockaddrs = socket.getaddrinfo(self._host, port, socket.AF_UNSPEC,
3711.2.2 by Jelmer Vernooij
Avoid using AI_ADDRCONFIG since it's not portable.
869
                socket.SOCK_STREAM, 0, 0)
870
        except socket.gaierror, (err_num, err_msg):
871
            raise errors.ConnectionError("failed to lookup %s:%d: %s" %
872
                    (self._host, port, err_msg))
3711.2.3 by Jelmer Vernooij
Add comment.
873
        # Initialize err in case there are no addresses returned:
3665.4.2 by Jelmer Vernooij
Fall through to next available address if previous fails.
874
        err = socket.error("no address found for %s" % self._host)
3665.4.1 by Jelmer Vernooij
Support IPv6 in the smart server.
875
        for (family, socktype, proto, canonname, sockaddr) in sockaddrs:
876
            try:
3665.4.2 by Jelmer Vernooij
Fall through to next available address if previous fails.
877
                self._socket = socket.socket(family, socktype, proto)
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
878
                self._socket.setsockopt(socket.IPPROTO_TCP,
3665.4.2 by Jelmer Vernooij
Fall through to next available address if previous fails.
879
                                        socket.TCP_NODELAY, 1)
3665.4.1 by Jelmer Vernooij
Support IPv6 in the smart server.
880
                self._socket.connect(sockaddr)
881
            except socket.error, err:
3665.4.2 by Jelmer Vernooij
Fall through to next available address if previous fails.
882
                if self._socket is not None:
883
                    self._socket.close()
884
                self._socket = None
885
                continue
886
            break
887
        if self._socket is None:
888
            # socket errors either have a (string) or (errno, string) as their
889
            # args.
890
            if type(err.args) is str:
891
                err_msg = err.args
892
            else:
893
                err_msg = err.args[1]
894
            raise errors.ConnectionError("failed to connect to %s:%d: %s" %
895
                    (self._host, port, err_msg))
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
896
        self._connected = True
897
898
    def _flush(self):
899
        """See SmartClientStreamMedium._flush().
3943.8.1 by Marius Kruger
remove all trailing whitespace from bzr source
900
901
        For TCP we do no flushing. We may want to turn off TCP_NODELAY and
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
902
        add a means to do a flush, but that can be done in the future.
903
        """
904
905
    def _read_bytes(self, count):
906
        """See SmartClientMedium.read_bytes."""
907
        if not self._connected:
908
            raise errors.MediumNotConnected(self)
5011.3.11 by Andrew Bennetts
Consolidate changes, try to minimise unnecessary changes and tidy up those that kept.
909
        return osutils.read_bytes_from_socket(
910
            self._socket, self._report_activity)
2018.5.2 by Andrew Bennetts
Start splitting bzrlib/transport/smart.py into a package.
911
912
913
class SmartClientStreamMediumRequest(SmartClientMediumRequest):
    """A SmartClientMediumRequest that works with a SmartClientStreamMedium."""

    def __init__(self, medium):
        """Create the request and register it as the medium's current one.

        :param medium: The medium this request will be sent over.
        :raises TooManyConcurrentRequests: if the medium already has a
            current request.
        """
        SmartClientMediumRequest.__init__(self, medium)
        stream_medium = self._medium
        # Concurrency safety check.  If some streams start allowing
        # concurrent requests - i.e. via multiplexing - then this check
        # should be moved to SmartClientStreamMedium.get_request, and the
        # setting/unsetting of _current_request likewise moved into that
        # class: but it's unneeded overhead for now. RBC 20060922
        if stream_medium._current_request is not None:
            raise errors.TooManyConcurrentRequests(stream_medium)
        stream_medium._current_request = self

    def _accept_bytes(self, bytes):
        """See SmartClientMediumRequest._accept_bytes.

        The bytes are handed straight to self._medium._accept_bytes, because
        this request operates on the medium's stream.
        """
        stream_medium = self._medium
        stream_medium._accept_bytes(bytes)

    def _finished_reading(self):
        """See SmartClientMediumRequest._finished_reading.

        Resets _current_request on self._medium so that a new request can be
        created.

        :raises AssertionError: if this request is not the medium's current
            request.
        """
        stream_medium = self._medium
        if stream_medium._current_request is self:
            stream_medium._current_request = None
        else:
            raise AssertionError()

    def _finished_writing(self):
        """See SmartClientMediumRequest._finished_writing.

        Calls self._medium._flush to ensure all bytes are transmitted.
        """
        stream_medium = self._medium
        stream_medium._flush()
951
4382.4.2 by Andrew Bennetts
Refactor duplicated SmartServerSocketStreamMedium._read_bytes and SmartTCPClientMedium._read_bytes to share a common implementation with the best parts of both. Includes Robert's review feedback.
952