~bzr-pqm/bzr/bzr.dev

2052.3.2 by John Arbash Meinel
Change Copyright .. by Canonical to Copyright ... Canonical
1
# Copyright (C) 2005 Canonical Ltd
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
17
"""Tests for the urlutils wrapper."""
18
19
import os
1830.3.17 by John Arbash Meinel
list_files() with wrong normalized_filename code raises exceptions. Fix this
20
import re
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
21
import sys
22
2279.4.2 by Alexander Belchenko
Don't do normpath after abspath, because this function is called inside abspath
23
from bzrlib import osutils, urlutils, win32utils
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
24
import bzrlib
1685.1.55 by John Arbash Meinel
Adding bzrlib.urlutils.join() to handle joining URLs
25
from bzrlib.errors import InvalidURL, InvalidURLJoin
1685.1.75 by Wouter van Heyst
more tests handle LANG=C
26
from bzrlib.tests import TestCaseInTempDir, TestCase, TestSkipped
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
27
28
29
class TestUrlToPath(TestCase):
30
    
1685.1.49 by John Arbash Meinel
Added bzrlib.urlutils.split and basename + dirname
31
    def test_basename(self):
32
        # bzrlib.urlutils.basename
33
        # Test bzrlib.urlutils.split()
34
        basename = urlutils.basename
35
        if sys.platform == 'win32':
36
            self.assertRaises(InvalidURL, basename, 'file:///path/to/foo')
37
            self.assertEqual('foo', basename('file:///C|/foo'))
1685.1.78 by Wouter van Heyst
more code cleanup
38
            self.assertEqual('foo', basename('file:///C:/foo'))
39
            self.assertEqual('', basename('file:///C:/'))
1685.1.49 by John Arbash Meinel
Added bzrlib.urlutils.split and basename + dirname
40
        else:
41
            self.assertEqual('foo', basename('file:///foo'))
42
            self.assertEqual('', basename('file:///'))
43
44
        self.assertEqual('foo', basename('http://host/path/to/foo'))
45
        self.assertEqual('foo', basename('http://host/path/to/foo/'))
46
        self.assertEqual('',
47
            basename('http://host/path/to/foo/', exclude_trailing_slash=False))
48
        self.assertEqual('path', basename('http://host/path'))
49
        self.assertEqual('', basename('http://host/'))
50
        self.assertEqual('', basename('http://host'))
51
        self.assertEqual('path', basename('http:///nohost/path'))
52
53
        self.assertEqual('path', basename('random+scheme://user:pass@ahost:port/path'))
54
        self.assertEqual('path', basename('random+scheme://user:pass@ahost:port/path/'))
55
        self.assertEqual('', basename('random+scheme://user:pass@ahost:port/'))
56
57
        # relative paths
58
        self.assertEqual('foo', basename('path/to/foo'))
59
        self.assertEqual('foo', basename('path/to/foo/'))
60
        self.assertEqual('', basename('path/to/foo/',
61
            exclude_trailing_slash=False))
62
        self.assertEqual('foo', basename('path/../foo'))
63
        self.assertEqual('foo', basename('../path/foo'))
64
1685.1.51 by John Arbash Meinel
Working on getting normalize_url working.
65
    def test_normalize_url_files(self):
66
        # Test that local paths are properly normalized
67
        normalize_url = urlutils.normalize_url
68
69
        def norm_file(expected, path):
70
            url = normalize_url(path)
71
            self.assertStartsWith(url, 'file:///')
72
            if sys.platform == 'win32':
73
                url = url[len('file:///C:'):]
74
            else:
75
                url = url[len('file://'):]
76
1685.1.53 by John Arbash Meinel
Updated normalize_url
77
            self.assertEndsWith(url, expected)
1685.1.51 by John Arbash Meinel
Working on getting normalize_url working.
78
79
        norm_file('path/to/foo', 'path/to/foo')
80
        norm_file('/path/to/foo', '/path/to/foo')
81
        norm_file('path/to/foo', '../path/to/foo')
82
83
        # Local paths are assumed to *not* be escaped at all
1685.1.75 by Wouter van Heyst
more tests handle LANG=C
84
        try:
85
            u'uni/\xb5'.encode(bzrlib.user_encoding)
86
        except UnicodeError:
87
            # locale cannot handle unicode 
88
            pass
89
        else:
90
            norm_file('uni/%C2%B5', u'uni/\xb5')
91
1685.1.51 by John Arbash Meinel
Working on getting normalize_url working.
92
        norm_file('uni/%25C2%25B5', u'uni/%C2%B5')
93
        norm_file('uni/%20b', u'uni/ b')
94
        # All the crazy characters get escaped in local paths => file:/// urls
1711.4.4 by John Arbash Meinel
Fix some broken tests because of stupid ntpath.abspath behavior
95
        # The ' ' character must not be at the end, because on win32
96
        # it gets stripped off by ntpath.abspath
97
        norm_file('%27%20%3B/%3F%3A%40%26%3D%2B%24%2C%23', "' ;/?:@&=+$,#")
1685.1.51 by John Arbash Meinel
Working on getting normalize_url working.
98
99
    def test_normalize_url_hybrid(self):
100
        # Anything with a scheme:// should be treated as a hybrid url
101
        # which changes what characters get escaped.
102
        normalize_url = urlutils.normalize_url
103
104
        eq = self.assertEqual
105
        eq('file:///foo/', normalize_url(u'file:///foo/'))
106
        eq('file:///foo/%20', normalize_url(u'file:///foo/ '))
107
        eq('file:///foo/%20', normalize_url(u'file:///foo/%20'))
108
        # Don't escape reserved characters
109
        eq('file:///ab_c.d-e/%f:?g&h=i+j;k,L#M$',
110
            normalize_url('file:///ab_c.d-e/%f:?g&h=i+j;k,L#M$'))
111
        eq('http://ab_c.d-e/%f:?g&h=i+j;k,L#M$',
112
            normalize_url('http://ab_c.d-e/%f:?g&h=i+j;k,L#M$'))
113
114
        # Escape unicode characters, but not already escaped chars
115
        eq('http://host/ab/%C2%B5/%C2%B5',
116
            normalize_url(u'http://host/ab/%C2%B5/\xb5'))
117
2208.4.1 by Andrew Bennetts
normalize_url should normalise escaping of unreserved characters, like '~'.
118
        # Unescape characters that don't need to be escaped
119
        eq('http://host/~bob%2525-._',
120
                normalize_url('http://host/%7Ebob%2525%2D%2E%5F'))
121
        eq('http://host/~bob%2525-._',
122
                normalize_url(u'http://host/%7Ebob%2525%2D%2E%5F'))
123
1685.1.51 by John Arbash Meinel
Working on getting normalize_url working.
124
        # Normalize verifies URLs when they are not unicode
125
        # (indicating they did not come from the user)
126
        self.assertRaises(InvalidURL, normalize_url, 'http://host/\xb5')
127
        self.assertRaises(InvalidURL, normalize_url, 'http://host/ ')
1685.1.50 by John Arbash Meinel
Added an re for handling scheme paths.
128
129
    def test_url_scheme_re(self):
130
        # Test paths that may be URLs
131
        def test_one(url, scheme_and_path):
132
            """Assert that _url_scheme_re correctly matches
133
134
            :param scheme_and_path: The (scheme, path) that should be matched
135
                can be None, to indicate it should not match
136
            """
137
            m = urlutils._url_scheme_re.match(url)
138
            if scheme_and_path is None:
139
                self.assertEqual(None, m)
140
            else:
141
                self.assertEqual(scheme_and_path[0], m.group('scheme'))
142
                self.assertEqual(scheme_and_path[1], m.group('path'))
143
144
        # Local paths
145
        test_one('/path', None)
146
        test_one('C:/path', None)
147
        test_one('../path/to/foo', None)
148
        test_one(u'../path/to/fo\xe5', None)
149
150
        # Real URLS
151
        test_one('http://host/path/', ('http', 'host/path/'))
152
        test_one('sftp://host/path/to/foo', ('sftp', 'host/path/to/foo'))
153
        test_one('file:///usr/bin', ('file', '/usr/bin'))
154
        test_one('file:///C:/Windows', ('file', '/C:/Windows'))
155
        test_one('file:///C|/Windows', ('file', '/C|/Windows'))
156
        test_one(u'readonly+sftp://host/path/\xe5', ('readonly+sftp', u'host/path/\xe5'))
157
158
        # Weird stuff
159
        # Can't have slashes or colons in the scheme
160
        test_one('/path/to/://foo', None)
161
        test_one('path:path://foo', None)
162
        # Must have more than one character for scheme
163
        test_one('C://foo', None)
164
        test_one('ab://foo', ('ab', 'foo'))
165
1685.1.49 by John Arbash Meinel
Added bzrlib.urlutils.split and basename + dirname
166
    def test_dirname(self):
167
        # Test bzrlib.urlutils.dirname()
168
        dirname = urlutils.dirname
169
        if sys.platform == 'win32':
170
            self.assertRaises(InvalidURL, dirname, 'file:///path/to/foo')
171
            self.assertEqual('file:///C|/', dirname('file:///C|/foo'))
172
            self.assertEqual('file:///C|/', dirname('file:///C|/'))
173
        else:
174
            self.assertEqual('file:///', dirname('file:///foo'))
175
            self.assertEqual('file:///', dirname('file:///'))
176
177
        self.assertEqual('http://host/path/to', dirname('http://host/path/to/foo'))
178
        self.assertEqual('http://host/path/to', dirname('http://host/path/to/foo/'))
179
        self.assertEqual('http://host/path/to/foo',
180
            dirname('http://host/path/to/foo/', exclude_trailing_slash=False))
181
        self.assertEqual('http://host/', dirname('http://host/path'))
182
        self.assertEqual('http://host/', dirname('http://host/'))
183
        self.assertEqual('http://host', dirname('http://host'))
184
        self.assertEqual('http:///nohost', dirname('http:///nohost/path'))
185
186
        self.assertEqual('random+scheme://user:pass@ahost:port/',
187
            dirname('random+scheme://user:pass@ahost:port/path'))
188
        self.assertEqual('random+scheme://user:pass@ahost:port/',
189
            dirname('random+scheme://user:pass@ahost:port/path/'))
190
        self.assertEqual('random+scheme://user:pass@ahost:port/',
191
            dirname('random+scheme://user:pass@ahost:port/'))
192
193
        # relative paths
194
        self.assertEqual('path/to', dirname('path/to/foo'))
195
        self.assertEqual('path/to', dirname('path/to/foo/'))
196
        self.assertEqual('path/to/foo',
197
            dirname('path/to/foo/', exclude_trailing_slash=False))
198
        self.assertEqual('path/..', dirname('path/../foo'))
199
        self.assertEqual('../path', dirname('../path/foo'))
200
1685.1.55 by John Arbash Meinel
Adding bzrlib.urlutils.join() to handle joining URLs
201
    def test_join(self):
202
        def test(expected, *args):
203
            joined = urlutils.join(*args)
204
            self.assertEqual(expected, joined)
205
206
        # Test relative path joining
2018.5.100 by Andrew Bennetts
Fix IndexError in urlutils.join with 'http://host/a' and '../../b'.
207
        test('foo', 'foo') # relative fragment with nothing is preserved.
1685.1.55 by John Arbash Meinel
Adding bzrlib.urlutils.join() to handle joining URLs
208
        test('foo/bar', 'foo', 'bar')
209
        test('http://foo/bar', 'http://foo', 'bar')
210
        test('http://foo/bar', 'http://foo', '.', 'bar')
211
        test('http://foo/baz', 'http://foo', 'bar', '../baz')
212
        test('http://foo/bar/baz', 'http://foo', 'bar/baz')
213
        test('http://foo/baz', 'http://foo', 'bar/../baz')
2018.5.93 by Andrew Bennetts
Fix another bug in urlutils.join.
214
        test('http://foo/baz', 'http://foo/bar/', '../baz')
1685.1.55 by John Arbash Meinel
Adding bzrlib.urlutils.join() to handle joining URLs
215
216
        # Absolute paths
2018.5.100 by Andrew Bennetts
Fix IndexError in urlutils.join with 'http://host/a' and '../../b'.
217
        test('http://foo', 'http://foo') # abs url with nothing is preserved.
1685.1.55 by John Arbash Meinel
Adding bzrlib.urlutils.join() to handle joining URLs
218
        test('http://bar', 'http://foo', 'http://bar')
219
        test('sftp://bzr/foo', 'http://foo', 'bar', 'sftp://bzr/foo')
220
        test('file:///bar', 'foo', 'file:///bar')
2018.5.92 by Andrew Bennetts
Small bugfix to urlutils.join: join('anything', 'http://bar/a/') should not strip the trailing slash.
221
        test('http://bar/', 'http://foo', 'http://bar/')
222
        test('http://bar/a', 'http://foo', 'http://bar/a')
223
        test('http://bar/a/', 'http://foo', 'http://bar/a/')
1711.2.49 by John Arbash Meinel
urlutils.join should work for root paths.
224
225
        # From a base path
226
        test('file:///foo', 'file:///', 'foo')
227
        test('file:///bar/foo', 'file:///bar/', 'foo')
228
        test('http://host/foo', 'http://host/', 'foo')
229
        test('http://host/', 'http://host', '')
1685.1.55 by John Arbash Meinel
Adding bzrlib.urlutils.join() to handle joining URLs
230
        
231
        # Invalid joinings
232
        # Cannot go above root
2018.5.100 by Andrew Bennetts
Fix IndexError in urlutils.join with 'http://host/a' and '../../b'.
233
        # Implicitly at root:
1685.1.55 by John Arbash Meinel
Adding bzrlib.urlutils.join() to handle joining URLs
234
        self.assertRaises(InvalidURLJoin, urlutils.join,
235
                'http://foo', '../baz')
2018.5.54 by Andrew Bennetts
Fix ChrootTransportDecorator's abspath method to be consistent with its clone
236
        self.assertRaises(InvalidURLJoin, urlutils.join,
237
                'http://foo', '/..')
2018.5.100 by Andrew Bennetts
Fix IndexError in urlutils.join with 'http://host/a' and '../../b'.
238
        # Joining from a path explicitly under the root.
239
        self.assertRaises(InvalidURLJoin, urlutils.join,
240
                'http://foo/a', '../../b')
2379.1.1 by Robert Collins
urlutils improvements from hpss.
241
2018.5.46 by Andrew Bennetts
Fix ChrootTransportDecorator's clone to pass less surprising offsets to the decorated transport's clone.
242
    def test_joinpath(self):
243
        def test(expected, *args):
244
            joined = urlutils.joinpath(*args)
245
            self.assertEqual(expected, joined)
246
247
        # Test a single element
248
        test('foo', 'foo')
249
250
        # Test relative path joining
251
        test('foo/bar', 'foo', 'bar')
252
        test('foo/bar', 'foo', '.', 'bar')
253
        test('foo/baz', 'foo', 'bar', '../baz')
254
        test('foo/bar/baz', 'foo', 'bar/baz')
255
        test('foo/baz', 'foo', 'bar/../baz')
256
257
        # Test joining to an absolute path
258
        test('/foo', '/foo')
259
        test('/foo', '/foo', '.')
260
        test('/foo/bar', '/foo', 'bar')
261
        test('/', '/foo', '..')
262
263
        # Test joining with an absolute path
264
        test('/bar', 'foo', '/bar')
2018.5.53 by Andrew Bennetts
Small fix to urlutils.joinpath that was causing a misbehaviour in
265
266
        # Test joining to a path with a trailing slash
267
        test('foo/bar', 'foo/', 'bar')
2018.5.46 by Andrew Bennetts
Fix ChrootTransportDecorator's clone to pass less surprising offsets to the decorated transport's clone.
268
        
269
        # Invalid joinings
270
        # Cannot go above root
271
        self.assertRaises(InvalidURLJoin, urlutils.joinpath, '/', '../baz')
2018.5.54 by Andrew Bennetts
Fix ChrootTransportDecorator's abspath method to be consistent with its clone
272
        self.assertRaises(InvalidURLJoin, urlutils.joinpath, '/', '..')
273
        self.assertRaises(InvalidURLJoin, urlutils.joinpath, '/', '/..')
2018.5.46 by Andrew Bennetts
Fix ChrootTransportDecorator's clone to pass less surprising offsets to the decorated transport's clone.
274
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
275
    def test_function_type(self):
276
        if sys.platform == 'win32':
277
            self.assertEqual(urlutils._win32_local_path_to_url, urlutils.local_path_to_url)
278
            self.assertEqual(urlutils._win32_local_path_from_url, urlutils.local_path_from_url)
279
        else:
280
            self.assertEqual(urlutils._posix_local_path_to_url, urlutils.local_path_to_url)
281
            self.assertEqual(urlutils._posix_local_path_from_url, urlutils.local_path_from_url)
282
283
    def test_posix_local_path_to_url(self):
284
        to_url = urlutils._posix_local_path_to_url
285
        self.assertEqual('file:///path/to/foo',
286
            to_url('/path/to/foo'))
1685.1.75 by Wouter van Heyst
more tests handle LANG=C
287
288
        try:
289
            result = to_url(u'/path/to/r\xe4ksm\xf6rg\xe5s')
290
        except UnicodeError:
291
            raise TestSkipped("local encoding cannot handle unicode")
292
293
        self.assertEqual('file:///path/to/r%C3%A4ksm%C3%B6rg%C3%A5s', result)
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
294
295
    def test_posix_local_path_from_url(self):
296
        from_url = urlutils._posix_local_path_from_url
297
        self.assertEqual('/path/to/foo',
298
            from_url('file:///path/to/foo'))
299
        self.assertEqual(u'/path/to/r\xe4ksm\xf6rg\xe5s',
300
            from_url('file:///path/to/r%C3%A4ksm%C3%B6rg%C3%A5s'))
301
        self.assertEqual(u'/path/to/r\xe4ksm\xf6rg\xe5s',
302
            from_url('file:///path/to/r%c3%a4ksm%c3%b6rg%c3%a5s'))
303
304
        self.assertRaises(InvalidURL, from_url, '/path/to/foo')
305
306
    def test_win32_local_path_to_url(self):
307
        to_url = urlutils._win32_local_path_to_url
1711.4.28 by John Arbash Meinel
Update the test suite for Alexander's patch.
308
        self.assertEqual('file:///C:/path/to/foo',
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
309
            to_url('C:/path/to/foo'))
1711.4.4 by John Arbash Meinel
Fix some broken tests because of stupid ntpath.abspath behavior
310
        # BOGUS: on win32, ntpath.abspath will strip trailing
311
        #       whitespace, so this will always fail
312
        #       Though under linux, it fakes abspath support
313
        #       and thus will succeed
314
        # self.assertEqual('file:///C:/path/to/foo%20',
315
        #     to_url('C:/path/to/foo '))
1711.4.28 by John Arbash Meinel
Update the test suite for Alexander's patch.
316
        self.assertEqual('file:///C:/path/to/f%20oo',
1711.4.4 by John Arbash Meinel
Fix some broken tests because of stupid ntpath.abspath behavior
317
            to_url('C:/path/to/f oo'))
1685.1.75 by Wouter van Heyst
more tests handle LANG=C
318
319
        try:
320
            result = to_url(u'd:/path/to/r\xe4ksm\xf6rg\xe5s')
321
        except UnicodeError:
322
            raise TestSkipped("local encoding cannot handle unicode")
323
1711.4.28 by John Arbash Meinel
Update the test suite for Alexander's patch.
324
        self.assertEqual('file:///D:/path/to/r%C3%A4ksm%C3%B6rg%C3%A5s', result)
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
325
2162.2.1 by Alexander Belchenko
Testing UNC path conversion
326
    def test_win32_unc_path_to_url(self):
327
        to_url = urlutils._win32_local_path_to_url
2162.2.6 by Alexander Belchenko
Change tests for win32 UNC path to new file://HOST/path scheme
328
        self.assertEqual('file://HOST/path',
2162.2.1 by Alexander Belchenko
Testing UNC path conversion
329
            to_url(r'\\HOST\path'))
2162.2.6 by Alexander Belchenko
Change tests for win32 UNC path to new file://HOST/path scheme
330
        self.assertEqual('file://HOST/path',
2162.2.1 by Alexander Belchenko
Testing UNC path conversion
331
            to_url('//HOST/path'))
332
2162.2.5 by Alexander Belchenko
Expand test_win32_unc_path_to_url to check unicode
333
        try:
334
            result = to_url(u'//HOST/path/to/r\xe4ksm\xf6rg\xe5s')
335
        except UnicodeError:
336
            raise TestSkipped("local encoding cannot handle unicode")
337
2162.2.6 by Alexander Belchenko
Change tests for win32 UNC path to new file://HOST/path scheme
338
        self.assertEqual('file://HOST/path/to/r%C3%A4ksm%C3%B6rg%C3%A5s', result)
2162.2.5 by Alexander Belchenko
Expand test_win32_unc_path_to_url to check unicode
339
340
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
341
    def test_win32_local_path_from_url(self):
342
        from_url = urlutils._win32_local_path_from_url
1711.4.28 by John Arbash Meinel
Update the test suite for Alexander's patch.
343
        self.assertEqual('C:/path/to/foo',
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
344
            from_url('file:///C|/path/to/foo'))
1711.4.28 by John Arbash Meinel
Update the test suite for Alexander's patch.
345
        self.assertEqual(u'D:/path/to/r\xe4ksm\xf6rg\xe5s',
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
346
            from_url('file:///d|/path/to/r%C3%A4ksm%C3%B6rg%C3%A5s'))
1711.4.28 by John Arbash Meinel
Update the test suite for Alexander's patch.
347
        self.assertEqual(u'D:/path/to/r\xe4ksm\xf6rg\xe5s',
1685.1.79 by Wouter van Heyst
cleanup urlutils
348
            from_url('file:///d:/path/to/r%c3%a4ksm%c3%b6rg%c3%a5s'))
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
349
350
        self.assertRaises(InvalidURL, from_url, '/path/to/foo')
351
        # Not a valid _win32 url, no drive letter
352
        self.assertRaises(InvalidURL, from_url, 'file:///path/to/foo')
353
2162.2.1 by Alexander Belchenko
Testing UNC path conversion
354
    def test_win32_unc_path_from_url(self):
355
        from_url = urlutils._win32_local_path_from_url
2162.2.6 by Alexander Belchenko
Change tests for win32 UNC path to new file://HOST/path scheme
356
        self.assertEqual('//HOST/path', from_url('file://HOST/path'))
357
        # despite IE allows 2, 4, 5 and 6 slashes in URL to another machine
358
        # we want to use only 2 slashes
359
        # Firefox understand only 5 slashes in URL, but it's ugly
2162.2.1 by Alexander Belchenko
Testing UNC path conversion
360
        self.assertRaises(InvalidURL, from_url, 'file:////HOST/path')
2162.2.6 by Alexander Belchenko
Change tests for win32 UNC path to new file://HOST/path scheme
361
        self.assertRaises(InvalidURL, from_url, 'file://///HOST/path')
2162.2.1 by Alexander Belchenko
Testing UNC path conversion
362
        self.assertRaises(InvalidURL, from_url, 'file://////HOST/path')
2162.2.6 by Alexander Belchenko
Change tests for win32 UNC path to new file://HOST/path scheme
363
        # check for file://C:/ instead of file:///C:/
364
        self.assertRaises(InvalidURL, from_url, 'file://C:/path')
2162.2.1 by Alexander Belchenko
Testing UNC path conversion
365
2162.2.6 by Alexander Belchenko
Change tests for win32 UNC path to new file://HOST/path scheme
366
    def test_win32_extract_drive_letter(self):
1711.2.43 by John Arbash Meinel
Split out win32 specific code so that it can be tested on all platforms.
367
        extract = urlutils._win32_extract_drive_letter
368
        self.assertEqual(('file:///C:', '/foo'), extract('file://', '/C:/foo'))
369
        self.assertEqual(('file:///d|', '/path'), extract('file://', '/d|/path'))
370
        self.assertRaises(InvalidURL, extract, 'file://', '/path')
371
1685.1.49 by John Arbash Meinel
Added bzrlib.urlutils.split and basename + dirname
372
    def test_split(self):
373
        # Test bzrlib.urlutils.split()
374
        split = urlutils.split
375
        if sys.platform == 'win32':
376
            self.assertRaises(InvalidURL, split, 'file:///path/to/foo')
377
            self.assertEqual(('file:///C|/', 'foo'), split('file:///C|/foo'))
1685.1.79 by Wouter van Heyst
cleanup urlutils
378
            self.assertEqual(('file:///C:/', ''), split('file:///C:/'))
1685.1.49 by John Arbash Meinel
Added bzrlib.urlutils.split and basename + dirname
379
        else:
380
            self.assertEqual(('file:///', 'foo'), split('file:///foo'))
381
            self.assertEqual(('file:///', ''), split('file:///'))
382
383
        self.assertEqual(('http://host/path/to', 'foo'), split('http://host/path/to/foo'))
384
        self.assertEqual(('http://host/path/to', 'foo'), split('http://host/path/to/foo/'))
385
        self.assertEqual(('http://host/path/to/foo', ''),
386
            split('http://host/path/to/foo/', exclude_trailing_slash=False))
387
        self.assertEqual(('http://host/', 'path'), split('http://host/path'))
388
        self.assertEqual(('http://host/', ''), split('http://host/'))
389
        self.assertEqual(('http://host', ''), split('http://host'))
390
        self.assertEqual(('http:///nohost', 'path'), split('http:///nohost/path'))
391
392
        self.assertEqual(('random+scheme://user:pass@ahost:port/', 'path'),
393
            split('random+scheme://user:pass@ahost:port/path'))
394
        self.assertEqual(('random+scheme://user:pass@ahost:port/', 'path'),
395
            split('random+scheme://user:pass@ahost:port/path/'))
396
        self.assertEqual(('random+scheme://user:pass@ahost:port/', ''),
397
            split('random+scheme://user:pass@ahost:port/'))
398
399
        # relative paths
400
        self.assertEqual(('path/to', 'foo'), split('path/to/foo'))
401
        self.assertEqual(('path/to', 'foo'), split('path/to/foo/'))
402
        self.assertEqual(('path/to/foo', ''),
403
            split('path/to/foo/', exclude_trailing_slash=False))
404
        self.assertEqual(('path/..', 'foo'), split('path/../foo'))
405
        self.assertEqual(('../path', 'foo'), split('../path/foo'))
406
2162.2.6 by Alexander Belchenko
Change tests for win32 UNC path to new file://HOST/path scheme
407
    def test_win32_strip_local_trailing_slash(self):
1711.2.44 by John Arbash Meinel
Factor out another win32 special case and add platform independent tests for it.
408
        strip = urlutils._win32_strip_local_trailing_slash
409
        self.assertEqual('file://', strip('file://'))
410
        self.assertEqual('file:///', strip('file:///'))
411
        self.assertEqual('file:///C', strip('file:///C'))
412
        self.assertEqual('file:///C:', strip('file:///C:'))
413
        self.assertEqual('file:///d|', strip('file:///d|'))
414
        self.assertEqual('file:///C:/', strip('file:///C:/'))
415
        self.assertEqual('file:///C:/a', strip('file:///C:/a/'))
416
1685.1.48 by John Arbash Meinel
Updated strip_trailing_slash to support lots more url stuff, added tests
417
    def test_strip_trailing_slash(self):
418
        sts = urlutils.strip_trailing_slash
419
        if sys.platform == 'win32':
420
            self.assertEqual('file:///C|/', sts('file:///C|/'))
1685.1.79 by Wouter van Heyst
cleanup urlutils
421
            self.assertEqual('file:///C:/foo', sts('file:///C:/foo'))
1685.1.48 by John Arbash Meinel
Updated strip_trailing_slash to support lots more url stuff, added tests
422
            self.assertEqual('file:///C|/foo', sts('file:///C|/foo/'))
423
        else:
424
            self.assertEqual('file:///', sts('file:///'))
425
            self.assertEqual('file:///foo', sts('file:///foo'))
426
            self.assertEqual('file:///foo', sts('file:///foo/'))
427
428
        self.assertEqual('http://host/', sts('http://host/'))
429
        self.assertEqual('http://host/foo', sts('http://host/foo'))
430
        self.assertEqual('http://host/foo', sts('http://host/foo/'))
431
432
        # No need to fail just because the slash is missing
433
        self.assertEqual('http://host', sts('http://host'))
434
        # TODO: jam 20060502 Should this raise InvalidURL?
435
        self.assertEqual('file://', sts('file://'))
436
437
        self.assertEqual('random+scheme://user:pass@ahost:port/path',
438
            sts('random+scheme://user:pass@ahost:port/path'))
439
        self.assertEqual('random+scheme://user:pass@ahost:port/path',
440
            sts('random+scheme://user:pass@ahost:port/path/'))
441
        self.assertEqual('random+scheme://user:pass@ahost:port/',
442
            sts('random+scheme://user:pass@ahost:port/'))
443
444
        # Make sure relative paths work too
445
        self.assertEqual('path/to/foo', sts('path/to/foo'))
446
        self.assertEqual('path/to/foo', sts('path/to/foo/'))
447
        self.assertEqual('../to/foo', sts('../to/foo/'))
448
        self.assertEqual('path/../foo', sts('path/../foo/'))
449
1685.1.54 by John Arbash Meinel
url_for_display now makes sure output can be properly encoded.
450
    def test_unescape_for_display_utf8(self):
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
451
        # Test that URLs are converted to nice unicode strings for display
1685.1.54 by John Arbash Meinel
url_for_display now makes sure output can be properly encoded.
452
        def test(expected, url, encoding='utf-8'):
453
            disp_url = urlutils.unescape_for_display(url, encoding=encoding)
1685.1.58 by Martin Pool
urlutils.unescape_for_display should return Unicode
454
            self.assertIsInstance(disp_url, unicode)
1685.1.54 by John Arbash Meinel
url_for_display now makes sure output can be properly encoded.
455
            self.assertEqual(expected, disp_url)
1685.1.79 by Wouter van Heyst
cleanup urlutils
456
1685.1.54 by John Arbash Meinel
url_for_display now makes sure output can be properly encoded.
457
        test('http://foo', 'http://foo')
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
458
        if sys.platform == 'win32':
1711.7.13 by John Arbash Meinel
Fix expected value for urlutils tests
459
            test('C:/foo/path', 'file:///C|/foo/path')
460
            test('C:/foo/path', 'file:///C:/foo/path')
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
461
        else:
1685.1.54 by John Arbash Meinel
url_for_display now makes sure output can be properly encoded.
462
            test('/foo/path', 'file:///foo/path')
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
463
1685.1.54 by John Arbash Meinel
url_for_display now makes sure output can be properly encoded.
464
        test('http://foo/%2Fbaz', 'http://foo/%2Fbaz')
1685.1.58 by Martin Pool
urlutils.unescape_for_display should return Unicode
465
        test(u'http://host/r\xe4ksm\xf6rg\xe5s',
466
             'http://host/r%C3%A4ksm%C3%B6rg%C3%A5s')
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
467
468
        # Make sure special escaped characters stay escaped
1685.1.54 by John Arbash Meinel
url_for_display now makes sure output can be properly encoded.
469
        test(u'http://host/%3B%2F%3F%3A%40%26%3D%2B%24%2C%23',
1685.1.58 by Martin Pool
urlutils.unescape_for_display should return Unicode
470
             'http://host/%3B%2F%3F%3A%40%26%3D%2B%24%2C%23')
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
471
472
        # Can we handle sections that don't have utf-8 encoding?
1685.1.58 by Martin Pool
urlutils.unescape_for_display should return Unicode
473
        test(u'http://host/%EE%EE%EE/r\xe4ksm\xf6rg\xe5s',
474
             'http://host/%EE%EE%EE/r%C3%A4ksm%C3%B6rg%C3%A5s')
1685.1.54 by John Arbash Meinel
url_for_display now makes sure output can be properly encoded.
475
476
        # Test encoding into output that can handle some characters
1685.1.58 by Martin Pool
urlutils.unescape_for_display should return Unicode
477
        test(u'http://host/%EE%EE%EE/r\xe4ksm\xf6rg\xe5s',
478
             'http://host/%EE%EE%EE/r%C3%A4ksm%C3%B6rg%C3%A5s',
479
             encoding='iso-8859-1')
480
481
        # This one can be encoded into utf8
482
        test(u'http://host/\u062c\u0648\u062c\u0648',
483
             'http://host/%d8%ac%d9%88%d8%ac%d9%88',
484
             encoding='utf-8')
485
486
        # This can't be put into 8859-1 and so stays as escapes
487
        test(u'http://host/%d8%ac%d9%88%d8%ac%d9%88',
488
             'http://host/%d8%ac%d9%88%d8%ac%d9%88',
489
             encoding='iso-8859-1')
1685.1.45 by John Arbash Meinel
Moved url functions into bzrlib.urlutils
490
491
    def test_escape(self):
492
        self.assertEqual('%25', urlutils.escape('%'))
493
        self.assertEqual('%C3%A5', urlutils.escape(u'\xe5'))
494
495
    def test_unescape(self):
496
        self.assertEqual('%', urlutils.unescape('%25'))
497
        self.assertEqual(u'\xe5', urlutils.unescape('%C3%A5'))
498
499
        self.assertRaises(InvalidURL, urlutils.unescape, u'\xe5')
500
        self.assertRaises(InvalidURL, urlutils.unescape, '\xe5')
501
        self.assertRaises(InvalidURL, urlutils.unescape, '%E5')
502
503
    def test_escape_unescape(self):
504
        self.assertEqual(u'\xe5', urlutils.unescape(urlutils.escape(u'\xe5')))
505
        self.assertEqual('%', urlutils.unescape(urlutils.escape('%')))
506
1685.1.70 by Wouter van Heyst
working on get_parent, set_parent and relative urls, broken
507
    def test_relative_url(self):
508
        def test(expected, base, other):
509
            result = urlutils.relative_url(base, other)
510
            self.assertEqual(expected, result)
511
            
512
        test('a', 'http://host/', 'http://host/a')
1685.1.71 by Wouter van Heyst
change branch.{get,set}_parent to store a relative path but return full urls
513
        test('http://entirely/different', 'sftp://host/branch',
514
                    'http://entirely/different')
515
        test('../person/feature', 'http://host/branch/mainline',
516
                    'http://host/branch/person/feature')
1685.1.70 by Wouter van Heyst
working on get_parent, set_parent and relative urls, broken
517
        test('..', 'http://host/branch', 'http://host/')
518
        test('http://host2/branch', 'http://host1/branch', 'http://host2/branch')
1685.1.71 by Wouter van Heyst
change branch.{get,set}_parent to store a relative path but return full urls
519
        test('.', 'http://host1/branch', 'http://host1/branch')
520
        test('../../../branch/2b', 'file:///home/jelmer/foo/bar/2b',
521
                    'file:///home/jelmer/branch/2b')
522
        test('../../branch/2b', 'sftp://host/home/jelmer/bar/2b',
523
                    'sftp://host/home/jelmer/branch/2b')
1685.1.79 by Wouter van Heyst
cleanup urlutils
524
        test('../../branch/feature/%2b', 'http://host/home/jelmer/bar/%2b',
525
                    'http://host/home/jelmer/branch/feature/%2b')
1685.1.71 by Wouter van Heyst
change branch.{get,set}_parent to store a relative path but return full urls
526
        test('../../branch/feature/2b', 'http://host/home/jelmer/bar/2b/', 
527
                    'http://host/home/jelmer/branch/feature/2b')
528
        # relative_url should preserve a trailing slash
529
        test('../../branch/feature/2b/', 'http://host/home/jelmer/bar/2b/',
530
                    'http://host/home/jelmer/branch/feature/2b/')
531
        test('../../branch/feature/2b/', 'http://host/home/jelmer/bar/2b',
532
                    'http://host/home/jelmer/branch/feature/2b/')
533
534
        # TODO: treat http://host as http://host/
535
        #       relative_url is typically called from a branch.base or
536
        #       transport.base which always ends with a /
537
        #test('a', 'http://host', 'http://host/a')
538
        test('http://host/a', 'http://host', 'http://host/a')
539
        #test('.', 'http://host', 'http://host/')
540
        test('http://host/', 'http://host', 'http://host/')
541
        #test('.', 'http://host/', 'http://host')
542
        test('http://host', 'http://host/', 'http://host')
1830.3.13 by John Arbash Meinel
Add a test that urlutils creates normalized paths
543
544
545
class TestCwdToURL(TestCaseInTempDir):
546
    """Test that local_path_to_url works base on the cwd"""
547
548
    def test_dot(self):
549
        # This test will fail if getcwd is not ascii
1830.3.17 by John Arbash Meinel
list_files() with wrong normalized_filename code raises exceptions. Fix this
550
        os.mkdir('mytest')
551
        os.chdir('mytest')
1830.3.13 by John Arbash Meinel
Add a test that urlutils creates normalized paths
552
553
        url = urlutils.local_path_to_url('.')
1830.3.17 by John Arbash Meinel
list_files() with wrong normalized_filename code raises exceptions. Fix this
554
        self.assertEndsWith(url, '/mytest')
1830.3.13 by John Arbash Meinel
Add a test that urlutils creates normalized paths
555
556
    def test_non_ascii(self):
2279.4.2 by Alexander Belchenko
Don't do normpath after abspath, because this function is called inside abspath
557
        if win32utils.winver == 'Windows 98':
558
            raise TestSkipped('Windows 98 cannot handle unicode filenames')
559
1830.3.13 by John Arbash Meinel
Add a test that urlutils creates normalized paths
560
        try:
561
            os.mkdir(u'dod\xe9')
562
        except UnicodeError:
563
            raise TestSkipped('cannot create unicode directory')
564
565
        os.chdir(u'dod\xe9')
566
567
        # On Mac OSX this directory is actually: 
568
        #   u'/dode\u0301' => '/dode\xcc\x81
569
        # but we should normalize it back to 
570
        #   u'/dod\xe9' => '/dod\xc3\xa9'
571
        url = urlutils.local_path_to_url('.')
572
        self.assertEndsWith(url, '/dod%C3%A9')
2512.4.1 by Ian Clatworthy
Fixes #115491 - 'branch lp:projname' now creates ./projname as exected
573
574
575
class TestDeriveToLocation(TestCase):
576
    """Test that the mapping of FROM_LOCATION to TO_LOCATION works."""
577
578
    def test_to_locations_derived_from_paths(self):
579
        derive = urlutils.derive_to_location
580
        self.assertEqual("bar", derive("bar"))
581
        self.assertEqual("bar", derive("../bar"))
582
        self.assertEqual("bar", derive("/foo/bar"))
583
        self.assertEqual("bar", derive("c:/foo/bar"))
584
        self.assertEqual("bar", derive("c:bar"))
585
586
    def test_to_locations_derived_from_urls(self):
587
        derive = urlutils.derive_to_location
588
        self.assertEqual("bar", derive("http://foo/bar"))
589
        self.assertEqual("bar", derive("bzr+ssh://foo/bar"))
590
        self.assertEqual("foo-bar", derive("lp:foo-bar"))