1
# Copyright (C) 2006-2012, 2015 Canonical Ltd
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11
# GNU General Public License for more details.
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17
"""Tests for the urlutils wrapper."""
22
from bzrlib import osutils, urlutils, win32utils
23
from bzrlib.errors import (
29
from bzrlib.tests import features, TestCaseInTempDir, TestCase, TestSkipped
32
class TestUrlToPath(TestCase):
34
def test_basename(self):
35
# bzrlib.urlutils.basename
36
# Test bzrlib.urlutils.split()
37
basename = urlutils.basename
38
if sys.platform == 'win32':
39
self.assertRaises(InvalidURL, basename, 'file:///path/to/foo')
40
self.assertEqual('foo', basename('file:///C|/foo'))
41
self.assertEqual('foo', basename('file:///C:/foo'))
42
self.assertEqual('', basename('file:///C:/'))
44
self.assertEqual('foo', basename('file:///foo'))
45
self.assertEqual('', basename('file:///'))
47
self.assertEqual('foo', basename('http://host/path/to/foo'))
48
self.assertEqual('foo', basename('http://host/path/to/foo/'))
50
basename('http://host/path/to/foo/', exclude_trailing_slash=False))
51
self.assertEqual('path', basename('http://host/path'))
52
self.assertEqual('', basename('http://host/'))
53
self.assertEqual('', basename('http://host'))
54
self.assertEqual('path', basename('http:///nohost/path'))
56
self.assertEqual('path', basename('random+scheme://user:pass@ahost:port/path'))
57
self.assertEqual('path', basename('random+scheme://user:pass@ahost:port/path/'))
58
self.assertEqual('', basename('random+scheme://user:pass@ahost:port/'))
61
self.assertEqual('foo', basename('path/to/foo'))
62
self.assertEqual('foo', basename('path/to/foo/'))
63
self.assertEqual('', basename('path/to/foo/',
64
exclude_trailing_slash=False))
65
self.assertEqual('foo', basename('path/../foo'))
66
self.assertEqual('foo', basename('../path/foo'))
68
def test_normalize_url_files(self):
69
# Test that local paths are properly normalized
70
normalize_url = urlutils.normalize_url
72
def norm_file(expected, path):
73
url = normalize_url(path)
74
self.assertStartsWith(url, 'file:///')
75
if sys.platform == 'win32':
76
url = url[len('file:///C:'):]
78
url = url[len('file://'):]
80
self.assertEndsWith(url, expected)
82
norm_file('path/to/foo', 'path/to/foo')
83
norm_file('/path/to/foo', '/path/to/foo')
84
norm_file('path/to/foo', '../path/to/foo')
86
# Local paths are assumed to *not* be escaped at all
88
u'uni/\xb5'.encode(osutils.get_user_encoding())
90
# locale cannot handle unicode
93
norm_file('uni/%C2%B5', u'uni/\xb5')
95
norm_file('uni/%25C2%25B5', u'uni/%C2%B5')
96
norm_file('uni/%20b', u'uni/ b')
97
# All the crazy characters get escaped in local paths => file:/// urls
98
# The ' ' character must not be at the end, because on win32
99
# it gets stripped off by ntpath.abspath
100
norm_file('%27%20%3B/%3F%3A%40%26%3D%2B%24%2C%23', "' ;/?:@&=+$,#")
102
def test_normalize_url_hybrid(self):
103
# Anything with a scheme:// should be treated as a hybrid url
104
# which changes what characters get escaped.
105
normalize_url = urlutils.normalize_url
107
eq = self.assertEqual
108
eq('file:///foo/', normalize_url(u'file:///foo/'))
109
eq('file:///foo/%20', normalize_url(u'file:///foo/ '))
110
eq('file:///foo/%20', normalize_url(u'file:///foo/%20'))
111
# Don't escape reserved characters
112
eq('file:///ab_c.d-e/%f:?g&h=i+j;k,L#M$',
113
normalize_url('file:///ab_c.d-e/%f:?g&h=i+j;k,L#M$'))
114
eq('http://ab_c.d-e/%f:?g&h=i+j;k,L#M$',
115
normalize_url('http://ab_c.d-e/%f:?g&h=i+j;k,L#M$'))
117
# Escape unicode characters, but not already escaped chars
118
eq('http://host/ab/%C2%B5/%C2%B5',
119
normalize_url(u'http://host/ab/%C2%B5/\xb5'))
121
# Unescape characters that don't need to be escaped
122
eq('http://host/~bob%2525-._',
123
normalize_url('http://host/%7Ebob%2525%2D%2E%5F'))
124
eq('http://host/~bob%2525-._',
125
normalize_url(u'http://host/%7Ebob%2525%2D%2E%5F'))
127
# Normalize verifies URLs when they are not unicode
128
# (indicating they did not come from the user)
129
self.assertRaises(InvalidURL, normalize_url, 'http://host/\xb5')
130
self.assertRaises(InvalidURL, normalize_url, 'http://host/ ')
132
def test_url_scheme_re(self):
133
# Test paths that may be URLs
134
def test_one(url, scheme_and_path):
135
"""Assert that _url_scheme_re correctly matches
137
:param scheme_and_path: The (scheme, path) that should be matched
138
can be None, to indicate it should not match
140
m = urlutils._url_scheme_re.match(url)
141
if scheme_and_path is None:
142
self.assertEqual(None, m)
144
self.assertEqual(scheme_and_path[0], m.group('scheme'))
145
self.assertEqual(scheme_and_path[1], m.group('path'))
148
test_one('/path', None)
149
test_one('C:/path', None)
150
test_one('../path/to/foo', None)
151
test_one(u'../path/to/fo\xe5', None)
154
test_one('http://host/path/', ('http', 'host/path/'))
155
test_one('sftp://host/path/to/foo', ('sftp', 'host/path/to/foo'))
156
test_one('file:///usr/bin', ('file', '/usr/bin'))
157
test_one('file:///C:/Windows', ('file', '/C:/Windows'))
158
test_one('file:///C|/Windows', ('file', '/C|/Windows'))
159
test_one(u'readonly+sftp://host/path/\xe5', ('readonly+sftp', u'host/path/\xe5'))
162
# Can't have slashes or colons in the scheme
163
test_one('/path/to/://foo', None)
164
test_one('scheme:stuff://foo', ('scheme', 'stuff://foo'))
165
# Must have more than one character for scheme
166
test_one('C://foo', None)
167
test_one('ab://foo', ('ab', 'foo'))
169
def test_dirname(self):
170
# Test bzrlib.urlutils.dirname()
171
dirname = urlutils.dirname
172
if sys.platform == 'win32':
173
self.assertRaises(InvalidURL, dirname, 'file:///path/to/foo')
174
self.assertEqual('file:///C|/', dirname('file:///C|/foo'))
175
self.assertEqual('file:///C|/', dirname('file:///C|/'))
177
self.assertEqual('file:///', dirname('file:///foo'))
178
self.assertEqual('file:///', dirname('file:///'))
180
self.assertEqual('http://host/path/to', dirname('http://host/path/to/foo'))
181
self.assertEqual('http://host/path/to', dirname('http://host/path/to/foo/'))
182
self.assertEqual('http://host/path/to/foo',
183
dirname('http://host/path/to/foo/', exclude_trailing_slash=False))
184
self.assertEqual('http://host/', dirname('http://host/path'))
185
self.assertEqual('http://host/', dirname('http://host/'))
186
self.assertEqual('http://host', dirname('http://host'))
187
self.assertEqual('http:///nohost', dirname('http:///nohost/path'))
189
self.assertEqual('random+scheme://user:pass@ahost:port/',
190
dirname('random+scheme://user:pass@ahost:port/path'))
191
self.assertEqual('random+scheme://user:pass@ahost:port/',
192
dirname('random+scheme://user:pass@ahost:port/path/'))
193
self.assertEqual('random+scheme://user:pass@ahost:port/',
194
dirname('random+scheme://user:pass@ahost:port/'))
197
self.assertEqual('path/to', dirname('path/to/foo'))
198
self.assertEqual('path/to', dirname('path/to/foo/'))
199
self.assertEqual('path/to/foo',
200
dirname('path/to/foo/', exclude_trailing_slash=False))
201
self.assertEqual('path/..', dirname('path/../foo'))
202
self.assertEqual('../path', dirname('../path/foo'))
204
def test_is_url(self):
205
self.assertTrue(urlutils.is_url('http://foo/bar'))
206
self.assertTrue(urlutils.is_url('bzr+ssh://foo/bar'))
207
self.assertTrue(urlutils.is_url('lp:foo/bar'))
208
self.assertTrue(urlutils.is_url('file:///foo/bar'))
209
self.assertFalse(urlutils.is_url(''))
210
self.assertFalse(urlutils.is_url('foo'))
211
self.assertFalse(urlutils.is_url('foo/bar'))
212
self.assertFalse(urlutils.is_url('/foo'))
213
self.assertFalse(urlutils.is_url('/foo/bar'))
214
self.assertFalse(urlutils.is_url('C:/'))
215
self.assertFalse(urlutils.is_url('C:/foo'))
216
self.assertFalse(urlutils.is_url('C:/foo/bar'))
219
def test(expected, *args):
220
joined = urlutils.join(*args)
221
self.assertEqual(expected, joined)
223
# Test relative path joining
224
test('foo', 'foo') # relative fragment with nothing is preserved.
225
test('foo/bar', 'foo', 'bar')
226
test('http://foo/bar', 'http://foo', 'bar')
227
test('http://foo/bar', 'http://foo', '.', 'bar')
228
test('http://foo/baz', 'http://foo', 'bar', '../baz')
229
test('http://foo/bar/baz', 'http://foo', 'bar/baz')
230
test('http://foo/baz', 'http://foo', 'bar/../baz')
231
test('http://foo/baz', 'http://foo/bar/', '../baz')
232
test('lp:foo/bar', 'lp:foo', 'bar')
233
test('lp:foo/bar/baz', 'lp:foo', 'bar/baz')
236
test('http://foo', 'http://foo') # abs url with nothing is preserved.
237
test('http://bar', 'http://foo', 'http://bar')
238
test('sftp://bzr/foo', 'http://foo', 'bar', 'sftp://bzr/foo')
239
test('file:///bar', 'foo', 'file:///bar')
240
test('http://bar/', 'http://foo', 'http://bar/')
241
test('http://bar/a', 'http://foo', 'http://bar/a')
242
test('http://bar/a/', 'http://foo', 'http://bar/a/')
243
test('lp:bar', 'http://foo', 'lp:bar')
244
test('lp:bar', 'lp:foo', 'lp:bar')
245
test('file:///stuff', 'lp:foo', 'file:///stuff')
248
test('file:///foo', 'file:///', 'foo')
249
test('file:///bar/foo', 'file:///bar/', 'foo')
250
test('http://host/foo', 'http://host/', 'foo')
251
test('http://host/', 'http://host', '')
254
# Cannot go above root
255
# Implicitly at root:
256
self.assertRaises(InvalidURLJoin, urlutils.join,
257
'http://foo', '../baz')
258
self.assertRaises(InvalidURLJoin, urlutils.join,
260
# Joining from a path explicitly under the root.
261
self.assertRaises(InvalidURLJoin, urlutils.join,
262
'http://foo/a', '../../b')
264
def test_joinpath(self):
265
def test(expected, *args):
266
joined = urlutils.joinpath(*args)
267
self.assertEqual(expected, joined)
269
# Test a single element
272
# Test relative path joining
273
test('foo/bar', 'foo', 'bar')
274
test('foo/bar', 'foo', '.', 'bar')
275
test('foo/baz', 'foo', 'bar', '../baz')
276
test('foo/bar/baz', 'foo', 'bar/baz')
277
test('foo/baz', 'foo', 'bar/../baz')
279
# Test joining to an absolute path
281
test('/foo', '/foo', '.')
282
test('/foo/bar', '/foo', 'bar')
283
test('/', '/foo', '..')
285
# Test joining with an absolute path
286
test('/bar', 'foo', '/bar')
288
# Test joining to a path with a trailing slash
289
test('foo/bar', 'foo/', 'bar')
292
# Cannot go above root
293
self.assertRaises(InvalidURLJoin, urlutils.joinpath, '/', '../baz')
294
self.assertRaises(InvalidURLJoin, urlutils.joinpath, '/', '..')
295
self.assertRaises(InvalidURLJoin, urlutils.joinpath, '/', '/..')
297
def test_join_segment_parameters_raw(self):
298
join_segment_parameters_raw = urlutils.join_segment_parameters_raw
299
self.assertEquals("/somedir/path",
300
join_segment_parameters_raw("/somedir/path"))
301
self.assertEquals("/somedir/path,rawdata",
302
join_segment_parameters_raw("/somedir/path", "rawdata"))
303
self.assertRaises(InvalidURLJoin,
304
join_segment_parameters_raw, "/somedir/path",
305
"rawdata1,rawdata2,rawdata3")
306
self.assertEquals("/somedir/path,bla,bar",
307
join_segment_parameters_raw("/somedir/path", "bla", "bar"))
308
self.assertEquals("/somedir,exist=some/path,bla,bar",
309
join_segment_parameters_raw("/somedir,exist=some/path",
311
self.assertRaises(TypeError, join_segment_parameters_raw,
314
def test_join_segment_parameters(self):
315
join_segment_parameters = urlutils.join_segment_parameters
316
self.assertEquals("/somedir/path",
317
join_segment_parameters("/somedir/path", {}))
318
self.assertEquals("/somedir/path,key1=val1",
319
join_segment_parameters("/somedir/path", {"key1": "val1"}))
320
self.assertRaises(InvalidURLJoin,
321
join_segment_parameters, "/somedir/path",
322
{"branch": "brr,brr,brr"})
323
self.assertRaises(InvalidURLJoin,
324
join_segment_parameters, "/somedir/path", {"key1=val1": "val2"})
325
self.assertEquals("/somedir/path,key1=val1,key2=val2",
326
join_segment_parameters("/somedir/path", {
327
"key1": "val1", "key2": "val2"}))
328
self.assertEquals("/somedir/path,key1=val1,key2=val2",
329
join_segment_parameters("/somedir/path,key1=val1", {
331
self.assertEquals("/somedir/path,key1=val2",
332
join_segment_parameters("/somedir/path,key1=val1", {
334
self.assertEquals("/somedir,exist=some/path,key1=val1",
335
join_segment_parameters("/somedir,exist=some/path",
337
self.assertEquals("/,key1=val1,key2=val2",
338
join_segment_parameters("/,key1=val1", {"key2": "val2"}))
339
self.assertRaises(TypeError,
340
join_segment_parameters, "/,key1=val1", {"foo": 42})
342
def test_function_type(self):
343
if sys.platform == 'win32':
344
self.assertEqual(urlutils._win32_local_path_to_url,
345
urlutils.local_path_to_url)
346
self.assertEqual(urlutils._win32_local_path_from_url,
347
urlutils.local_path_from_url)
349
self.assertEqual(urlutils._posix_local_path_to_url,
350
urlutils.local_path_to_url)
351
self.assertEqual(urlutils._posix_local_path_from_url,
352
urlutils.local_path_from_url)
354
def test_posix_local_path_to_url(self):
355
to_url = urlutils._posix_local_path_to_url
356
self.assertEqual('file:///path/to/foo',
357
to_url('/path/to/foo'))
359
self.assertEqual('file:///path/to/foo%2Cbar',
360
to_url('/path/to/foo,bar'))
363
result = to_url(u'/path/to/r\xe4ksm\xf6rg\xe5s')
365
raise TestSkipped("local encoding cannot handle unicode")
367
self.assertEqual('file:///path/to/r%C3%A4ksm%C3%B6rg%C3%A5s', result)
368
self.assertFalse(isinstance(result, unicode))
370
def test_posix_local_path_from_url(self):
371
from_url = urlutils._posix_local_path_from_url
372
self.assertEqual('/path/to/foo',
373
from_url('file:///path/to/foo'))
374
self.assertEqual('/path/to/foo',
375
from_url('file:///path/to/foo,branch=foo'))
376
self.assertEqual(u'/path/to/r\xe4ksm\xf6rg\xe5s',
377
from_url('file:///path/to/r%C3%A4ksm%C3%B6rg%C3%A5s'))
378
self.assertEqual(u'/path/to/r\xe4ksm\xf6rg\xe5s',
379
from_url('file:///path/to/r%c3%a4ksm%c3%b6rg%c3%a5s'))
380
self.assertEqual(u'/path/to/r\xe4ksm\xf6rg\xe5s',
381
from_url('file://localhost/path/to/r%c3%a4ksm%c3%b6rg%c3%a5s'))
383
self.assertRaises(InvalidURL, from_url, '/path/to/foo')
385
InvalidURL, from_url,
386
'file://remotehost/path/to/r%c3%a4ksm%c3%b6rg%c3%a5s')
388
def test_win32_local_path_to_url(self):
389
to_url = urlutils._win32_local_path_to_url
390
self.assertEqual('file:///C:/path/to/foo',
391
to_url('C:/path/to/foo'))
392
# BOGUS: on win32, ntpath.abspath will strip trailing
393
# whitespace, so this will always fail
394
# Though under linux, it fakes abspath support
395
# and thus will succeed
396
# self.assertEqual('file:///C:/path/to/foo%20',
397
# to_url('C:/path/to/foo '))
398
self.assertEqual('file:///C:/path/to/f%20oo',
399
to_url('C:/path/to/f oo'))
401
self.assertEqual('file:///', to_url('/'))
403
self.assertEqual('file:///C:/path/to/foo%2Cbar',
404
to_url('C:/path/to/foo,bar'))
406
result = to_url(u'd:/path/to/r\xe4ksm\xf6rg\xe5s')
408
raise TestSkipped("local encoding cannot handle unicode")
410
self.assertEqual('file:///D:/path/to/r%C3%A4ksm%C3%B6rg%C3%A5s', result)
411
self.assertFalse(isinstance(result, unicode))
413
def test_win32_unc_path_to_url(self):
414
self.requireFeature(features.win32_feature)
415
to_url = urlutils._win32_local_path_to_url
416
self.assertEqual('file://HOST/path',
417
to_url(r'\\HOST\path'))
418
self.assertEqual('file://HOST/path',
419
to_url('//HOST/path'))
422
result = to_url(u'//HOST/path/to/r\xe4ksm\xf6rg\xe5s')
424
raise TestSkipped("local encoding cannot handle unicode")
426
self.assertEqual('file://HOST/path/to/r%C3%A4ksm%C3%B6rg%C3%A5s', result)
427
self.assertFalse(isinstance(result, unicode))
429
def test_win32_local_path_from_url(self):
430
from_url = urlutils._win32_local_path_from_url
431
self.assertEqual('C:/path/to/foo',
432
from_url('file:///C|/path/to/foo'))
433
self.assertEqual(u'D:/path/to/r\xe4ksm\xf6rg\xe5s',
434
from_url('file:///d|/path/to/r%C3%A4ksm%C3%B6rg%C3%A5s'))
435
self.assertEqual(u'D:/path/to/r\xe4ksm\xf6rg\xe5s',
436
from_url('file:///d:/path/to/r%c3%a4ksm%c3%b6rg%c3%a5s'))
437
self.assertEqual('/', from_url('file:///'))
438
self.assertEqual('C:/path/to/foo',
439
from_url('file:///C|/path/to/foo,branch=foo'))
441
self.assertRaises(InvalidURL, from_url, 'file:///C:')
442
self.assertRaises(InvalidURL, from_url, 'file:///c')
443
self.assertRaises(InvalidURL, from_url, '/path/to/foo')
444
# Not a valid _win32 url, no drive letter
445
self.assertRaises(InvalidURL, from_url, 'file:///path/to/foo')
447
def test_win32_unc_path_from_url(self):
448
from_url = urlutils._win32_local_path_from_url
449
self.assertEqual('//HOST/path', from_url('file://HOST/path'))
450
self.assertEqual('//HOST/path',
451
from_url('file://HOST/path,branch=foo'))
452
# despite IE allows 2, 4, 5 and 6 slashes in URL to another machine
453
# we want to use only 2 slashes
454
# Firefox understand only 5 slashes in URL, but it's ugly
455
self.assertRaises(InvalidURL, from_url, 'file:////HOST/path')
456
self.assertRaises(InvalidURL, from_url, 'file://///HOST/path')
457
self.assertRaises(InvalidURL, from_url, 'file://////HOST/path')
458
# check for file://C:/ instead of file:///C:/
459
self.assertRaises(InvalidURL, from_url, 'file://C:/path')
461
def test_win32_extract_drive_letter(self):
462
extract = urlutils._win32_extract_drive_letter
463
self.assertEqual(('file:///C:', '/foo'), extract('file://', '/C:/foo'))
464
self.assertEqual(('file:///d|', '/path'), extract('file://', '/d|/path'))
465
self.assertRaises(InvalidURL, extract, 'file://', '/path')
466
# Root drives without slash treated as invalid, see bug #841322
467
self.assertEqual(('file:///C:', '/'), extract('file://', '/C:/'))
468
self.assertRaises(InvalidURL, extract, 'file://', '/C:')
469
# Invalid without drive separator or following forward slash
470
self.assertRaises(InvalidURL, extract, 'file://', '/C')
471
self.assertRaises(InvalidURL, extract, 'file://', '/C:ool')
473
def test_split(self):
474
# Test bzrlib.urlutils.split()
475
split = urlutils.split
476
if sys.platform == 'win32':
477
self.assertRaises(InvalidURL, split, 'file:///path/to/foo')
478
self.assertEqual(('file:///C|/', 'foo'), split('file:///C|/foo'))
479
self.assertEqual(('file:///C:/', ''), split('file:///C:/'))
481
self.assertEqual(('file:///', 'foo'), split('file:///foo'))
482
self.assertEqual(('file:///', ''), split('file:///'))
484
self.assertEqual(('http://host/path/to', 'foo'), split('http://host/path/to/foo'))
485
self.assertEqual(('http://host/path/to', 'foo'), split('http://host/path/to/foo/'))
486
self.assertEqual(('http://host/path/to/foo', ''),
487
split('http://host/path/to/foo/', exclude_trailing_slash=False))
488
self.assertEqual(('http://host/', 'path'), split('http://host/path'))
489
self.assertEqual(('http://host/', ''), split('http://host/'))
490
self.assertEqual(('http://host', ''), split('http://host'))
491
self.assertEqual(('http:///nohost', 'path'), split('http:///nohost/path'))
493
self.assertEqual(('random+scheme://user:pass@ahost:port/', 'path'),
494
split('random+scheme://user:pass@ahost:port/path'))
495
self.assertEqual(('random+scheme://user:pass@ahost:port/', 'path'),
496
split('random+scheme://user:pass@ahost:port/path/'))
497
self.assertEqual(('random+scheme://user:pass@ahost:port/', ''),
498
split('random+scheme://user:pass@ahost:port/'))
501
self.assertEqual(('path/to', 'foo'), split('path/to/foo'))
502
self.assertEqual(('path/to', 'foo'), split('path/to/foo/'))
503
self.assertEqual(('path/to/foo', ''),
504
split('path/to/foo/', exclude_trailing_slash=False))
505
self.assertEqual(('path/..', 'foo'), split('path/../foo'))
506
self.assertEqual(('../path', 'foo'), split('../path/foo'))
508
def test_split_segment_parameters_raw(self):
509
split_segment_parameters_raw = urlutils.split_segment_parameters_raw
510
# Check relative references with absolute paths
511
self.assertEquals(("/some/path", []),
512
split_segment_parameters_raw("/some/path"))
513
self.assertEquals(("/some/path", ["tip"]),
514
split_segment_parameters_raw("/some/path,tip"))
515
self.assertEquals(("/some,dir/path", ["tip"]),
516
split_segment_parameters_raw("/some,dir/path,tip"))
517
self.assertEquals(("/somedir/path", ["heads%2Ftip"]),
518
split_segment_parameters_raw("/somedir/path,heads%2Ftip"))
519
self.assertEquals(("/somedir/path", ["heads%2Ftip", "bar"]),
520
split_segment_parameters_raw("/somedir/path,heads%2Ftip,bar"))
521
# Check relative references with relative paths
522
self.assertEquals(("", ["key1=val1"]),
523
split_segment_parameters_raw(",key1=val1"))
524
self.assertEquals(("foo/", ["key1=val1"]),
525
split_segment_parameters_raw("foo/,key1=val1"))
526
self.assertEquals(("foo", ["key1=val1"]),
527
split_segment_parameters_raw("foo,key1=val1"))
528
self.assertEquals(("foo/base,la=bla/other/elements", []),
529
split_segment_parameters_raw("foo/base,la=bla/other/elements"))
530
self.assertEquals(("foo/base,la=bla/other/elements", ["a=b"]),
531
split_segment_parameters_raw("foo/base,la=bla/other/elements,a=b"))
532
# TODO: Check full URLs as well as relative references
534
def test_split_segment_parameters(self):
535
split_segment_parameters = urlutils.split_segment_parameters
536
# Check relative references with absolute paths
537
self.assertEquals(("/some/path", {}),
538
split_segment_parameters("/some/path"))
539
self.assertEquals(("/some/path", {"branch": "tip"}),
540
split_segment_parameters("/some/path,branch=tip"))
541
self.assertEquals(("/some,dir/path", {"branch": "tip"}),
542
split_segment_parameters("/some,dir/path,branch=tip"))
543
self.assertEquals(("/somedir/path", {"ref": "heads%2Ftip"}),
544
split_segment_parameters("/somedir/path,ref=heads%2Ftip"))
545
self.assertEquals(("/somedir/path",
546
{"ref": "heads%2Ftip", "key1": "val1"}),
547
split_segment_parameters(
548
"/somedir/path,ref=heads%2Ftip,key1=val1"))
549
self.assertEquals(("/somedir/path", {"ref": "heads%2F=tip"}),
550
split_segment_parameters("/somedir/path,ref=heads%2F=tip"))
551
# Check relative references with relative paths
552
self.assertEquals(("", {"key1": "val1"}),
553
split_segment_parameters(",key1=val1"))
554
self.assertEquals(("foo/", {"key1": "val1"}),
555
split_segment_parameters("foo/,key1=val1"))
556
self.assertEquals(("foo/base,key1=val1/other/elements", {}),
557
split_segment_parameters("foo/base,key1=val1/other/elements"))
558
self.assertEquals(("foo/base,key1=val1/other/elements",
559
{"key2": "val2"}), split_segment_parameters(
560
"foo/base,key1=val1/other/elements,key2=val2"))
561
# TODO: Check full URLs as well as relative references
563
def test_win32_strip_local_trailing_slash(self):
564
strip = urlutils._win32_strip_local_trailing_slash
565
self.assertEqual('file://', strip('file://'))
566
self.assertEqual('file:///', strip('file:///'))
567
self.assertEqual('file:///C', strip('file:///C'))
568
self.assertEqual('file:///C:', strip('file:///C:'))
569
self.assertEqual('file:///d|', strip('file:///d|'))
570
self.assertEqual('file:///C:/', strip('file:///C:/'))
571
self.assertEqual('file:///C:/a', strip('file:///C:/a/'))
573
def test_strip_trailing_slash(self):
574
sts = urlutils.strip_trailing_slash
575
if sys.platform == 'win32':
576
self.assertEqual('file:///C|/', sts('file:///C|/'))
577
self.assertEqual('file:///C:/foo', sts('file:///C:/foo'))
578
self.assertEqual('file:///C|/foo', sts('file:///C|/foo/'))
580
self.assertEqual('file:///', sts('file:///'))
581
self.assertEqual('file:///foo', sts('file:///foo'))
582
self.assertEqual('file:///foo', sts('file:///foo/'))
584
self.assertEqual('http://host/', sts('http://host/'))
585
self.assertEqual('http://host/foo', sts('http://host/foo'))
586
self.assertEqual('http://host/foo', sts('http://host/foo/'))
588
# No need to fail just because the slash is missing
589
self.assertEqual('http://host', sts('http://host'))
590
# TODO: jam 20060502 Should this raise InvalidURL?
591
self.assertEqual('file://', sts('file://'))
593
self.assertEqual('random+scheme://user:pass@ahost:port/path',
594
sts('random+scheme://user:pass@ahost:port/path'))
595
self.assertEqual('random+scheme://user:pass@ahost:port/path',
596
sts('random+scheme://user:pass@ahost:port/path/'))
597
self.assertEqual('random+scheme://user:pass@ahost:port/',
598
sts('random+scheme://user:pass@ahost:port/'))
600
# Make sure relative paths work too
601
self.assertEqual('path/to/foo', sts('path/to/foo'))
602
self.assertEqual('path/to/foo', sts('path/to/foo/'))
603
self.assertEqual('../to/foo', sts('../to/foo/'))
604
self.assertEqual('path/../foo', sts('path/../foo/'))
606
def test_unescape_for_display_utf8(self):
607
# Test that URLs are converted to nice unicode strings for display
608
def test(expected, url, encoding='utf-8'):
609
disp_url = urlutils.unescape_for_display(url, encoding=encoding)
610
self.assertIsInstance(disp_url, unicode)
611
self.assertEqual(expected, disp_url)
613
test('http://foo', 'http://foo')
614
if sys.platform == 'win32':
615
test('C:/foo/path', 'file:///C|/foo/path')
616
test('C:/foo/path', 'file:///C:/foo/path')
618
test('/foo/path', 'file:///foo/path')
620
test('http://foo/%2Fbaz', 'http://foo/%2Fbaz')
621
test(u'http://host/r\xe4ksm\xf6rg\xe5s',
622
'http://host/r%C3%A4ksm%C3%B6rg%C3%A5s')
624
# Make sure special escaped characters stay escaped
625
test(u'http://host/%3B%2F%3F%3A%40%26%3D%2B%24%2C%23',
626
'http://host/%3B%2F%3F%3A%40%26%3D%2B%24%2C%23')
628
# Can we handle sections that don't have utf-8 encoding?
629
test(u'http://host/%EE%EE%EE/r\xe4ksm\xf6rg\xe5s',
630
'http://host/%EE%EE%EE/r%C3%A4ksm%C3%B6rg%C3%A5s')
632
# Test encoding into output that can handle some characters
633
test(u'http://host/%EE%EE%EE/r\xe4ksm\xf6rg\xe5s',
634
'http://host/%EE%EE%EE/r%C3%A4ksm%C3%B6rg%C3%A5s',
635
encoding='iso-8859-1')
637
# This one can be encoded into utf8
638
test(u'http://host/\u062c\u0648\u062c\u0648',
639
'http://host/%d8%ac%d9%88%d8%ac%d9%88',
642
# This can't be put into 8859-1 and so stays as escapes
643
test(u'http://host/%d8%ac%d9%88%d8%ac%d9%88',
644
'http://host/%d8%ac%d9%88%d8%ac%d9%88',
645
encoding='iso-8859-1')
647
def test_escape(self):
648
self.assertEqual('%25', urlutils.escape('%'))
649
self.assertEqual('%C3%A5', urlutils.escape(u'\xe5'))
650
self.assertFalse(isinstance(urlutils.escape(u'\xe5'), unicode))
652
def test_escape_tildes(self):
653
self.assertEqual('~foo', urlutils.escape('~foo'))
655
def test_unescape(self):
656
self.assertEqual('%', urlutils.unescape('%25'))
657
self.assertEqual(u'\xe5', urlutils.unescape('%C3%A5'))
659
self.assertRaises(InvalidURL, urlutils.unescape, u'\xe5')
660
self.assertRaises(InvalidURL, urlutils.unescape, '\xe5')
661
self.assertRaises(InvalidURL, urlutils.unescape, '%E5')
663
def test_escape_unescape(self):
664
self.assertEqual(u'\xe5', urlutils.unescape(urlutils.escape(u'\xe5')))
665
self.assertEqual('%', urlutils.unescape(urlutils.escape('%')))
667
def test_relative_url(self):
668
def test(expected, base, other):
669
result = urlutils.relative_url(base, other)
670
self.assertEqual(expected, result)
672
test('a', 'http://host/', 'http://host/a')
673
test('http://entirely/different', 'sftp://host/branch',
674
'http://entirely/different')
675
test('../person/feature', 'http://host/branch/mainline',
676
'http://host/branch/person/feature')
677
test('..', 'http://host/branch', 'http://host/')
678
test('http://host2/branch', 'http://host1/branch', 'http://host2/branch')
679
test('.', 'http://host1/branch', 'http://host1/branch')
680
test('../../../branch/2b', 'file:///home/jelmer/foo/bar/2b',
681
'file:///home/jelmer/branch/2b')
682
test('../../branch/2b', 'sftp://host/home/jelmer/bar/2b',
683
'sftp://host/home/jelmer/branch/2b')
684
test('../../branch/feature/%2b', 'http://host/home/jelmer/bar/%2b',
685
'http://host/home/jelmer/branch/feature/%2b')
686
test('../../branch/feature/2b', 'http://host/home/jelmer/bar/2b/',
687
'http://host/home/jelmer/branch/feature/2b')
688
# relative_url should preserve a trailing slash
689
test('../../branch/feature/2b/', 'http://host/home/jelmer/bar/2b/',
690
'http://host/home/jelmer/branch/feature/2b/')
691
test('../../branch/feature/2b/', 'http://host/home/jelmer/bar/2b',
692
'http://host/home/jelmer/branch/feature/2b/')
694
# TODO: treat http://host as http://host/
695
# relative_url is typically called from a branch.base or
696
# transport.base which always ends with a /
697
#test('a', 'http://host', 'http://host/a')
698
test('http://host/a', 'http://host', 'http://host/a')
699
#test('.', 'http://host', 'http://host/')
700
test('http://host/', 'http://host', 'http://host/')
701
#test('.', 'http://host/', 'http://host')
702
test('http://host', 'http://host/', 'http://host')
704
# On Windows file:///C:/path/to and file:///D:/other/path
705
# should not use relative url over the non-existent '/' directory.
706
if sys.platform == 'win32':
708
test('../../other/path',
709
'file:///C:/path/to', 'file:///C:/other/path')
710
#~next two tests is failed, i.e. urlutils.relative_url expects
711
#~to see normalized file URLs?
712
#~test('../../other/path',
713
#~ 'file:///C:/path/to', 'file:///c:/other/path')
714
#~test('../../other/path',
715
#~ 'file:///C:/path/to', 'file:///C|/other/path')
717
# check UNC paths too
718
test('../../other/path',
719
'file://HOST/base/path/to', 'file://HOST/base/other/path')
720
# on different drives
721
test('file:///D:/other/path',
722
'file:///C:/path/to', 'file:///D:/other/path')
723
# TODO: strictly saying in UNC path //HOST/base is full analog
724
# of drive letter for hard disk, and this situation is also
725
# should be exception from rules. [bialix 20071221]
728
class TestCwdToURL(TestCaseInTempDir):
729
"""Test that local_path_to_url works based on the cwd"""
732
# This test will fail if getcwd is not ascii
736
url = urlutils.local_path_to_url('.')
737
self.assertEndsWith(url, '/mytest')
739
def test_non_ascii(self):
740
if win32utils.winver == 'Windows 98':
741
raise TestSkipped('Windows 98 cannot handle unicode filenames')
746
raise TestSkipped('cannot create unicode directory')
750
# On Mac OSX this directory is actually:
751
# u'/dode\u0301' => '/dode\xcc\x81
752
# but we should normalize it back to
753
# u'/dod\xe9' => '/dod\xc3\xa9'
754
url = urlutils.local_path_to_url('.')
755
self.assertEndsWith(url, '/dod%C3%A9')
758
class TestDeriveToLocation(TestCase):
759
"""Test that the mapping of FROM_LOCATION to TO_LOCATION works."""
761
def test_to_locations_derived_from_paths(self):
762
derive = urlutils.derive_to_location
763
self.assertEqual("bar", derive("bar"))
764
self.assertEqual("bar", derive("../bar"))
765
self.assertEqual("bar", derive("/foo/bar"))
766
self.assertEqual("bar", derive("c:/foo/bar"))
767
self.assertEqual("bar", derive("c:bar"))
769
def test_to_locations_derived_from_urls(self):
770
derive = urlutils.derive_to_location
771
self.assertEqual("bar", derive("http://foo/bar"))
772
self.assertEqual("bar", derive("bzr+ssh://foo/bar"))
773
self.assertEqual("foo-bar", derive("lp:foo-bar"))
776
class TestRebaseURL(TestCase):
777
"""Test the behavior of rebase_url."""
779
def test_non_relative(self):
780
result = urlutils.rebase_url('file://foo', 'file://foo',
782
self.assertEqual('file://foo', result)
783
result = urlutils.rebase_url('/foo', 'file://foo',
785
self.assertEqual('/foo', result)
787
def test_different_ports(self):
788
e = self.assertRaises(InvalidRebaseURLs, urlutils.rebase_url,
789
'foo', 'http://bar:80', 'http://bar:81')
790
self.assertEqual(str(e), "URLs differ by more than path:"
791
" 'http://bar:80' and 'http://bar:81'")
793
def test_different_hosts(self):
794
e = self.assertRaises(InvalidRebaseURLs, urlutils.rebase_url,
795
'foo', 'http://bar', 'http://baz')
796
self.assertEqual(str(e), "URLs differ by more than path: 'http://bar'"
799
def test_different_protocol(self):
800
e = self.assertRaises(InvalidRebaseURLs, urlutils.rebase_url,
801
'foo', 'http://bar', 'ftp://bar')
802
self.assertEqual(str(e), "URLs differ by more than path: 'http://bar'"
805
def test_rebase_success(self):
806
self.assertEqual('../bar', urlutils.rebase_url('bar', 'http://baz/',
808
self.assertEqual('qux/bar', urlutils.rebase_url('bar',
809
'http://baz/qux', 'http://baz/'))
810
self.assertEqual('.', urlutils.rebase_url('foo',
811
'http://bar/', 'http://bar/foo/'))
812
self.assertEqual('qux/bar', urlutils.rebase_url('../bar',
813
'http://baz/qux/foo', 'http://baz/'))
815
def test_determine_relative_path(self):
816
self.assertEqual('../../baz/bar',
817
urlutils.determine_relative_path(
818
'/qux/quxx', '/baz/bar'))
819
self.assertEqual('..',
820
urlutils.determine_relative_path(
822
self.assertEqual('baz',
823
urlutils.determine_relative_path(
825
self.assertEqual('.', urlutils.determine_relative_path(
829
class TestParseURL(TestCase):
831
def test_parse_simple(self):
832
parsed = urlutils.parse_url('http://example.com:80/one')
833
self.assertEquals(('http', None, None, 'example.com', 80, '/one'),
837
parsed = urlutils.parse_url('http://[1:2:3::40]/one')
838
self.assertEquals(('http', None, None, '1:2:3::40', None, '/one'),
841
def test_ipv6_port(self):
842
parsed = urlutils.parse_url('http://[1:2:3::40]:80/one')
843
self.assertEquals(('http', None, None, '1:2:3::40', 80, '/one'),
847
class TestURL(TestCase):
849
def test_parse_simple(self):
850
parsed = urlutils.URL.from_string('http://example.com:80/one')
851
self.assertEquals('http', parsed.scheme)
852
self.assertIs(None, parsed.user)
853
self.assertIs(None, parsed.password)
854
self.assertEquals('example.com', parsed.host)
855
self.assertEquals(80, parsed.port)
856
self.assertEquals('/one', parsed.path)
859
parsed = urlutils.URL.from_string('http://[1:2:3::40]/one')
860
self.assertEquals('http', parsed.scheme)
861
self.assertIs(None, parsed.port)
862
self.assertIs(None, parsed.user)
863
self.assertIs(None, parsed.password)
864
self.assertEquals('1:2:3::40', parsed.host)
865
self.assertEquals('/one', parsed.path)
867
def test_ipv6_port(self):
868
parsed = urlutils.URL.from_string('http://[1:2:3::40]:80/one')
869
self.assertEquals('http', parsed.scheme)
870
self.assertEquals('1:2:3::40', parsed.host)
871
self.assertIs(None, parsed.user)
872
self.assertIs(None, parsed.password)
873
self.assertEquals(80, parsed.port)
874
self.assertEquals('/one', parsed.path)
876
def test_quoted(self):
877
parsed = urlutils.URL.from_string(
878
'http://ro%62ey:h%40t@ex%41mple.com:2222/path')
879
self.assertEquals(parsed.quoted_host, 'ex%41mple.com')
880
self.assertEquals(parsed.host, 'exAmple.com')
881
self.assertEquals(parsed.port, 2222)
882
self.assertEquals(parsed.quoted_user, 'ro%62ey')
883
self.assertEquals(parsed.user, 'robey')
884
self.assertEquals(parsed.quoted_password, 'h%40t')
885
self.assertEquals(parsed.password, 'h@t')
886
self.assertEquals(parsed.path, '/path')
889
parsed1 = urlutils.URL.from_string('http://[1:2:3::40]:80/one')
890
parsed2 = urlutils.URL.from_string('http://[1:2:3::40]:80/one')
891
self.assertEquals(parsed1, parsed2)
892
self.assertEquals(parsed1, parsed1)
893
parsed2.path = '/two'
894
self.assertNotEquals(parsed1, parsed2)
897
parsed = urlutils.URL.from_string('http://[1:2:3::40]:80/one')
899
"<URL('http', None, None, '1:2:3::40', 80, '/one')>",
903
parsed = urlutils.URL.from_string('http://[1:2:3::40]:80/one')
904
self.assertEquals('http://[1:2:3::40]:80/one', str(parsed))
906
def test__combine_paths(self):
907
combine = urlutils.URL._combine_paths
908
self.assertEqual('/home/sarah/project/foo',
909
combine('/home/sarah', 'project/foo'))
910
self.assertEqual('/etc',
911
combine('/home/sarah', '../../etc'))
912
self.assertEqual('/etc',
913
combine('/home/sarah', '../../../etc'))
914
self.assertEqual('/etc',
915
combine('/home/sarah', '/etc'))
917
def test_clone(self):
918
url = urlutils.URL.from_string('http://[1:2:3::40]:80/one')
919
url1 = url.clone("two")
920
self.assertEquals("/one/two", url1.path)
921
url2 = url.clone("/two")
922
self.assertEquals("/two", url2.path)
924
self.assertIsNot(url, url3)
925
self.assertEquals(url, url3)
928
class TestFileRelpath(TestCase):
930
# GZ 2011-11-18: A way to override all path handling functions to one
931
# platform or another for testing would be nice.
933
def _with_posix_paths(self):
934
self.overrideAttr(urlutils, "local_path_from_url",
935
urlutils._posix_local_path_from_url)
936
self.overrideAttr(urlutils, "MIN_ABS_FILEURL_LENGTH", len("file:///"))
937
self.overrideAttr(osutils, "normpath", osutils._posix_normpath)
938
self.overrideAttr(osutils, "abspath", osutils._posix_abspath)
939
self.overrideAttr(osutils, "normpath", osutils._posix_normpath)
940
self.overrideAttr(osutils, "pathjoin", osutils.posixpath.join)
941
self.overrideAttr(osutils, "split", osutils.posixpath.split)
942
self.overrideAttr(osutils, "MIN_ABS_PATHLENGTH", 1)
944
def _with_win32_paths(self):
945
self.overrideAttr(urlutils, "local_path_from_url",
946
urlutils._win32_local_path_from_url)
947
self.overrideAttr(urlutils, "MIN_ABS_FILEURL_LENGTH",
948
urlutils.WIN32_MIN_ABS_FILEURL_LENGTH)
949
self.overrideAttr(osutils, "abspath", osutils._win32_abspath)
950
self.overrideAttr(osutils, "normpath", osutils._win32_normpath)
951
self.overrideAttr(osutils, "pathjoin", osutils._win32_pathjoin)
952
self.overrideAttr(osutils, "split", osutils.ntpath.split)
953
self.overrideAttr(osutils, "MIN_ABS_PATHLENGTH", 3)
955
def test_same_url_posix(self):
956
self._with_posix_paths()
957
self.assertEquals("",
958
urlutils.file_relpath("file:///a", "file:///a"))
959
self.assertEquals("",
960
urlutils.file_relpath("file:///a", "file:///a/"))
961
self.assertEquals("",
962
urlutils.file_relpath("file:///a/", "file:///a"))
964
def test_same_url_win32(self):
965
self._with_win32_paths()
966
self.assertEquals("",
967
urlutils.file_relpath("file:///A:/", "file:///A:/"))
968
self.assertEquals("",
969
urlutils.file_relpath("file:///A|/", "file:///A:/"))
970
self.assertEquals("",
971
urlutils.file_relpath("file:///A:/b/", "file:///A:/b/"))
972
self.assertEquals("",
973
urlutils.file_relpath("file:///A:/b", "file:///A:/b/"))
974
self.assertEquals("",
975
urlutils.file_relpath("file:///A:/b/", "file:///A:/b"))
977
def test_child_posix(self):
978
self._with_posix_paths()
979
self.assertEquals("b",
980
urlutils.file_relpath("file:///a", "file:///a/b"))
981
self.assertEquals("b",
982
urlutils.file_relpath("file:///a/", "file:///a/b"))
983
self.assertEquals("b/c",
984
urlutils.file_relpath("file:///a", "file:///a/b/c"))
986
def test_child_win32(self):
987
self._with_win32_paths()
988
self.assertEquals("b",
989
urlutils.file_relpath("file:///A:/", "file:///A:/b"))
990
self.assertEquals("b",
991
urlutils.file_relpath("file:///A|/", "file:///A:/b"))
992
self.assertEquals("c",
993
urlutils.file_relpath("file:///A:/b", "file:///A:/b/c"))
994
self.assertEquals("c",
995
urlutils.file_relpath("file:///A:/b/", "file:///A:/b/c"))
996
self.assertEquals("c/d",
997
urlutils.file_relpath("file:///A:/b", "file:///A:/b/c/d"))
999
def test_sibling_posix(self):
1000
self._with_posix_paths()
1001
self.assertRaises(PathNotChild,
1002
urlutils.file_relpath, "file:///a/b", "file:///a/c")
1003
self.assertRaises(PathNotChild,
1004
urlutils.file_relpath, "file:///a/b/", "file:///a/c")
1005
self.assertRaises(PathNotChild,
1006
urlutils.file_relpath, "file:///a/b/", "file:///a/c/")
1008
def test_sibling_win32(self):
1009
self._with_win32_paths()
1010
self.assertRaises(PathNotChild,
1011
urlutils.file_relpath, "file:///A:/b", "file:///A:/c")
1012
self.assertRaises(PathNotChild,
1013
urlutils.file_relpath, "file:///A:/b/", "file:///A:/c")
1014
self.assertRaises(PathNotChild,
1015
urlutils.file_relpath, "file:///A:/b/", "file:///A:/c/")
1017
def test_parent_posix(self):
1018
self._with_posix_paths()
1019
self.assertRaises(PathNotChild,
1020
urlutils.file_relpath, "file:///a/b", "file:///a")
1021
self.assertRaises(PathNotChild,
1022
urlutils.file_relpath, "file:///a/b", "file:///a/")
1024
def test_parent_win32(self):
1025
self._with_win32_paths()
1026
self.assertRaises(PathNotChild,
1027
urlutils.file_relpath, "file:///A:/b", "file:///A:/")
1028
self.assertRaises(PathNotChild,
1029
urlutils.file_relpath, "file:///A:/b/c", "file:///A:/b")
1032
class QuoteTests(TestCase):
1034
def test_quote(self):
1035
self.assertEqual('abc%20def', urlutils.quote('abc def'))
1036
self.assertEqual('abc%2Fdef', urlutils.quote('abc/def', safe=''))
1037
self.assertEqual('abc/def', urlutils.quote('abc/def', safe='/'))
1039
def test_quote_tildes(self):
1040
self.assertEqual('%7Efoo', urlutils.quote('~foo'))
1041
self.assertEqual('~foo', urlutils.quote('~foo', safe='/~'))
1043
def test_unquote(self):
1044
self.assertEqual('%', urlutils.unquote('%25'))
1045
self.assertEqual('\xc3\xa5', urlutils.unquote('%C3%A5'))
1046
self.assertEqual(u"\xe5", urlutils.unquote(u'\xe5'))