~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/tests/test_urlutils.py

  • Committer: Canonical.com Patch Queue Manager
  • Date: 2008-10-31 04:39:04 UTC
  • mfrom: (3565.6.16 switch_nick)
  • Revision ID: pqm@pqm.ubuntu.com-20081031043904-52fnbfrloojemvcc
(mbp) branch nickname documentation

Show diffs side-by-side

added added

removed removed

Lines of Context:
 
1
# Copyright (C) 2005 Canonical Ltd
 
2
#
 
3
# This program is free software; you can redistribute it and/or modify
 
4
# it under the terms of the GNU General Public License as published by
 
5
# the Free Software Foundation; either version 2 of the License, or
 
6
# (at your option) any later version.
 
7
#
 
8
# This program is distributed in the hope that it will be useful,
 
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
 
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 
11
# GNU General Public License for more details.
 
12
#
 
13
# You should have received a copy of the GNU General Public License
 
14
# along with this program; if not, write to the Free Software
 
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 
16
 
 
17
"""Tests for the urlutils wrapper."""
 
18
 
 
19
import os
 
20
import re
 
21
import sys
 
22
 
 
23
from bzrlib import osutils, urlutils, win32utils
 
24
from bzrlib.errors import InvalidURL, InvalidURLJoin, InvalidRebaseURLs
 
25
from bzrlib.tests import TestCaseInTempDir, TestCase, TestSkipped
 
26
 
 
27
 
 
28
class TestUrlToPath(TestCase):
 
29
    
 
30
    def test_basename(self):
 
31
        # bzrlib.urlutils.basename
 
32
        # Test bzrlib.urlutils.split()
 
33
        basename = urlutils.basename
 
34
        if sys.platform == 'win32':
 
35
            self.assertRaises(InvalidURL, basename, 'file:///path/to/foo')
 
36
            self.assertEqual('foo', basename('file:///C|/foo'))
 
37
            self.assertEqual('foo', basename('file:///C:/foo'))
 
38
            self.assertEqual('', basename('file:///C:/'))
 
39
        else:
 
40
            self.assertEqual('foo', basename('file:///foo'))
 
41
            self.assertEqual('', basename('file:///'))
 
42
 
 
43
        self.assertEqual('foo', basename('http://host/path/to/foo'))
 
44
        self.assertEqual('foo', basename('http://host/path/to/foo/'))
 
45
        self.assertEqual('',
 
46
            basename('http://host/path/to/foo/', exclude_trailing_slash=False))
 
47
        self.assertEqual('path', basename('http://host/path'))
 
48
        self.assertEqual('', basename('http://host/'))
 
49
        self.assertEqual('', basename('http://host'))
 
50
        self.assertEqual('path', basename('http:///nohost/path'))
 
51
 
 
52
        self.assertEqual('path', basename('random+scheme://user:pass@ahost:port/path'))
 
53
        self.assertEqual('path', basename('random+scheme://user:pass@ahost:port/path/'))
 
54
        self.assertEqual('', basename('random+scheme://user:pass@ahost:port/'))
 
55
 
 
56
        # relative paths
 
57
        self.assertEqual('foo', basename('path/to/foo'))
 
58
        self.assertEqual('foo', basename('path/to/foo/'))
 
59
        self.assertEqual('', basename('path/to/foo/',
 
60
            exclude_trailing_slash=False))
 
61
        self.assertEqual('foo', basename('path/../foo'))
 
62
        self.assertEqual('foo', basename('../path/foo'))
 
63
 
 
64
    def test_normalize_url_files(self):
 
65
        # Test that local paths are properly normalized
 
66
        normalize_url = urlutils.normalize_url
 
67
 
 
68
        def norm_file(expected, path):
 
69
            url = normalize_url(path)
 
70
            self.assertStartsWith(url, 'file:///')
 
71
            if sys.platform == 'win32':
 
72
                url = url[len('file:///C:'):]
 
73
            else:
 
74
                url = url[len('file://'):]
 
75
 
 
76
            self.assertEndsWith(url, expected)
 
77
 
 
78
        norm_file('path/to/foo', 'path/to/foo')
 
79
        norm_file('/path/to/foo', '/path/to/foo')
 
80
        norm_file('path/to/foo', '../path/to/foo')
 
81
 
 
82
        # Local paths are assumed to *not* be escaped at all
 
83
        try:
 
84
            u'uni/\xb5'.encode(osutils.get_user_encoding())
 
85
        except UnicodeError:
 
86
            # locale cannot handle unicode 
 
87
            pass
 
88
        else:
 
89
            norm_file('uni/%C2%B5', u'uni/\xb5')
 
90
 
 
91
        norm_file('uni/%25C2%25B5', u'uni/%C2%B5')
 
92
        norm_file('uni/%20b', u'uni/ b')
 
93
        # All the crazy characters get escaped in local paths => file:/// urls
 
94
        # The ' ' character must not be at the end, because on win32
 
95
        # it gets stripped off by ntpath.abspath
 
96
        norm_file('%27%20%3B/%3F%3A%40%26%3D%2B%24%2C%23', "' ;/?:@&=+$,#")
 
97
 
 
98
    def test_normalize_url_hybrid(self):
 
99
        # Anything with a scheme:// should be treated as a hybrid url
 
100
        # which changes what characters get escaped.
 
101
        normalize_url = urlutils.normalize_url
 
102
 
 
103
        eq = self.assertEqual
 
104
        eq('file:///foo/', normalize_url(u'file:///foo/'))
 
105
        eq('file:///foo/%20', normalize_url(u'file:///foo/ '))
 
106
        eq('file:///foo/%20', normalize_url(u'file:///foo/%20'))
 
107
        # Don't escape reserved characters
 
108
        eq('file:///ab_c.d-e/%f:?g&h=i+j;k,L#M$',
 
109
            normalize_url('file:///ab_c.d-e/%f:?g&h=i+j;k,L#M$'))
 
110
        eq('http://ab_c.d-e/%f:?g&h=i+j;k,L#M$',
 
111
            normalize_url('http://ab_c.d-e/%f:?g&h=i+j;k,L#M$'))
 
112
 
 
113
        # Escape unicode characters, but not already escaped chars
 
114
        eq('http://host/ab/%C2%B5/%C2%B5',
 
115
            normalize_url(u'http://host/ab/%C2%B5/\xb5'))
 
116
 
 
117
        # Unescape characters that don't need to be escaped
 
118
        eq('http://host/~bob%2525-._',
 
119
                normalize_url('http://host/%7Ebob%2525%2D%2E%5F'))
 
120
        eq('http://host/~bob%2525-._',
 
121
                normalize_url(u'http://host/%7Ebob%2525%2D%2E%5F'))
 
122
 
 
123
        # Normalize verifies URLs when they are not unicode
 
124
        # (indicating they did not come from the user)
 
125
        self.assertRaises(InvalidURL, normalize_url, 'http://host/\xb5')
 
126
        self.assertRaises(InvalidURL, normalize_url, 'http://host/ ')
 
127
 
 
128
    def test_url_scheme_re(self):
 
129
        # Test paths that may be URLs
 
130
        def test_one(url, scheme_and_path):
 
131
            """Assert that _url_scheme_re correctly matches
 
132
 
 
133
            :param scheme_and_path: The (scheme, path) that should be matched
 
134
                can be None, to indicate it should not match
 
135
            """
 
136
            m = urlutils._url_scheme_re.match(url)
 
137
            if scheme_and_path is None:
 
138
                self.assertEqual(None, m)
 
139
            else:
 
140
                self.assertEqual(scheme_and_path[0], m.group('scheme'))
 
141
                self.assertEqual(scheme_and_path[1], m.group('path'))
 
142
 
 
143
        # Local paths
 
144
        test_one('/path', None)
 
145
        test_one('C:/path', None)
 
146
        test_one('../path/to/foo', None)
 
147
        test_one(u'../path/to/fo\xe5', None)
 
148
 
 
149
        # Real URLS
 
150
        test_one('http://host/path/', ('http', 'host/path/'))
 
151
        test_one('sftp://host/path/to/foo', ('sftp', 'host/path/to/foo'))
 
152
        test_one('file:///usr/bin', ('file', '/usr/bin'))
 
153
        test_one('file:///C:/Windows', ('file', '/C:/Windows'))
 
154
        test_one('file:///C|/Windows', ('file', '/C|/Windows'))
 
155
        test_one(u'readonly+sftp://host/path/\xe5', ('readonly+sftp', u'host/path/\xe5'))
 
156
 
 
157
        # Weird stuff
 
158
        # Can't have slashes or colons in the scheme
 
159
        test_one('/path/to/://foo', None)
 
160
        test_one('path:path://foo', None)
 
161
        # Must have more than one character for scheme
 
162
        test_one('C://foo', None)
 
163
        test_one('ab://foo', ('ab', 'foo'))
 
164
 
 
165
    def test_dirname(self):
 
166
        # Test bzrlib.urlutils.dirname()
 
167
        dirname = urlutils.dirname
 
168
        if sys.platform == 'win32':
 
169
            self.assertRaises(InvalidURL, dirname, 'file:///path/to/foo')
 
170
            self.assertEqual('file:///C|/', dirname('file:///C|/foo'))
 
171
            self.assertEqual('file:///C|/', dirname('file:///C|/'))
 
172
        else:
 
173
            self.assertEqual('file:///', dirname('file:///foo'))
 
174
            self.assertEqual('file:///', dirname('file:///'))
 
175
 
 
176
        self.assertEqual('http://host/path/to', dirname('http://host/path/to/foo'))
 
177
        self.assertEqual('http://host/path/to', dirname('http://host/path/to/foo/'))
 
178
        self.assertEqual('http://host/path/to/foo',
 
179
            dirname('http://host/path/to/foo/', exclude_trailing_slash=False))
 
180
        self.assertEqual('http://host/', dirname('http://host/path'))
 
181
        self.assertEqual('http://host/', dirname('http://host/'))
 
182
        self.assertEqual('http://host', dirname('http://host'))
 
183
        self.assertEqual('http:///nohost', dirname('http:///nohost/path'))
 
184
 
 
185
        self.assertEqual('random+scheme://user:pass@ahost:port/',
 
186
            dirname('random+scheme://user:pass@ahost:port/path'))
 
187
        self.assertEqual('random+scheme://user:pass@ahost:port/',
 
188
            dirname('random+scheme://user:pass@ahost:port/path/'))
 
189
        self.assertEqual('random+scheme://user:pass@ahost:port/',
 
190
            dirname('random+scheme://user:pass@ahost:port/'))
 
191
 
 
192
        # relative paths
 
193
        self.assertEqual('path/to', dirname('path/to/foo'))
 
194
        self.assertEqual('path/to', dirname('path/to/foo/'))
 
195
        self.assertEqual('path/to/foo',
 
196
            dirname('path/to/foo/', exclude_trailing_slash=False))
 
197
        self.assertEqual('path/..', dirname('path/../foo'))
 
198
        self.assertEqual('../path', dirname('../path/foo'))
 
199
 
 
200
    def test_join(self):
 
201
        def test(expected, *args):
 
202
            joined = urlutils.join(*args)
 
203
            self.assertEqual(expected, joined)
 
204
 
 
205
        # Test relative path joining
 
206
        test('foo', 'foo') # relative fragment with nothing is preserved.
 
207
        test('foo/bar', 'foo', 'bar')
 
208
        test('http://foo/bar', 'http://foo', 'bar')
 
209
        test('http://foo/bar', 'http://foo', '.', 'bar')
 
210
        test('http://foo/baz', 'http://foo', 'bar', '../baz')
 
211
        test('http://foo/bar/baz', 'http://foo', 'bar/baz')
 
212
        test('http://foo/baz', 'http://foo', 'bar/../baz')
 
213
        test('http://foo/baz', 'http://foo/bar/', '../baz')
 
214
 
 
215
        # Absolute paths
 
216
        test('http://foo', 'http://foo') # abs url with nothing is preserved.
 
217
        test('http://bar', 'http://foo', 'http://bar')
 
218
        test('sftp://bzr/foo', 'http://foo', 'bar', 'sftp://bzr/foo')
 
219
        test('file:///bar', 'foo', 'file:///bar')
 
220
        test('http://bar/', 'http://foo', 'http://bar/')
 
221
        test('http://bar/a', 'http://foo', 'http://bar/a')
 
222
        test('http://bar/a/', 'http://foo', 'http://bar/a/')
 
223
 
 
224
        # From a base path
 
225
        test('file:///foo', 'file:///', 'foo')
 
226
        test('file:///bar/foo', 'file:///bar/', 'foo')
 
227
        test('http://host/foo', 'http://host/', 'foo')
 
228
        test('http://host/', 'http://host', '')
 
229
        
 
230
        # Invalid joinings
 
231
        # Cannot go above root
 
232
        # Implicitly at root:
 
233
        self.assertRaises(InvalidURLJoin, urlutils.join,
 
234
                'http://foo', '../baz')
 
235
        self.assertRaises(InvalidURLJoin, urlutils.join,
 
236
                'http://foo', '/..')
 
237
        # Joining from a path explicitly under the root.
 
238
        self.assertRaises(InvalidURLJoin, urlutils.join,
 
239
                'http://foo/a', '../../b')
 
240
 
 
241
    def test_joinpath(self):
 
242
        def test(expected, *args):
 
243
            joined = urlutils.joinpath(*args)
 
244
            self.assertEqual(expected, joined)
 
245
 
 
246
        # Test a single element
 
247
        test('foo', 'foo')
 
248
 
 
249
        # Test relative path joining
 
250
        test('foo/bar', 'foo', 'bar')
 
251
        test('foo/bar', 'foo', '.', 'bar')
 
252
        test('foo/baz', 'foo', 'bar', '../baz')
 
253
        test('foo/bar/baz', 'foo', 'bar/baz')
 
254
        test('foo/baz', 'foo', 'bar/../baz')
 
255
 
 
256
        # Test joining to an absolute path
 
257
        test('/foo', '/foo')
 
258
        test('/foo', '/foo', '.')
 
259
        test('/foo/bar', '/foo', 'bar')
 
260
        test('/', '/foo', '..')
 
261
 
 
262
        # Test joining with an absolute path
 
263
        test('/bar', 'foo', '/bar')
 
264
 
 
265
        # Test joining to a path with a trailing slash
 
266
        test('foo/bar', 'foo/', 'bar')
 
267
        
 
268
        # Invalid joinings
 
269
        # Cannot go above root
 
270
        self.assertRaises(InvalidURLJoin, urlutils.joinpath, '/', '../baz')
 
271
        self.assertRaises(InvalidURLJoin, urlutils.joinpath, '/', '..')
 
272
        self.assertRaises(InvalidURLJoin, urlutils.joinpath, '/', '/..')
 
273
 
 
274
    def test_function_type(self):
 
275
        if sys.platform == 'win32':
 
276
            self.assertEqual(urlutils._win32_local_path_to_url, urlutils.local_path_to_url)
 
277
            self.assertEqual(urlutils._win32_local_path_from_url, urlutils.local_path_from_url)
 
278
        else:
 
279
            self.assertEqual(urlutils._posix_local_path_to_url, urlutils.local_path_to_url)
 
280
            self.assertEqual(urlutils._posix_local_path_from_url, urlutils.local_path_from_url)
 
281
 
 
282
    def test_posix_local_path_to_url(self):
 
283
        to_url = urlutils._posix_local_path_to_url
 
284
        self.assertEqual('file:///path/to/foo',
 
285
            to_url('/path/to/foo'))
 
286
 
 
287
        try:
 
288
            result = to_url(u'/path/to/r\xe4ksm\xf6rg\xe5s')
 
289
        except UnicodeError:
 
290
            raise TestSkipped("local encoding cannot handle unicode")
 
291
 
 
292
        self.assertEqual('file:///path/to/r%C3%A4ksm%C3%B6rg%C3%A5s', result)
 
293
        self.assertFalse(isinstance(result, unicode))
 
294
 
 
295
    def test_posix_local_path_from_url(self):
 
296
        from_url = urlutils._posix_local_path_from_url
 
297
        self.assertEqual('/path/to/foo',
 
298
            from_url('file:///path/to/foo'))
 
299
        self.assertEqual(u'/path/to/r\xe4ksm\xf6rg\xe5s',
 
300
            from_url('file:///path/to/r%C3%A4ksm%C3%B6rg%C3%A5s'))
 
301
        self.assertEqual(u'/path/to/r\xe4ksm\xf6rg\xe5s',
 
302
            from_url('file:///path/to/r%c3%a4ksm%c3%b6rg%c3%a5s'))
 
303
 
 
304
        self.assertRaises(InvalidURL, from_url, '/path/to/foo')
 
305
 
 
306
    def test_win32_local_path_to_url(self):
 
307
        to_url = urlutils._win32_local_path_to_url
 
308
        self.assertEqual('file:///C:/path/to/foo',
 
309
            to_url('C:/path/to/foo'))
 
310
        # BOGUS: on win32, ntpath.abspath will strip trailing
 
311
        #       whitespace, so this will always fail
 
312
        #       Though under linux, it fakes abspath support
 
313
        #       and thus will succeed
 
314
        # self.assertEqual('file:///C:/path/to/foo%20',
 
315
        #     to_url('C:/path/to/foo '))
 
316
        self.assertEqual('file:///C:/path/to/f%20oo',
 
317
            to_url('C:/path/to/f oo'))
 
318
        
 
319
        self.assertEqual('file:///', to_url('/'))
 
320
 
 
321
        try:
 
322
            result = to_url(u'd:/path/to/r\xe4ksm\xf6rg\xe5s')
 
323
        except UnicodeError:
 
324
            raise TestSkipped("local encoding cannot handle unicode")
 
325
 
 
326
        self.assertEqual('file:///D:/path/to/r%C3%A4ksm%C3%B6rg%C3%A5s', result)
 
327
        self.assertFalse(isinstance(result, unicode))
 
328
 
 
329
    def test_win32_unc_path_to_url(self):
 
330
        to_url = urlutils._win32_local_path_to_url
 
331
        self.assertEqual('file://HOST/path',
 
332
            to_url(r'\\HOST\path'))
 
333
        self.assertEqual('file://HOST/path',
 
334
            to_url('//HOST/path'))
 
335
 
 
336
        try:
 
337
            result = to_url(u'//HOST/path/to/r\xe4ksm\xf6rg\xe5s')
 
338
        except UnicodeError:
 
339
            raise TestSkipped("local encoding cannot handle unicode")
 
340
 
 
341
        self.assertEqual('file://HOST/path/to/r%C3%A4ksm%C3%B6rg%C3%A5s', result)
 
342
        self.assertFalse(isinstance(result, unicode))
 
343
 
 
344
    def test_win32_local_path_from_url(self):
 
345
        from_url = urlutils._win32_local_path_from_url
 
346
        self.assertEqual('C:/path/to/foo',
 
347
            from_url('file:///C|/path/to/foo'))
 
348
        self.assertEqual(u'D:/path/to/r\xe4ksm\xf6rg\xe5s',
 
349
            from_url('file:///d|/path/to/r%C3%A4ksm%C3%B6rg%C3%A5s'))
 
350
        self.assertEqual(u'D:/path/to/r\xe4ksm\xf6rg\xe5s',
 
351
            from_url('file:///d:/path/to/r%c3%a4ksm%c3%b6rg%c3%a5s'))
 
352
        self.assertEqual('/', from_url('file:///'))
 
353
 
 
354
        self.assertRaises(InvalidURL, from_url, '/path/to/foo')
 
355
        # Not a valid _win32 url, no drive letter
 
356
        self.assertRaises(InvalidURL, from_url, 'file:///path/to/foo')
 
357
 
 
358
    def test_win32_unc_path_from_url(self):
 
359
        from_url = urlutils._win32_local_path_from_url
 
360
        self.assertEqual('//HOST/path', from_url('file://HOST/path'))
 
361
        # despite IE allows 2, 4, 5 and 6 slashes in URL to another machine
 
362
        # we want to use only 2 slashes
 
363
        # Firefox understand only 5 slashes in URL, but it's ugly
 
364
        self.assertRaises(InvalidURL, from_url, 'file:////HOST/path')
 
365
        self.assertRaises(InvalidURL, from_url, 'file://///HOST/path')
 
366
        self.assertRaises(InvalidURL, from_url, 'file://////HOST/path')
 
367
        # check for file://C:/ instead of file:///C:/
 
368
        self.assertRaises(InvalidURL, from_url, 'file://C:/path')
 
369
 
 
370
    def test_win32_extract_drive_letter(self):
 
371
        extract = urlutils._win32_extract_drive_letter
 
372
        self.assertEqual(('file:///C:', '/foo'), extract('file://', '/C:/foo'))
 
373
        self.assertEqual(('file:///d|', '/path'), extract('file://', '/d|/path'))
 
374
        self.assertRaises(InvalidURL, extract, 'file://', '/path')
 
375
 
 
376
    def test_split(self):
 
377
        # Test bzrlib.urlutils.split()
 
378
        split = urlutils.split
 
379
        if sys.platform == 'win32':
 
380
            self.assertRaises(InvalidURL, split, 'file:///path/to/foo')
 
381
            self.assertEqual(('file:///C|/', 'foo'), split('file:///C|/foo'))
 
382
            self.assertEqual(('file:///C:/', ''), split('file:///C:/'))
 
383
        else:
 
384
            self.assertEqual(('file:///', 'foo'), split('file:///foo'))
 
385
            self.assertEqual(('file:///', ''), split('file:///'))
 
386
 
 
387
        self.assertEqual(('http://host/path/to', 'foo'), split('http://host/path/to/foo'))
 
388
        self.assertEqual(('http://host/path/to', 'foo'), split('http://host/path/to/foo/'))
 
389
        self.assertEqual(('http://host/path/to/foo', ''),
 
390
            split('http://host/path/to/foo/', exclude_trailing_slash=False))
 
391
        self.assertEqual(('http://host/', 'path'), split('http://host/path'))
 
392
        self.assertEqual(('http://host/', ''), split('http://host/'))
 
393
        self.assertEqual(('http://host', ''), split('http://host'))
 
394
        self.assertEqual(('http:///nohost', 'path'), split('http:///nohost/path'))
 
395
 
 
396
        self.assertEqual(('random+scheme://user:pass@ahost:port/', 'path'),
 
397
            split('random+scheme://user:pass@ahost:port/path'))
 
398
        self.assertEqual(('random+scheme://user:pass@ahost:port/', 'path'),
 
399
            split('random+scheme://user:pass@ahost:port/path/'))
 
400
        self.assertEqual(('random+scheme://user:pass@ahost:port/', ''),
 
401
            split('random+scheme://user:pass@ahost:port/'))
 
402
 
 
403
        # relative paths
 
404
        self.assertEqual(('path/to', 'foo'), split('path/to/foo'))
 
405
        self.assertEqual(('path/to', 'foo'), split('path/to/foo/'))
 
406
        self.assertEqual(('path/to/foo', ''),
 
407
            split('path/to/foo/', exclude_trailing_slash=False))
 
408
        self.assertEqual(('path/..', 'foo'), split('path/../foo'))
 
409
        self.assertEqual(('../path', 'foo'), split('../path/foo'))
 
410
 
 
411
    def test_win32_strip_local_trailing_slash(self):
 
412
        strip = urlutils._win32_strip_local_trailing_slash
 
413
        self.assertEqual('file://', strip('file://'))
 
414
        self.assertEqual('file:///', strip('file:///'))
 
415
        self.assertEqual('file:///C', strip('file:///C'))
 
416
        self.assertEqual('file:///C:', strip('file:///C:'))
 
417
        self.assertEqual('file:///d|', strip('file:///d|'))
 
418
        self.assertEqual('file:///C:/', strip('file:///C:/'))
 
419
        self.assertEqual('file:///C:/a', strip('file:///C:/a/'))
 
420
 
 
421
    def test_strip_trailing_slash(self):
 
422
        sts = urlutils.strip_trailing_slash
 
423
        if sys.platform == 'win32':
 
424
            self.assertEqual('file:///C|/', sts('file:///C|/'))
 
425
            self.assertEqual('file:///C:/foo', sts('file:///C:/foo'))
 
426
            self.assertEqual('file:///C|/foo', sts('file:///C|/foo/'))
 
427
        else:
 
428
            self.assertEqual('file:///', sts('file:///'))
 
429
            self.assertEqual('file:///foo', sts('file:///foo'))
 
430
            self.assertEqual('file:///foo', sts('file:///foo/'))
 
431
 
 
432
        self.assertEqual('http://host/', sts('http://host/'))
 
433
        self.assertEqual('http://host/foo', sts('http://host/foo'))
 
434
        self.assertEqual('http://host/foo', sts('http://host/foo/'))
 
435
 
 
436
        # No need to fail just because the slash is missing
 
437
        self.assertEqual('http://host', sts('http://host'))
 
438
        # TODO: jam 20060502 Should this raise InvalidURL?
 
439
        self.assertEqual('file://', sts('file://'))
 
440
 
 
441
        self.assertEqual('random+scheme://user:pass@ahost:port/path',
 
442
            sts('random+scheme://user:pass@ahost:port/path'))
 
443
        self.assertEqual('random+scheme://user:pass@ahost:port/path',
 
444
            sts('random+scheme://user:pass@ahost:port/path/'))
 
445
        self.assertEqual('random+scheme://user:pass@ahost:port/',
 
446
            sts('random+scheme://user:pass@ahost:port/'))
 
447
 
 
448
        # Make sure relative paths work too
 
449
        self.assertEqual('path/to/foo', sts('path/to/foo'))
 
450
        self.assertEqual('path/to/foo', sts('path/to/foo/'))
 
451
        self.assertEqual('../to/foo', sts('../to/foo/'))
 
452
        self.assertEqual('path/../foo', sts('path/../foo/'))
 
453
 
 
454
    def test_unescape_for_display_utf8(self):
 
455
        # Test that URLs are converted to nice unicode strings for display
 
456
        def test(expected, url, encoding='utf-8'):
 
457
            disp_url = urlutils.unescape_for_display(url, encoding=encoding)
 
458
            self.assertIsInstance(disp_url, unicode)
 
459
            self.assertEqual(expected, disp_url)
 
460
 
 
461
        test('http://foo', 'http://foo')
 
462
        if sys.platform == 'win32':
 
463
            test('C:/foo/path', 'file:///C|/foo/path')
 
464
            test('C:/foo/path', 'file:///C:/foo/path')
 
465
        else:
 
466
            test('/foo/path', 'file:///foo/path')
 
467
 
 
468
        test('http://foo/%2Fbaz', 'http://foo/%2Fbaz')
 
469
        test(u'http://host/r\xe4ksm\xf6rg\xe5s',
 
470
             'http://host/r%C3%A4ksm%C3%B6rg%C3%A5s')
 
471
 
 
472
        # Make sure special escaped characters stay escaped
 
473
        test(u'http://host/%3B%2F%3F%3A%40%26%3D%2B%24%2C%23',
 
474
             'http://host/%3B%2F%3F%3A%40%26%3D%2B%24%2C%23')
 
475
 
 
476
        # Can we handle sections that don't have utf-8 encoding?
 
477
        test(u'http://host/%EE%EE%EE/r\xe4ksm\xf6rg\xe5s',
 
478
             'http://host/%EE%EE%EE/r%C3%A4ksm%C3%B6rg%C3%A5s')
 
479
 
 
480
        # Test encoding into output that can handle some characters
 
481
        test(u'http://host/%EE%EE%EE/r\xe4ksm\xf6rg\xe5s',
 
482
             'http://host/%EE%EE%EE/r%C3%A4ksm%C3%B6rg%C3%A5s',
 
483
             encoding='iso-8859-1')
 
484
 
 
485
        # This one can be encoded into utf8
 
486
        test(u'http://host/\u062c\u0648\u062c\u0648',
 
487
             'http://host/%d8%ac%d9%88%d8%ac%d9%88',
 
488
             encoding='utf-8')
 
489
 
 
490
        # This can't be put into 8859-1 and so stays as escapes
 
491
        test(u'http://host/%d8%ac%d9%88%d8%ac%d9%88',
 
492
             'http://host/%d8%ac%d9%88%d8%ac%d9%88',
 
493
             encoding='iso-8859-1')
 
494
 
 
495
    def test_escape(self):
 
496
        self.assertEqual('%25', urlutils.escape('%'))
 
497
        self.assertEqual('%C3%A5', urlutils.escape(u'\xe5'))
 
498
        self.assertFalse(isinstance(urlutils.escape(u'\xe5'), unicode))
 
499
 
 
500
    def test_unescape(self):
 
501
        self.assertEqual('%', urlutils.unescape('%25'))
 
502
        self.assertEqual(u'\xe5', urlutils.unescape('%C3%A5'))
 
503
 
 
504
        self.assertRaises(InvalidURL, urlutils.unescape, u'\xe5')
 
505
        self.assertRaises(InvalidURL, urlutils.unescape, '\xe5')
 
506
        self.assertRaises(InvalidURL, urlutils.unescape, '%E5')
 
507
 
 
508
    def test_escape_unescape(self):
 
509
        self.assertEqual(u'\xe5', urlutils.unescape(urlutils.escape(u'\xe5')))
 
510
        self.assertEqual('%', urlutils.unescape(urlutils.escape('%')))
 
511
 
 
512
    def test_relative_url(self):
 
513
        def test(expected, base, other):
 
514
            result = urlutils.relative_url(base, other)
 
515
            self.assertEqual(expected, result)
 
516
            
 
517
        test('a', 'http://host/', 'http://host/a')
 
518
        test('http://entirely/different', 'sftp://host/branch',
 
519
                    'http://entirely/different')
 
520
        test('../person/feature', 'http://host/branch/mainline',
 
521
                    'http://host/branch/person/feature')
 
522
        test('..', 'http://host/branch', 'http://host/')
 
523
        test('http://host2/branch', 'http://host1/branch', 'http://host2/branch')
 
524
        test('.', 'http://host1/branch', 'http://host1/branch')
 
525
        test('../../../branch/2b', 'file:///home/jelmer/foo/bar/2b',
 
526
                    'file:///home/jelmer/branch/2b')
 
527
        test('../../branch/2b', 'sftp://host/home/jelmer/bar/2b',
 
528
                    'sftp://host/home/jelmer/branch/2b')
 
529
        test('../../branch/feature/%2b', 'http://host/home/jelmer/bar/%2b',
 
530
                    'http://host/home/jelmer/branch/feature/%2b')
 
531
        test('../../branch/feature/2b', 'http://host/home/jelmer/bar/2b/', 
 
532
                    'http://host/home/jelmer/branch/feature/2b')
 
533
        # relative_url should preserve a trailing slash
 
534
        test('../../branch/feature/2b/', 'http://host/home/jelmer/bar/2b/',
 
535
                    'http://host/home/jelmer/branch/feature/2b/')
 
536
        test('../../branch/feature/2b/', 'http://host/home/jelmer/bar/2b',
 
537
                    'http://host/home/jelmer/branch/feature/2b/')
 
538
 
 
539
        # TODO: treat http://host as http://host/
 
540
        #       relative_url is typically called from a branch.base or
 
541
        #       transport.base which always ends with a /
 
542
        #test('a', 'http://host', 'http://host/a')
 
543
        test('http://host/a', 'http://host', 'http://host/a')
 
544
        #test('.', 'http://host', 'http://host/')
 
545
        test('http://host/', 'http://host', 'http://host/')
 
546
        #test('.', 'http://host/', 'http://host')
 
547
        test('http://host', 'http://host/', 'http://host')
 
548
 
 
549
        # On Windows file:///C:/path/to and file:///D:/other/path
 
550
        # should not use relative url over the non-existent '/' directory.
 
551
        if sys.platform == 'win32':
 
552
            # on the same drive
 
553
            test('../../other/path',
 
554
                'file:///C:/path/to', 'file:///C:/other/path')
 
555
            #~next two tests is failed, i.e. urlutils.relative_url expects
 
556
            #~to see normalized file URLs?
 
557
            #~test('../../other/path',
 
558
            #~    'file:///C:/path/to', 'file:///c:/other/path')
 
559
            #~test('../../other/path',
 
560
            #~    'file:///C:/path/to', 'file:///C|/other/path')
 
561
 
 
562
            # check UNC paths too
 
563
            test('../../other/path',
 
564
                'file://HOST/base/path/to', 'file://HOST/base/other/path')
 
565
            # on different drives
 
566
            test('file:///D:/other/path',
 
567
                'file:///C:/path/to', 'file:///D:/other/path')
 
568
            # TODO: strictly saying in UNC path //HOST/base is full analog
 
569
            # of drive letter for hard disk, and this situation is also
 
570
            # should be exception from rules. [bialix 20071221]
 
571
 
 
572
 
 
573
class TestCwdToURL(TestCaseInTempDir):
    """Test that local_path_to_url works based on the cwd"""

    def test_dot(self):
        # This test will fail if getcwd is not ascii
        subdir = 'mytest'
        os.mkdir(subdir)
        os.chdir(subdir)

        # '.' must resolve to the directory we just entered.
        self.assertEndsWith(urlutils.local_path_to_url('.'), '/mytest')

    def test_non_ascii(self):
        if win32utils.winver == 'Windows 98':
            raise TestSkipped('Windows 98 cannot handle unicode filenames')

        unicode_dir = u'dod\xe9'
        try:
            os.mkdir(unicode_dir)
        except UnicodeError:
            raise TestSkipped('cannot create unicode directory')

        os.chdir(unicode_dir)

        # On Mac OSX this directory is actually:
        #   u'/dode\u0301' => '/dode\xcc\x81
        # but we should normalize it back to
        #   u'/dod\xe9' => '/dod\xc3\xa9'
        self.assertEndsWith(urlutils.local_path_to_url('.'), '/dod%C3%A9')
 
601
 
 
602
 
 
603
class TestDeriveToLocation(TestCase):
    """Test that the mapping of FROM_LOCATION to TO_LOCATION works."""

    def test_to_locations_derived_from_paths(self):
        # Every one of these local paths must derive to "bar".
        for from_location in ("bar", "../bar", "/foo/bar", "c:/foo/bar",
                              "c:bar"):
            self.assertEqual("bar", urlutils.derive_to_location(from_location))

    def test_to_locations_derived_from_urls(self):
        # Each (expected, url) pair gives the location derived from a URL.
        cases = [
            ("bar", "http://foo/bar"),
            ("bar", "bzr+ssh://foo/bar"),
            ("foo-bar", "lp:foo-bar"),
            ]
        for expected, from_location in cases:
            self.assertEqual(expected,
                             urlutils.derive_to_location(from_location))
 
619
 
 
620
 
 
621
class TestRebaseURL(TestCase):
    """Test the behavior of rebase_url."""

    def test_non_relative(self):
        # For these two non-relative inputs rebase_url must return the
        # first argument unchanged.
        for url in ('file://foo', '/foo'):
            rebased = urlutils.rebase_url(url, 'file://foo', 'file://foo/bar')
            self.assertEqual(url, rebased)

    def test_different_ports(self):
        # Bases that differ in port cannot be rebased between.
        err = self.assertRaises(InvalidRebaseURLs, urlutils.rebase_url,
                                'foo', 'http://bar:80', 'http://bar:81')
        expected_message = (
            "URLs differ by more than path: 'http://bar:80' and 'http://bar:81'")
        self.assertEqual(str(err), expected_message)

    def test_different_hosts(self):
        # Bases that differ in host cannot be rebased between.
        err = self.assertRaises(InvalidRebaseURLs, urlutils.rebase_url,
                                'foo', 'http://bar', 'http://baz')
        expected_message = (
            "URLs differ by more than path: 'http://bar' and 'http://baz'")
        self.assertEqual(str(err), expected_message)

    def test_different_protocol(self):
        # Bases that differ in scheme cannot be rebased between.
        err = self.assertRaises(InvalidRebaseURLs, urlutils.rebase_url,
                                'foo', 'http://bar', 'ftp://bar')
        expected_message = (
            "URLs differ by more than path: 'http://bar' and 'ftp://bar'")
        self.assertEqual(str(err), expected_message)

    def test_rebase_success(self):
        # Each case is (expected, url, old_base, new_base).
        cases = [
            ('../bar', 'bar', 'http://baz/', 'http://baz/qux'),
            ('qux/bar', 'bar', 'http://baz/qux', 'http://baz/'),
            ('.', 'foo', 'http://bar/', 'http://bar/foo/'),
            ('qux/bar', '../bar', 'http://baz/qux/foo', 'http://baz/'),
            ]
        for expected, url, old_base, new_base in cases:
            self.assertEqual(expected,
                             urlutils.rebase_url(url, old_base, new_base))

    def test_determine_relative_path(self):
        # Each case is (expected, from_path, to_path).
        cases = [
            ('../../baz/bar', '/qux/quxx', '/baz/bar'),
            ('..', '/bar/baz', '/bar'),
            ('baz', '/bar', '/bar/baz'),
            ('.', '/bar', '/bar'),
            ]
        for expected, from_path, to_path in cases:
            self.assertEqual(
                expected,
                urlutils.determine_relative_path(from_path, to_path))