1
# Copyright (C) 2005 Canonical Ltd
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11
# GNU General Public License for more details.
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17
"""Test that various operations work in a non-ASCII environment."""
21
from unicodedata import normalize
23
from bzrlib import osutils
24
from bzrlib.osutils import pathjoin
25
from bzrlib.tests import TestCase, TestCaseWithTransport, TestSkipped
26
from bzrlib.workingtree import WorkingTree
29
class NonAsciiTest(TestCaseWithTransport):
31
def test_add_in_nonascii_branch(self):
32
"""Test adding in a non-ASCII branch."""
35
wt = self.make_branch_and_tree(br_dir)
36
except UnicodeEncodeError:
37
raise TestSkipped("filesystem can't accomodate nonascii names")
39
file(pathjoin(br_dir, "a"), "w").write("hello")
40
wt.add(["a"], ["a-id"])
44
a_circle_d = u'a\u030a'
48
z_umlat_d = u'Z\u030c'
51
class TestNormalization(TestCase):
52
"""Verify that we have our normalizations correct."""
54
def test_normalize(self):
55
self.assertEqual(a_circle_d, normalize('NFKD', a_circle_c))
56
self.assertEqual(a_circle_c, normalize('NFKC', a_circle_d))
57
self.assertEqual(a_dots_d, normalize('NFKD', a_dots_c))
58
self.assertEqual(a_dots_c, normalize('NFKC', a_dots_d))
59
self.assertEqual(z_umlat_d, normalize('NFKD', z_umlat_c))
60
self.assertEqual(z_umlat_c, normalize('NFKC', z_umlat_d))
63
class NormalizedFilename(TestCaseWithTransport):
64
"""Test normalized_filename and associated helpers"""
66
def test__accessible_normalized_filename(self):
67
anf = osutils._accessible_normalized_filename
68
# normalized_filename should allow plain ascii strings
69
# not just unicode strings
70
self.assertEqual((u'ascii', True), anf('ascii'))
71
self.assertEqual((a_circle_c, True), anf(a_circle_c))
72
self.assertEqual((a_circle_c, True), anf(a_circle_d))
73
self.assertEqual((a_dots_c, True), anf(a_dots_c))
74
self.assertEqual((a_dots_c, True), anf(a_dots_d))
75
self.assertEqual((z_umlat_c, True), anf(z_umlat_c))
76
self.assertEqual((z_umlat_c, True), anf(z_umlat_d))
78
def test__inaccessible_normalized_filename(self):
79
inf = osutils._inaccessible_normalized_filename
80
# normalized_filename should allow plain ascii strings
81
# not just unicode strings
82
self.assertEqual((u'ascii', True), inf('ascii'))
83
self.assertEqual((a_circle_c, True), inf(a_circle_c))
84
self.assertEqual((a_circle_c, False), inf(a_circle_d))
85
self.assertEqual((a_dots_c, True), inf(a_dots_c))
86
self.assertEqual((a_dots_c, False), inf(a_dots_d))
87
self.assertEqual((z_umlat_c, True), inf(z_umlat_c))
88
self.assertEqual((z_umlat_c, False), inf(z_umlat_d))
90
def test_functions(self):
91
if osutils.normalizes_filenames():
92
self.assertEqual(osutils.normalized_filename,
93
osutils._accessible_normalized_filename)
95
self.assertEqual(osutils.normalized_filename,
96
osutils._inaccessible_normalized_filename)
98
def test_platform(self):
99
# With FAT32 and certain encodings on win32
100
# a_circle_c and a_dots_c actually map to the same file
101
# adding a suffix kicks in the 'preserving but insensitive'
102
# route, and maintains the right files
103
files = [a_circle_c+'.1', a_dots_c+'.2', z_umlat_c+'.3']
105
self.build_tree(files)
107
raise TestSkipped("filesystem cannot create unicode files")
109
if sys.platform == 'darwin':
110
expected = sorted([a_circle_d+'.1', a_dots_d+'.2', z_umlat_d+'.3'])
112
expected = sorted(files)
114
present = sorted(os.listdir(u'.'))
115
self.assertEqual(expected, present)
117
def test_access_normalized(self):
118
# We should always be able to access files created with
119
# normalized filenames
120
# With FAT32 and certain encodings on win32
121
# a_circle_c and a_dots_c actually map to the same file
122
# adding a suffix kicks in the 'preserving but insensitive'
123
# route, and maintains the right files
124
files = [a_circle_c+'.1', a_dots_c+'.2', z_umlat_c+'.3']
126
self.build_tree(files, line_endings='native')
128
raise TestSkipped("filesystem cannot create unicode files")
131
# We should get an exception if we can't open the file at
133
path, can_access = osutils.normalized_filename(fname)
135
self.assertEqual(path, fname)
136
self.assertTrue(can_access)
141
shouldbe = 'contents of %s%s' % (path.encode('utf8'),
146
self.assertEqual(shouldbe, actual,
147
'contents of %r is incorrect: %r != %r'
148
% (path, shouldbe, actual))
150
def test_access_non_normalized(self):
151
# Sometimes we can access non-normalized files by their normalized
152
# path, verify that normalized_filename returns the right info
153
files = [a_circle_d+'.1', a_dots_d+'.2', z_umlat_d+'.3']
156
self.build_tree(files)
158
raise TestSkipped("filesystem cannot create unicode files")
161
# We should get an exception if we can't open the file at
163
path, can_access = osutils.normalized_filename(fname)
165
self.assertNotEqual(path, fname)
167
# We should always be able to access them from the name
168
# they were created with
169
f = open(fname, 'rb')
172
# And normalized_filename sholud tell us correctly if we can
173
# access them by an alternate name
178
self.assertRaises(IOError, open, path, 'rb')