~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/tests/EncodingAdapter.py

Committer: John Arbash Meinel
Date: 2006-04-25 15:05:42 UTC
mfrom: (1185.85.85 bzr-encoding)
mto: This revision was merged to the branch mainline in revision 1752.
Revision ID: john@arbash-meinel.com-20060425150542-c7b518dca9928691

[merge] the old bzr-encoding changes, reparenting them on bzr.dev

files added:
bzrlib/tests/EncodingAdapter.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_log.py.moved

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_status.py.moved

files modified:
bzrlib/add.py

bzrlib/builtins.py

bzrlib/commands.py

bzrlib/config.py

bzrlib/errors.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/test_log.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/http/__init__.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/workingtree.py

Show diffs side-by-side

added added

removed removed

bzrlib/tests/EncodingAdapter.py

# -*- coding: utf-8 -*-

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""\

Adapter for running test cases against multiple encodings.

"""

from copy import deepcopy

from bzrlib.tests import TestSuite

# Sample non-ASCII strings, shared by the per-encoding fixtures defined
# further down in this module.

# The micro sign, used as the SI prefix for one millionth (1/1000000)
_mu = u'\xb5'

# A personal name containing U+00E5 (a with ring above); Swedish?
_erik = u'Erik B\xe5gfors'

# Swedish 'räksmörgås' means shrimp sandwich
_shrimp_sandwich = u'r\xe4ksm\xf6rg\xe5s'

# Arabic, probably only Unicode encodings can handle this one
_juju = u'\u062c\u0648\u062c\u0648'

# iso-8859-1 alternative for juju
_juju_alt = u'j\xfbj\xfa'

# Russian, 'Alexander' in Russian
_alexander = u'\u0410\u043b\u0435\u043a\u0441\u0430\u043d\u0434\u0440'

# The first four letters of _alexander. No idea if this means anything on
# its own, but we need another string.
_alex = u'\u0410\u043b\u0435\u043a'

# Kanji
# It is a kanji sequence for nihonjin, or Japanese in English.
# '\u4eba' being person, '\u65e5' sun and '\u672c' origin. Ie,
# sun-origin-person, 'native from the land where the sun rises'. Note, I'm
# not a fluent speaker, so this is just my crude breakdown.
# Wouter van Heyst
_nihonjin = u'\u65e5\u672c\u4eba'

# Czech
# It's what is usually used for showing how fonts look, because it contains
# most accented characters, ie. in places where English speakers use 'Quick
# brown fox jumped over a lazy dog'. The literal translation of the Czech
# version would be something like 'Yellow horse groaned devilish codes'.
# Actually originally the last word used to be 'ódy' (odes). The 'k' was
# added as a pun when using the sentence to check whether one has properly
# set encoding.
_yellow_horse = (u'\u017dlu\u0165ou\u010dk\xfd k\u016f\u0148'
u' \xfap\u011bl \u010f\xe1belsk\xe9 k\xf3dy')

# The first word of _yellow_horse
_yellow = u'\u017dlu\u0165ou\u010dk\xfd'

# ASCII 'Some' followed by three accented letters that also occur in
# _yellow_horse; not a real word as far as this file shows.
_someone = u'Some\u016f\u0148\u011b'

# The tail of _yellow (everything after its first three characters)
_something = u'\u0165ou\u010dk\xfd'

# Hebrew
# Shalom -> 'hello' or 'peace', used as a common greeting
_shalom = u'\u05e9\u05dc\u05d5\u05dd'

class EncodingTestAdapter(object):
    """Expand one test into a suite with one copy per encoding fixture.

    This is similar to bzrlib.transport.TransportTestProviderAdapter.

    For every entry in ``_encodings`` the test is deep-copied, and the copy
    receives two extra attributes: ``encoding`` (the codec name) and
    ``info`` (a dict of sample strings for the keys 'committer', 'message',
    'filename' and 'directory').  The copy's id() is also replaced so that
    it names the encoding, which makes each variant easy to identify.
    """

    # Each entry is (encoding name, permutation number, sample strings).
    # A permutation number of 0 means the encoding appears only once, so
    # the number is left out of the generated test id.
    _encodings = [
        # Permutation 1 of utf-8
        ('utf-8', 1, {
            'committer': _erik,
            'message': _yellow_horse,
            'filename': _shrimp_sandwich,
            'directory': _nihonjin,
        }),
        # Permutation 2 of utf-8
        ('utf-8', 2, {
            'committer': _alexander,
            'message': u'Testing ' + _mu,
            'filename': _shalom,
            'directory': _juju,
        }),
        ('iso-8859-1', 0, {
            'committer': _erik,
            'message': u'Testing ' + _mu,
            'filename': _juju_alt,
            'directory': _shrimp_sandwich,
        }),
        ('iso-8859-2', 0, {
            'committer': _someone,
            'message': _yellow_horse,
            'filename': _yellow,
            'directory': _something,
        }),
        ('cp1251', 0, {
            'committer': _alexander,
            'message': u'Testing ' + _mu,
            'filename': _alex,
            'directory': _alex + 'dir',
        }),
    ]

    def adapt(self, test):
        """Return a TestSuite holding one copy of `test` per encoding.

        :param test: The test to replicate; it is deep-copied, so the
            object passed in is never modified.
        :return: A TestSuite with one adapted copy for each entry in
            ``_encodings``, in the order they are listed there.
        """
        def constant(value):
            # Build a zero-argument callable that always yields `value`;
            # used to pin each copy's id() to a precomputed string.
            return lambda: value

        suite = TestSuite()
        for encoding, count, info in self._encodings:
            variant = deepcopy(test)
            variant.encoding = encoding
            variant.info = info
            # The original id is read once, here, before id is replaced.
            base_id = variant.id()
            if count:
                variant_id = "%s(%s,%s)" % (base_id, encoding, count)
            else:
                variant_id = "%s(%s)" % (base_id, encoding)
            variant.id = constant(variant_id)
            suite.addTest(variant)
        return suite

122

123

Older »