~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/benchmarks/bench_cache_utf8.py

Committer: Aaron Bentley
Date: 2006-08-17 00:15:23 UTC
mfrom: (1934 +trunk)
mto: (2100.3.5 by-reference-trees) (1731.2.8 nested-trees)
mto: This revision was merged to the branch mainline in revision 2078.
Revision ID: aaron.bentley@utoronto.ca-20060817001523-f23f3e0a6260dbc0

merge from bzr.dev

files added:
bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/cache_utf8.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_version.py

bzrlib/version.py

files renamed:
bzrlib/tests/repository_implementations/test_revprops.py => bzrlib/tests/repository_implementations/test_revision.py

files modified:
.bzrignore

Makefile

NEWS

bzrlib/__init__.py

bzrlib/add.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bzrdir.py

bzrlib/commands.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/help.py

bzrlib/knit.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/revision.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_xml.py

bzrlib/transport/__init__.py

bzrlib/xml5.py

doc/tutorial.txt

setup.py

tools/doc_generate/autodoc_man.py

Show diffs side-by-side

added added

removed removed

bzrlib/benchmarks/bench_cache_utf8.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License version 2 as published by

# the Free Software Foundation.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Tests for encoding performance."""

from bzrlib import (

cache_utf8,

osutils,

)

from bzrlib.benchmarks import Benchmark

_normal_revision_id = (u'john@arbash-meinel.com-20060801200018'

u'-cafa6272d9b8cac4')

_unicode_revision_id = (u'\u062c\u0648\u062c\u0648@\xe5rbash-meinel.com-'

u'\xb5\xb5\xb5-20060801200018-cafa6272d9b8cac4')

_normal_revision_id_utf8 = _normal_revision_id.encode('utf-8')

_unicode_revision_id_utf8 = _unicode_revision_id.encode('utf-8')

class EncodingBenchmark(Benchmark):
    """Benchmarks for turning revision ids into UTF-8.

    Every scenario exists twice: once calling the string's own ``encode``
    method and once (``*_cached``) going through ``cache_utf8.encode``.
    """

    def setUp(self):
        """Run the base setUp and clear the encoding cache before and after."""
        super(EncodingBenchmark, self).setUp()
        # Make sure we start and end with a clean cache
        cache_utf8.clear_encoding_cache()
        self.addCleanup(cache_utf8.clear_encoding_cache)

    def encode_1M(self, revision_id):
        """Encode the given revision id 1 million times"""
        # In a real kernel tree there are 7.7M lines of code
        # so the initial import actually has to encode a revision
        # id to store annotated lines one time for every line.
        for i in xrange(1000000):
            revision_id.encode('utf8')

    def encode_cached_1M(self, revision_id):
        """Encode the given revision id 1 million times using the cache"""
        # Bind the function to a local once so the loop does not repeat the
        # module attribute lookup on every iteration.
        encode = cache_utf8.encode
        for i in xrange(1000000):
            encode(revision_id)

    def encode_multi(self, revision_list, count):
        """Encode each entry in the list count times"""
        for i in xrange(count):
            for revision_id in revision_list:
                revision_id.encode('utf-8')

    def encode_cached_multi(self, revision_list, count):
        """Encode each entry in the list count times using the cache"""
        encode = cache_utf8.encode
        for i in xrange(count):
            for revision_id in revision_list:
                encode(revision_id)

    def test_encode_1_by_1M_ascii(self):
        """Test encoding a single ASCII revision id 1 million times."""
        self.time(self.encode_1M, _normal_revision_id)

    def test_encode_1_by_1M_ascii_cached(self):
        """Test cached encoding of a single ASCII revision id 1 million times."""
        self.time(self.encode_cached_1M, _normal_revision_id)

    def test_encode_1_by_1M_ascii_str(self):
        """Test encoding a plain-str revision id 1 million times."""
        # We have places that think they have a unicode revision id
        # but actually, they have a plain string. So .encode(utf8)
        # actually has to decode from ascii, and then encode into utf8
        self.time(self.encode_1M, str(_normal_revision_id))

    def test_encode_1_by_1M_ascii_str_cached(self):
        """Test cached encoding of a plain-str revision id 1 million times."""
        self.time(self.encode_cached_1M, str(_normal_revision_id))

    def test_encode_1_by_1M_unicode(self):
        """Test encoding a single non-ASCII revision id 1 million times."""
        self.time(self.encode_1M, _unicode_revision_id)

    def test_encode_1_by_1M_unicode_cached(self):
        """Test cached encoding of a non-ASCII revision id 1 million times."""
        self.time(self.encode_cached_1M, _unicode_revision_id)

    def test_encode_1k_by_1k_ascii(self):
        """Test encoding 1000 ASCII revision ids 1000 times each"""
        revisions = [unicode(osutils.rand_chars(60)) for x in xrange(1000)]
        self.time(self.encode_multi, revisions, 1000)

    def test_encode_1k_by_1k_ascii_cached(self):
        """Test cached encoding of 1000 ASCII revision ids 1000 times each"""
        revisions = [unicode(osutils.rand_chars(60)) for x in xrange(1000)]
        self.time(self.encode_cached_multi, revisions, 1000)

    def test_encode_1k_by_1k_unicode(self):
        """Test encoding 1000 non-ASCII revision ids 1000 times each"""
        # The prefix has to be a unicode literal: inside a plain str literal
        # Python 2 does not interpret \u escapes, which would leave the ids
        # pure ASCII and defeat the purpose of this benchmark.
        revisions = [u'\u062c\u0648\u062c\u0648' +
                     unicode(osutils.rand_chars(60)) for x in xrange(1000)]
        self.time(self.encode_multi, revisions, 1000)

    def test_encode_1k_by_1k_unicode_cached(self):
        """Test cached encoding of 1000 non-ASCII revision ids 1000 times each"""
        # See test_encode_1k_by_1k_unicode for why the u'' prefix is needed.
        revisions = [u'\u062c\u0648\u062c\u0648' +
                     unicode(osutils.rand_chars(60)) for x in xrange(1000)]
        self.time(self.encode_cached_multi, revisions, 1000)

116

117

118

class DecodingBenchmarks(Benchmark):
    """Benchmarks for turning UTF-8 revision ids back into unicode.

    Every scenario exists twice: once calling the byte string's own
    ``decode`` method and once (``*_cached``) going through
    ``cache_utf8.decode``.
    """

    def setUp(self):
        """Run the base setUp and clear the encoding cache before and after."""
        super(DecodingBenchmarks, self).setUp()
        # Make sure we start and end with a clean cache
        cache_utf8.clear_encoding_cache()
        self.addCleanup(cache_utf8.clear_encoding_cache)

    def decode_1M(self, revision_id):
        """Decode the given UTF-8 revision id 1 million times"""
        for i in xrange(1000000):
            revision_id.decode('utf8')

    def decode_cached_1M(self, revision_id):
        """Decode the given UTF-8 revision id 1 million times using the cache"""
        # Bind the function to a local once so the loop does not repeat the
        # module attribute lookup on every iteration.
        decode = cache_utf8.decode
        for i in xrange(1000000):
            decode(revision_id)

    def decode_multi(self, revision_list, count):
        """Decode each entry in the list count times"""
        for i in xrange(count):
            for revision_id in revision_list:
                revision_id.decode('utf-8')

    def decode_cached_multi(self, revision_list, count):
        """Decode each entry in the list count times using the cache"""
        decode = cache_utf8.decode
        for i in xrange(count):
            for revision_id in revision_list:
                decode(revision_id)

    def test_decode_1_by_1M_ascii(self):
        """Test decoding a single ASCII revision id 1 million times."""
        self.time(self.decode_1M, _normal_revision_id_utf8)

    def test_decode_1_by_1M_ascii_cached(self):
        """Test cached decoding of a single ASCII revision id 1 million times."""
        self.time(self.decode_cached_1M, _normal_revision_id_utf8)

    def test_decode_1_by_1M_unicode(self):
        """Test decoding a single non-ASCII revision id 1 million times."""
        self.time(self.decode_1M, _unicode_revision_id_utf8)

    def test_decode_1_by_1M_unicode_cached(self):
        """Test cached decoding of a non-ASCII revision id 1 million times."""
        self.time(self.decode_cached_1M, _unicode_revision_id_utf8)

    def test_decode_1k_by_1k_ascii(self):
        """Test decoding 1000 ASCII revision ids 1000 times each"""
        revisions = [osutils.rand_chars(60) for x in xrange(1000)]
        self.time(self.decode_multi, revisions, 1000)

    def test_decode_1k_by_1k_ascii_cached(self):
        """Test cached decoding of 1000 ASCII revision ids 1000 times each"""
        revisions = [osutils.rand_chars(60) for x in xrange(1000)]
        self.time(self.decode_cached_multi, revisions, 1000)

    def test_decode_1k_by_1k_unicode(self):
        """Test decoding 1000 non-ASCII revision ids 1000 times each"""
        # The prefix has to be a unicode literal: inside a plain str literal
        # Python 2 does not interpret \u escapes, which would leave the
        # encoded ids pure ASCII and defeat the purpose of this benchmark.
        revisions = [(u'\u062c\u0648\u062c\u0648' +
                      unicode(osutils.rand_chars(60))).encode('utf8')
                     for x in xrange(1000)]
        self.time(self.decode_multi, revisions, 1000)

    def test_decode_1k_by_1k_unicode_cached(self):
        """Test cached decoding of 1000 non-ASCII revision ids 1000 times each"""
        # See test_decode_1k_by_1k_unicode for why the u'' prefix is needed.
        revisions = [(u'\u062c\u0648\u062c\u0648' +
                      unicode(osutils.rand_chars(60))).encode('utf8')
                     for x in xrange(1000)]
        self.time(self.decode_cached_multi, revisions, 1000)

Older »