~bzr-pqm/bzr/bzr.dev

Committer: Patch Queue Manager
Date: 2011-12-19 14:40:24 UTC
mfrom: (6379.6.8 feature-absolute-imports)
Revision ID: pqm@pqm.ubuntu.com-20111219144024-awadgqxn2fugwr7m

(jelmer) Use the absolute_import feature everywhere in bzrlib,
and add a source test to make sure it's used everywhere. (Jelmer Vernooij)

files added:
bzrlib/plugins/po_merge

bzrlib/plugins/po_merge/README

bzrlib/plugins/po_merge/__init__.py

bzrlib/plugins/po_merge/po_merge.py

bzrlib/plugins/po_merge/tests

bzrlib/plugins/po_merge/tests/__init__.py

bzrlib/plugins/po_merge/tests/test_po_merge.py

bzrlib/tests/blackbox/test_mkdir.py

bzrlib/tests/test_vf_search.py

bzrlib/vf_search.py

doc/developers/new-config-rationale.txt

files removed:
bzrlib/help_topics/en/location-alias.txt

files modified:
Makefile

bzrlib/__init__.py

bzrlib/_annotator_py.py

bzrlib/_btree_serializer_py.py

bzrlib/_chk_map_py.py

bzrlib/_chunks_to_lines_py.py

bzrlib/_dirstate_helpers_py.py

bzrlib/_groupcompress_py.py

bzrlib/_knit_load_data_py.py

bzrlib/_known_graph_py.py

bzrlib/_patiencediff_py.py

bzrlib/_readdir_py.py

bzrlib/_rio_py.py

bzrlib/_static_tuple_py.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/api.py

bzrlib/atomicfile.py

bzrlib/bencode.py

bzrlib/bisect_multi.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzr_distutils.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/cethread.py

bzrlib/check.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/chunk_writer.py

bzrlib/clean_tree.py

bzrlib/cleanup.py

bzrlib/cmd_test_script.py

bzrlib/cmd_version_info.py

bzrlib/cmdline.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/commit_signature_commands.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/controldir.py

bzrlib/counted_lock.py

bzrlib/crash.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc_generate/__init__.py

bzrlib/doc_generate/autodoc_bash_completion.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/doc_generate/builders/__init__.py

bzrlib/doc_generate/builders/texinfo.py

bzrlib/doc_generate/conf.py

bzrlib/doc_generate/writers/__init__.py

bzrlib/doc_generate/writers/texinfo.py

bzrlib/email_message.py

bzrlib/errors.py

bzrlib/estimate_compressed_size.py

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/export_pot.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/fifo_cache.py

bzrlib/filter_tree.py

bzrlib/filters/__init__.py

bzrlib/filters/eol.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/debug-flags.txt

bzrlib/hooks.py

bzrlib/i18n.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/inventory_delta.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/library_state.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/lsprof.py

bzrlib/mail_client.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/mergetools.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/pack.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/bash_completion/__init__.py

bzrlib/plugins/bash_completion/bashcomp.py

bzrlib/plugins/changelog_merge/__init__.py

bzrlib/plugins/changelog_merge/changelog_merge.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/account.py

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/lp_api_lite.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_propose.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/plugins/news_merge/__init__.py

bzrlib/plugins/news_merge/news_merge.py

bzrlib/plugins/news_merge/parser.py

bzrlib/plugins/weave_fmt/__init__.py

bzrlib/plugins/weave_fmt/branch.py

bzrlib/plugins/weave_fmt/bzrdir.py

bzrlib/plugins/weave_fmt/repository.py

bzrlib/plugins/weave_fmt/test_bzrdir.py

bzrlib/plugins/weave_fmt/test_repository.py

bzrlib/plugins/weave_fmt/test_workingtree.py

bzrlib/plugins/weave_fmt/workingtree.py

bzrlib/plugins/weave_fmt/xml4.py

bzrlib/progress.py

bzrlib/push.py

bzrlib/pyutils.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/recordcounter.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/rename_map.py

bzrlib/repofmt/__init__.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitpack_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/rules.py

bzrlib/send.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/packrepository.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/signals.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/static_tuple.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/strace.py

bzrlib/switch.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_config.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_pack.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_rmbranch.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/features.py

bzrlib/tests/fixtures.py

bzrlib/tests/http_server.py

bzrlib/tests/matchers.py

bzrlib/tests/per_branch/test_create_checkout.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_controldir/test_controldir.py

bzrlib/tests/per_controldir_colo/test_supported.py

bzrlib/tests/per_controldir_colo/test_unsupported.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_interrepository/test_fetch.py

bzrlib/tests/per_merger.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository_chk/test_supported.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_vf/test_add_inventory_by_delta.py

bzrlib/tests/per_repository_vf/test_check_reconcile.py

bzrlib/tests/per_repository_vf/test_fetch.py

bzrlib/tests/per_workingtree/test_paths2ids.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_config.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_export_pot.py

bzrlib/tests/test_features.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_import_tariff.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_matchers.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_server.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_request.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_test_server.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_xml.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/ftp/_gssapi.py

bzrlib/transport/gio_transport.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/log.py

bzrlib/transport/memory.py

bzrlib/transport/nosmart.py

bzrlib/transport/pathfilter.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/transport/trace.py

bzrlib/transport/unlistable.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/utextwrap.py

bzrlib/util/__init__.py

bzrlib/util/_bencode_py.py

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/simplemapi.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_custom.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/vf_repository.py

bzrlib/views.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_3.py

bzrlib/workingtree_4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/developers/configuration.txt

doc/developers/network-protocol.txt

doc/developers/plans.txt

doc/en/release-notes/bzr-2.4.txt

doc/en/release-notes/bzr-2.5.txt

doc/en/whats-new/whats-new-in-2.5.txt

po/bzr.pot

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/xml8.py

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

from __future__ import absolute_import

import cStringIO

import re

from bzrlib import (

cache_utf8,

errors,

inventory,

lazy_regex,

revision as _mod_revision,

trace,

Element,

SubElement,

XMLSerializer,

encode_and_escape,

escape_invalid_chars,

get_utf8_or_ascii,

serialize_inventory_flat,

unpack_inventory_entry,

unpack_inventory_flat,

)

from bzrlib.inventory import InventoryEntry

from bzrlib.revision import Revision

from bzrlib.errors import BzrError

_utf8_re = None

_unicode_re = None

_xml_escape_map = {

"&":'&amp;',

"'":"&apos;", # FIXME: overkill

"\"":"&quot;",

"<":"&lt;",

">":"&gt;",

}

_xml_unescape_map = {

'apos':"'",

'quot':'"',

return unichr(int(code[1:])).encode('utf8')

_unescape_re = None

_unescape_re = lazy_regex.lazy_compile('\&([^;]*);')

def _unescape_xml(data):

"""Unescape predefined XML entities in a string of data."""

global _unescape_re

if _unescape_re is None:

_unescape_re = re.compile('\&([^;]*);')

return _unescape_re.sub(_unescaper, data)

def _ensure_utf8_re():

"""Make sure the _utf8_re and _unicode_re regexes have been compiled."""

global _utf8_re, _unicode_re

if _utf8_re is None:

_utf8_re = re.compile('[&<>\'\"]|[\x80-\xff]+')

if _unicode_re is None:

_unicode_re = re.compile(u'[&<>\'\"\u0080-\uffff]')

def _unicode_escape_replace(match, _map=_xml_escape_map):

"""Replace a string of non-ascii, non XML safe characters with their escape

This will escape both Standard XML escapes, like <>"', etc.

As well as escaping non ascii characters, because ElementTree did.

This helps us remain compatible with older versions of bzr. We may change

our policy in the future, though.

"""

# jam 20060816 Benchmarks show that try/KeyError is faster if you

# expect the entity to rarely miss. There is about a 10% difference

# in overall time. But if you miss frequently, then if None is much

# faster. For our use case, we *rarely* have a revision id, file id

100

# or path name that is unicode. So use try/KeyError.

101

try:

102

return _map[match.group()]

103

except KeyError:

104

return "&#%d;" % ord(match.group())

105

106

107

def _utf8_escape_replace(match, _map=_xml_escape_map):

108

"""Escape utf8 characters into XML safe ones.

109

110

This uses 2 tricks. It is either escaping "standard" characters, like "&<>,

111

or it is handling characters with the high-bit set. For ascii characters,

112

we just lookup the replacement in the dictionary. For everything else, we

113

decode back into Unicode, and then use the XML escape code.

114

"""

115

try:

116

return _map[match.group()]

117

except KeyError:

118

return ''.join('&#%d;' % ord(uni_chr)

119

for uni_chr in match.group().decode('utf8'))

120

121

122

_to_escaped_map = {}

123

124

def _encode_and_escape(unicode_or_utf8_str, _map=_to_escaped_map):

125

"""Encode the string into utf8, and escape invalid XML characters"""

126

# We frequently get entities we have not seen before, so it is better

127

# to check if None, rather than try/KeyError

128

text = _map.get(unicode_or_utf8_str)

129

if text is None:

130

if unicode_or_utf8_str.__class__ is unicode:

131

# The alternative policy is to do a regular UTF8 encoding

132

# and then escape only XML meta characters.

133

# Performance is equivalent once you use cache_utf8. *However*

134

# this makes the serialized texts incompatible with old versions

135

# of bzr. So no net gain. (Perhaps the read code would handle utf8

136

# better than entity escapes, but cElementTree seems to do just fine

137

# either way)

138

text = str(_unicode_re.sub(_unicode_escape_replace,

139

unicode_or_utf8_str)) + '"'

140

else:

141

# Plain strings are considered to already be in utf-8 so we do a

142

# slightly different method for escaping.

143

text = _utf8_re.sub(_utf8_escape_replace,

144

unicode_or_utf8_str) + '"'

145

_map[unicode_or_utf8_str] = text

146

return text

147

148

149

def _get_utf8_or_ascii(a_str,

150

_encode_utf8=cache_utf8.encode,

151

_get_cached_ascii=cache_utf8.get_cached_ascii):

152

"""Return a cached version of the string.

153

154

cElementTree will return a plain string if the XML is plain ascii. It only

155

returns Unicode when it needs to. We want to work in utf-8 strings. So if

156

cElementTree returns a plain string, we can just return the cached version.

157

If it is Unicode, then we need to encode it.

158

159

:param a_str: An 8-bit string or Unicode as returned by

160

cElementTree.Element.get()

161

:return: A utf-8 encoded 8-bit string.

162

"""

163

# This is fairly optimized because we know what cElementTree does, this is

164

# not meant as a generic function for all cases. Because it is possible for

165

# an 8-bit string to not be ascii or valid utf8.

166

if a_str.__class__ is unicode:

167

return _encode_utf8(a_str)

168

else:

169

return intern(a_str)

170

171

172

def _clear_cache():

173

"""Clean out the unicode => escaped map"""

174

_to_escaped_map.clear()

175

176

177

class Serializer_v8(XMLSerializer):

178

"""This serialiser adds rich roots.

179

261

152

reference_revision, symlink_target.

262

153

:return: The inventory as a list of lines.

263

154

"""

264

_ensure_utf8_re()

265

self._check_revisions(inv)

266

155

output = []

267

156

append = output.append

268

157

self._append_inventory_root(append, inv)

269

entries = inv.iter_entries()

270

# Skip the root

271

root_path, root_ie = entries.next()

272

for path, ie in entries:

273

if ie.parent_id != self.root_id:

274

parent_str = ' parent_id="'

275

parent_id = _encode_and_escape(ie.parent_id)

276

else:

277

parent_str = ''

278

parent_id = ''

279

if ie.kind == 'file':

280

if ie.executable:

281

executable = ' executable="yes"'

282

else:

283

executable = ''

284

if not working:

285

append('<file%s file_id="%s name="%s%s%s revision="%s '

286

'text_sha1="%s" text_size="%d" />\n' % (

287

executable, _encode_and_escape(ie.file_id),

288

_encode_and_escape(ie.name), parent_str, parent_id,

289

_encode_and_escape(ie.revision), ie.text_sha1,

290

ie.text_size))

291

else:

292

append('<file%s file_id="%s name="%s%s%s />\n' % (

293

executable, _encode_and_escape(ie.file_id),

294

_encode_and_escape(ie.name), parent_str, parent_id))

295

elif ie.kind == 'directory':

296

if not working:

297

append('<directory file_id="%s name="%s%s%s revision="%s '

298

'/>\n' % (

299

_encode_and_escape(ie.file_id),

300

_encode_and_escape(ie.name),

301

parent_str, parent_id,

302

_encode_and_escape(ie.revision)))

303

else:

304

append('<directory file_id="%s name="%s%s%s />\n' % (

305

_encode_and_escape(ie.file_id),

306

_encode_and_escape(ie.name),

307

parent_str, parent_id))

308

elif ie.kind == 'symlink':

309

if not working:

310

append('<symlink file_id="%s name="%s%s%s revision="%s '

311

'symlink_target="%s />\n' % (

312

_encode_and_escape(ie.file_id),

313

_encode_and_escape(ie.name),

314

parent_str, parent_id,

315

_encode_and_escape(ie.revision),

316

_encode_and_escape(ie.symlink_target)))

317

else:

318

append('<symlink file_id="%s name="%s%s%s />\n' % (

319

_encode_and_escape(ie.file_id),

320

_encode_and_escape(ie.name),

321

parent_str, parent_id))

322

elif ie.kind == 'tree-reference':

323

if ie.kind not in self.supported_kinds:

324

raise errors.UnsupportedInventoryKind(ie.kind)

325

if not working:

326

append('<tree-reference file_id="%s name="%s%s%s '

327

'revision="%s reference_revision="%s />\n' % (

328

_encode_and_escape(ie.file_id),

329

_encode_and_escape(ie.name),

330

parent_str, parent_id,

331

_encode_and_escape(ie.revision),

332

_encode_and_escape(ie.reference_revision)))

333

else:

334

append('<tree-reference file_id="%s name="%s%s%s />\n' % (

335

_encode_and_escape(ie.file_id),

336

_encode_and_escape(ie.name),

337

parent_str, parent_id))

338

else:

339

raise errors.UnsupportedInventoryKind(ie.kind)

340

append('</inventory>\n')

158

serialize_inventory_flat(inv, append,

159

self.root_id, self.supported_kinds, working)

341

160

if f is not None:

342

161

f.writelines(output)

343

162

# Just to keep the cache from growing without bounds

349

168

"""Append the inventory root to output."""

350

169

if inv.revision_id is not None:

351

170

revid1 = ' revision_id="'

352

revid2 = _encode_and_escape(inv.revision_id)

171

revid2 = encode_and_escape(inv.revision_id)

353

172

else:

354

173

revid1 = ""

355

174

revid2 = ""

356

175

append('<inventory format="%s"%s%s>\n' % (

357

176

self.format_num, revid1, revid2))

358

177

append('<directory file_id="%s name="%s revision="%s />\n' % (

359

_encode_and_escape(inv.root.file_id),

360

_encode_and_escape(inv.root.name),

361

_encode_and_escape(inv.root.revision)))

178

encode_and_escape(inv.root.file_id),

179

encode_and_escape(inv.root.name),

180

encode_and_escape(inv.root.revision)))

362

181

363

182

def _pack_revision(self, rev):

364

183

"""Revision object -> xml tree"""

408

227

prop_elt.tail = '\n'

409

228

top_elt.tail = '\n'

410

229

230

def _unpack_entry(self, elt, entry_cache=None, return_from_cache=False):

231

# This is here because it's overridden by xml7

232

return unpack_inventory_entry(elt, entry_cache,

233

return_from_cache)

234

411

235

def _unpack_inventory(self, elt, revision_id=None, entry_cache=None,

412

236

return_from_cache=False):

413

237

"""Construct from XML Element"""

414

if elt.tag != 'inventory':

415

raise errors.UnexpectedInventoryFormat('Root tag is %r' % elt.tag)

416

format = elt.get('format')

417

if format != self.format_num:

418

raise errors.UnexpectedInventoryFormat('Invalid format version %r'

419

% format)

420

revision_id = elt.get('revision_id')

421

if revision_id is not None:

422

revision_id = cache_utf8.encode(revision_id)

423

inv = inventory.Inventory(root_id=None, revision_id=revision_id)

424

for e in elt:

425

ie = self._unpack_entry(e, entry_cache=entry_cache,

426

return_from_cache=return_from_cache)

427

inv.add(ie)

238

inv = unpack_inventory_flat(elt, self.format_num, self._unpack_entry,

239

entry_cache, return_from_cache)

428

240

self._check_cache_size(len(inv), entry_cache)

429

241

return inv

430

242

431

def _unpack_entry(self, elt, entry_cache=None, return_from_cache=False):

432

elt_get = elt.get

433

file_id = elt_get('file_id')

434

revision = elt_get('revision')

435

# Check and see if we have already unpacked this exact entry

436

# Some timings for "repo.revision_trees(last_100_revs)"

437

# bzr mysql

438

# unmodified 4.1s 40.8s

439

# using lru 3.5s

440

# using fifo 2.83s 29.1s

441

# lru._cache 2.8s

442

# dict 2.75s 26.8s

443

# inv.add 2.5s 26.0s

444

# no_copy 2.00s 20.5s

445

# no_c,dict 1.95s 18.0s

446

# Note that a cache of 10k nodes is more than sufficient to hold all of

447

# the inventory for the last 100 revs for bzr, but not for mysql (20k

448

# is enough for mysql, which saves the same 2s as using a dict)

449

450

# Breakdown of mysql using time.clock()

451

# 4.1s 2 calls to element.get for file_id, revision_id

452

# 4.5s cache_hit lookup

453

# 7.1s InventoryFile.copy()

454

# 2.4s InventoryDirectory.copy()

455

# 0.4s decoding unique entries

456

# 1.6s decoding entries after FIFO fills up

457

# 0.8s Adding nodes to FIFO (including flushes)

458

# 0.1s cache miss lookups

459

# Using an LRU cache

460

# 4.1s 2 calls to element.get for file_id, revision_id

461

# 9.9s cache_hit lookup

462

# 10.8s InventoryEntry.copy()

463

# 0.3s cache miss lookups

464

# 1.2s decoding entries

465

# 1.0s adding nodes to LRU

466

if entry_cache is not None and revision is not None:

467

key = (file_id, revision)

468

try:

469

# We copy it, because some operations may mutate it

470

cached_ie = entry_cache[key]

471

except KeyError:

472

pass

473

else:

474

# Only copying directory entries drops us 2.85s => 2.35s

475

if return_from_cache:

476

if cached_ie.kind == 'directory':

477

return cached_ie.copy()

478

return cached_ie

479

return cached_ie.copy()

480

481

kind = elt.tag

482

if not InventoryEntry.versionable_kind(kind):

483

raise AssertionError('unsupported entry kind %s' % kind)

484

485

get_cached = _get_utf8_or_ascii

486

487

file_id = get_cached(file_id)

488

if revision is not None:

489

revision = get_cached(revision)

490

parent_id = elt_get('parent_id')

491

if parent_id is not None:

492

parent_id = get_cached(parent_id)

493

494

if kind == 'directory':

495

ie = inventory.InventoryDirectory(file_id,

496

elt_get('name'),

497

parent_id)

498

elif kind == 'file':

499

ie = inventory.InventoryFile(file_id,

500

elt_get('name'),

501

parent_id)

502

ie.text_sha1 = elt_get('text_sha1')

503

if elt_get('executable') == 'yes':

504

ie.executable = True

505

v = elt_get('text_size')

506

ie.text_size = v and int(v)

507

elif kind == 'symlink':

508

ie = inventory.InventoryLink(file_id,

509

elt_get('name'),

510

parent_id)

511

ie.symlink_target = elt_get('symlink_target')

512

else:

513

raise errors.UnsupportedInventoryKind(kind)

514

ie.revision = revision

515

if revision is not None and entry_cache is not None:

516

# We cache a copy() because callers like to mutate objects, and

517

# that would cause the item in cache to mutate as well.

518

# This has a small effect on many-inventory performance, because

519

# the majority fraction is spent in cache hits, not misses.

520

entry_cache[key] = ie.copy()

521

522

return ie

523

524

243

def _unpack_revision(self, elt):

525

244

"""XML Element -> Revision object"""

526

245

format = elt.get('format')

531

250

if format != format_num:

532

251

raise BzrError("invalid format version %r on revision"

533

252

% format)

534

get_cached = _get_utf8_or_ascii

253

get_cached = get_utf8_or_ascii

535

254

rev = Revision(committer = elt.get('committer'),

536

255

timestamp = float(elt.get('timestamp')),

537

256

revision_id = get_cached(elt.get('revision_id')),

Older »