~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/chk_map.py

Committer: John Arbash Meinel
Date: 2010-02-17 17:11:16 UTC
mfrom: (4797.2.17 2.1)
mto: (4797.2.18 2.1)
mto: This revision was merged to the branch mainline in revision 5055.
Revision ID: john@arbash-meinel.com-20100217171116-h7t9223ystbnx5h8

merge bzr.2.1 in preparation for NEWS entry.

files added:
MANIFEST.in

README_BDIST_RPM

bzrlib/cleanup.py

bzrlib/help_topics/en/location-alias.txt

bzrlib/help_topics/es

bzrlib/plugins/launchpad/lp_api.py

bzrlib/plugins/launchpad/test_lp_api.py

bzrlib/plugins/news_merge

bzrlib/plugins/news_merge/README

bzrlib/plugins/news_merge/__init__.py

bzrlib/plugins/news_merge/news_merge.py

bzrlib/plugins/news_merge/parser.py

bzrlib/plugins/news_merge/tests

bzrlib/plugins/news_merge/tests/__init__.py

bzrlib/plugins/news_merge/tests/test_news_merge.py

bzrlib/tests/per_foreign_vcs/test_repository.py

bzrlib/tests/per_merger.py

bzrlib/tests/test_cleanup.py

bzrlib/tests/test_patches_data/binary-after-normal.patch

bzrlib/tests/test_patches_data/binary.patch

contrib/debian

contrib/debian/default

contrib/debian/init.d

doc/developers/_static/bzr-doc.css

doc/developers/contribution-quickstart.txt

doc/developers/principles.txt

doc/developers/win32_build_setup.txt

doc/en/admin-guide/advanced.txt

doc/en/admin-guide/backup.txt

doc/en/admin-guide/code-browsing.txt

doc/en/admin-guide/hooks-plugins.txt

doc/en/admin-guide/index-plain.txt

doc/en/admin-guide/integration.txt

doc/en/admin-guide/introduction.txt

doc/en/admin-guide/migration.txt

doc/en/admin-guide/other-setups.txt

doc/en/admin-guide/security.txt

doc/en/admin-guide/simple-setups.txt

doc/en/admin-guide/upgrade.txt

doc/index.ja.txt

doc/ja

doc/ja/_static

doc/ja/_static/bzr icon 16.png

doc/ja/_static/bzr.ico

doc/ja/_templates

doc/ja/conf.py

doc/ja/index.txt

doc/ja/mini-tutorial

doc/ja/mini-tutorial/index.txt

doc/ja/tutorials

doc/ja/tutorials/centralized_workflow.txt

doc/ja/tutorials/index.txt

doc/ja/tutorials/tutorial.txt

doc/ja/tutorials/using_bazaar_with_launchpad.txt

doc/ja/upgrade-guide

doc/ja/upgrade-guide/data_migration.txt

doc/ja/upgrade-guide/index.txt

doc/ja/upgrade-guide/overview.txt

doc/ja/upgrade-guide/tips_and_tricks.txt

doc/ja/user-guide

doc/ja/user-guide/adv_merging.txt

doc/ja/user-guide/annotating_changes.txt

doc/ja/user-guide/bazaar_workflows.txt

doc/ja/user-guide/branching_a_project.txt

doc/ja/user-guide/browsing_history.txt

doc/ja/user-guide/bug_trackers.txt

doc/ja/user-guide/bzrtools_plugin.txt

doc/ja/user-guide/central_intro.txt

doc/ja/user-guide/configuring_bazaar.txt

doc/ja/user-guide/controlling_registration.txt

doc/ja/user-guide/core_concepts.txt

doc/ja/user-guide/distributed_intro.txt

doc/ja/user-guide/entering_commands.txt

doc/ja/user-guide/filtered_views.txt

doc/ja/user-guide/getting_help.txt

doc/ja/user-guide/hooks.txt

doc/ja/user-guide/http_smart_server.txt

doc/ja/user-guide/images

doc/ja/user-guide/images/workflows_centralized.png

doc/ja/user-guide/images/workflows_centralized.svg

doc/ja/user-guide/images/workflows_gatekeeper.png

doc/ja/user-guide/images/workflows_gatekeeper.svg

doc/ja/user-guide/images/workflows_localcommit.png

doc/ja/user-guide/images/workflows_localcommit.svg

doc/ja/user-guide/images/workflows_peer.png

doc/ja/user-guide/images/workflows_peer.svg

doc/ja/user-guide/images/workflows_pqm.png

doc/ja/user-guide/images/workflows_pqm.svg

doc/ja/user-guide/images/workflows_shared.png

doc/ja/user-guide/images/workflows_shared.svg

doc/ja/user-guide/images/workflows_single.png

doc/ja/user-guide/images/workflows_single.svg

doc/ja/user-guide/index.txt

doc/ja/user-guide/installing_bazaar.txt

doc/ja/user-guide/introducing_bazaar.txt

doc/ja/user-guide/merging_changes.txt

doc/ja/user-guide/organizing_branches.txt

doc/ja/user-guide/organizing_your_workspace.txt

doc/ja/user-guide/part2_intro.txt

doc/ja/user-guide/partner_intro.txt

doc/ja/user-guide/plugins.txt

doc/ja/user-guide/publishing_a_branch.txt

doc/ja/user-guide/recording_changes.txt

doc/ja/user-guide/releasing_a_project.txt

doc/ja/user-guide/resolving_conflicts.txt

doc/ja/user-guide/reusing_a_checkout.txt

doc/ja/user-guide/reviewing_changes.txt

doc/ja/user-guide/sending_changes.txt

doc/ja/user-guide/server.txt

doc/ja/user-guide/setting_up_email.txt

doc/ja/user-guide/shared_repository_layouts.txt

doc/ja/user-guide/shelving_changes.txt

doc/ja/user-guide/solo_intro.txt

doc/ja/user-guide/specifying_revisions.txt

doc/ja/user-guide/stacked.txt

doc/ja/user-guide/starting_a_project.txt

doc/ja/user-guide/svn_plugin.txt

doc/ja/user-guide/undoing_mistakes.txt

doc/ja/user-guide/using_aliases.txt

doc/ja/user-guide/using_checkouts.txt

doc/ja/user-guide/using_gatekeepers.txt

doc/ja/user-guide/version_info.txt

doc/ja/user-guide/web_browsing.txt

doc/ja/user-guide/working_offline_central.txt

doc/ja/user-guide/writing_a_plugin.txt

doc/ja/user-guide/zen.txt

doc/ja/user-reference

doc/ja/user-reference/index.txt

files removed:
bzrlib/textui.py

files renamed:
bzrlib/help_topics/en/conflicts.txt => bzrlib/help_topics/en/conflict-types.txt

doc/es/user-guide/resolving_conflicts.txt => bzrlib/help_topics/es/conflicts.txt

bzrlib/tests/test_bencode.py => bzrlib/tests/test__bencode.py

files modified:
Makefile

NEWS

bzrlib/__init__.py

bzrlib/_annotator_pyx.pyx

bzrlib/_bencode_pyx.pyx

bzrlib/_btree_serializer_py.py

bzrlib/_btree_serializer_pyx.pyx

bzrlib/_chk_map_py.py

bzrlib/_chk_map_pyx.pyx

bzrlib/_dirstate_helpers_pyx.pyx

bzrlib/_groupcompress_pyx.pyx

bzrlib/_knit_load_data_pyx.pyx

bzrlib/_known_graph_py.py

bzrlib/_known_graph_pyx.pyx

bzrlib/_patiencediff_c.c

bzrlib/_readdir_pyx.pyx

bzrlib/_rio_pyx.pyx

bzrlib/_simple_set_pyx.pxd

bzrlib/_simple_set_pyx.pyx

bzrlib/_static_tuple_c.c

bzrlib/_static_tuple_c.pxd

bzrlib/_static_tuple_py.py

bzrlib/_walkdirs_win32.pyx

bzrlib/benchmarks/bench_dirstate.py

bzrlib/branch.py

bzrlib/btree_index.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bzrdir.py

bzrlib/chk_map.py

bzrlib/chk_serializer.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff-delta.c

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc_generate/autodoc_man.py

bzrlib/doc_generate/autodoc_rstx.py

bzrlib/errors.py

bzrlib/export/dir_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/fetch.py

bzrlib/foreign.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/content-filters.txt

bzrlib/help_topics/en/debug-flags.txt

bzrlib/help_topics/en/log-formats.txt

bzrlib/help_topics/en/patterns.txt

bzrlib/help_topics/en/rules.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge_directive.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patches.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/plugins/launchpad/test_lp_open.py

bzrlib/push.py

bzrlib/reconcile.py

bzrlib/remote.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/serializer.py

bzrlib/shelf_ui.py

bzrlib/shellcomplete.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/static_tuple.py

bzrlib/status.py

bzrlib/switch.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_filtered_view_ops.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_shelve.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/commands/test_branch.py

bzrlib/tests/commands/test_cat.py

bzrlib/tests/commands/test_checkout.py

bzrlib/tests/commands/test_commit.py

bzrlib/tests/commands/test_init.py

bzrlib/tests/commands/test_init_repository.py

bzrlib/tests/commands/test_merge.py

bzrlib/tests/commands/test_missing.py

bzrlib/tests/commands/test_pull.py

bzrlib/tests/commands/test_push.py

bzrlib/tests/commands/test_update.py

bzrlib/tests/features.py

bzrlib/tests/ftp_server/__init__.py

bzrlib/tests/ftp_server/medusa_based.py

bzrlib/tests/ftp_server/pyftpdlib_based.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/per_branch/test_hooks.py

bzrlib/tests/per_branch/test_iter_merge_sorted_revisions.py

bzrlib/tests/per_branch/test_parent.py

bzrlib/tests/per_branch/test_push.py

bzrlib/tests/per_bzrdir/test_bzrdir.py

bzrlib/tests/per_foreign_vcs/__init__.py

bzrlib/tests/per_interbranch/test_push.py

bzrlib/tests/per_intertree/__init__.py

bzrlib/tests/per_pack_repository.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository_reference/test_check.py

bzrlib/tests/per_transport.py

bzrlib/tests/per_tree/test_get_file_with_stat.py

bzrlib/tests/per_tree/test_inv.py

bzrlib/tests/per_tree/test_iter_search_rules.py

bzrlib/tests/per_tree/test_path_content_summary.py

bzrlib/tests/per_uifactory/__init__.py

bzrlib/tests/per_versionedfile.py

bzrlib/tests/per_workingtree/test_content_filters.py

bzrlib/tests/per_workingtree/test_is_ignored.py

bzrlib/tests/per_workingtree/test_pull.py

bzrlib/tests/per_workingtree/test_set_root_id.py

bzrlib/tests/per_workingtree/test_smart_add.py

bzrlib/tests/per_workingtree/test_workingtree.py

bzrlib/tests/script.py

bzrlib/tests/ssl_certs/create_ssls.py

bzrlib/tests/ssl_certs/server.crt

bzrlib/tests/ssl_certs/server.csr

bzrlib/tests/ssl_certs/server_with_pass.key

bzrlib/tests/ssl_certs/server_without_pass.key

bzrlib/tests/stub_sftp.py

bzrlib/tests/test__annotator.py

bzrlib/tests/test__chk_map.py

bzrlib/tests/test__chunks_to_lines.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test__known_graph.py

bzrlib/tests/test__rio.py

bzrlib/tests/test__simple_set.py

bzrlib/tests/test__static_tuple.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_btree_index.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_chk_map.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_crash.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_index.py

bzrlib/tests/test_info.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_script.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_shelf.py

bzrlib/tests/test_shelf_ui.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_log.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/ftp/__init__.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/pathfilter.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/urlutils.py

bzrlib/util/_bencode_py.py

bzrlib/version.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml7.py

bzrlib/xml8.py

bzrlib/xml_serializer.py

doc/default.css

doc/developers/HACKING.txt

doc/developers/_templates/layout.html

doc/developers/add.txt

doc/developers/api-versioning.txt

doc/developers/apport.txt

doc/developers/authentication-ring.txt

doc/developers/bug-handling.txt

doc/developers/bundles.txt

doc/developers/case-insensitive-file-systems.txt

doc/developers/colocated-branches.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/content-filtering.txt

doc/developers/cycle.txt

doc/developers/development-repo.txt

doc/developers/diff.txt

doc/developers/directory-fingerprints.txt

doc/developers/ec2.txt

doc/developers/improved_chk_index.txt

doc/developers/incremental-push-pull.txt

doc/developers/index-plain.txt

doc/developers/index.txt

doc/developers/inventory.txt

doc/developers/last-modified.txt

doc/developers/network-protocol.txt

doc/developers/overview.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/plans.txt

doc/developers/plugin-api.txt

doc/developers/ppa.txt

doc/developers/process.txt

doc/developers/profiling.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/repository.txt

doc/developers/revert.txt

doc/developers/specifications.txt

doc/developers/status.txt

doc/developers/testing.txt

doc/developers/tortoise-strategy.txt

doc/developers/update.txt

doc/en/_templates/index.html

doc/en/_templates/layout.html

doc/en/admin-guide/index.txt

doc/en/conf.py

doc/en/index.txt

doc/en/mini-tutorial/index.txt

doc/en/tutorials/centralized_workflow.txt

doc/en/tutorials/tutorial.txt

doc/en/tutorials/using_bazaar_with_launchpad.txt

doc/en/user-guide/adv_merging.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/filtered_views.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/index-plain.txt

doc/en/user-guide/index.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/plugins.txt

doc/en/user-guide/publishing_a_branch.txt

doc/en/user-guide/recording_changes.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/reviewing_changes.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/server.txt

doc/en/user-guide/setting_up_email.txt

doc/en/user-guide/shared_repository_layouts.txt

doc/en/user-guide/shelving_changes.txt

doc/en/user-guide/specifying_revisions.txt

doc/en/user-guide/stacked.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/version_info.txt

doc/en/user-guide/web_browsing.txt

doc/en/user-guide/zen.txt

doc/es/_templates/layout.html

doc/es/index.txt

doc/es/mini-tutorial/index.txt

doc/es/user-guide/index-plain.txt

doc/es/user-guide/index.txt

doc/es/user-guide/version_info.txt

doc/index.es.txt

doc/index.ru.txt

doc/index.txt

doc/ru/_templates/layout.html

doc/ru/index.txt

doc/ru/mini-tutorial/index.txt

doc/ru/tutorials/centralized_workflow.txt

doc/ru/tutorials/tutorial.txt

doc/ru/tutorials/using_bazaar_with_launchpad.txt

doc/ru/user-guide/branching_a_project.txt

doc/ru/user-guide/index-plain.txt

doc/ru/user-guide/index.txt

doc/ru/user-guide/introducing_bazaar.txt

doc/ru/user-guide/specifying_revisions.txt

doc/ru/user-guide/zen.txt

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/chk_map.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

"""

import heapq

import threading

from bzrlib import lazy_import

lazy_import.lazy_import(globals(), """

lru_cache,

osutils,

registry,

static_tuple,

trace,

)

from bzrlib.static_tuple import StaticTuple

# approx 4MB

# If each line is 50 bytes, and you have 255 internal pages, with 255-way fan

# out, it takes 3.1MB to cache the layer.

_PAGE_CACHE_SIZE = 4*1024*1024

# We are caching bytes so len(value) is perfectly accurate

_page_cache = lru_cache.LRUSizeCache(_PAGE_CACHE_SIZE)

# Per thread caches for 2 reasons:

# - in the server we may be serving very different content, so we get less

# cache thrashing.

# - we avoid locking on every cache lookup.

_thread_caches = threading.local()

# The page cache.

_thread_caches.page_cache = None

def _get_cache():

"""Get the per-thread page cache.

We need a function to do this because in a new thread the _thread_caches

threading.local object does not have the cache initialized yet.

"""

page_cache = getattr(_thread_caches, 'page_cache', None)

if page_cache is None:

# We are caching bytes so len(value) is perfectly accurate

page_cache = lru_cache.LRUSizeCache(_PAGE_CACHE_SIZE)

_thread_caches.page_cache = page_cache

return page_cache

def clear_cache():

_page_cache.clear()

_get_cache().clear()

# If a ChildNode falls below this many bytes, we check for a remap

_INTERESTING_NEW_SIZE = 50

114

137

"""

115

138

delete_count = 0

116

139

# Check preconditions first.

117

new_items = set([key for (old, key, value) in delta if key is not None

118

and old is None])

140

as_st = StaticTuple.from_sequence

141

new_items = set([as_st(key) for (old, key, value) in delta

142

if key is not None and old is None])

119

143

existing_new = list(self.iteritems(key_filter=new_items))

120

144

if existing_new:

121

145

raise errors.InconsistentDeltaDelta(delta,

135

159

136

160

def _ensure_root(self):

137

161

"""Ensure that the root node is an object not a key."""

138

if type(self._root_node) is tuple:

162

if type(self._root_node) is StaticTuple:

139

163

# Demand-load the root

140

164

self._root_node = self._get_node(self._root_node)

141

165

149

173

:param node: A tuple key or node object.

150

174

:return: A node object.

151

175

"""

152

if type(node) is tuple:

176

if type(node) is StaticTuple:

153

177

bytes = self._read_bytes(node)

154

178

return _deserialise(bytes, node,

155

179

search_key_func=self._search_key_func)

158

182

159

183

def _read_bytes(self, key):

160

184

try:

161

return _page_cache[key]

185

return _get_cache()[key]

162

186

except KeyError:

163

187

stream = self._store.get_record_stream([key], 'unordered', True)

164

188

bytes = stream.next().get_bytes_as('fulltext')

165

_page_cache[key] = bytes

189

_get_cache()[key] = bytes

166

190

return bytes

167

191

168

192

def _dump_tree(self, include_keys=False):

196

220

for key, value in sorted(node._items.iteritems()):

197

221

# Don't use prefix nor indent here to line up when used in

198

222

# tests in conjunction with assertEqualDiff

199

result.append(' %r %r' % (key, value))

223

result.append(' %r %r' % (tuple(key), value))

200

224

return result

201

225

202

226

@classmethod

220

244

root_key = klass._create_directly(store, initial_value,

221

245

maximum_size=maximum_size, key_width=key_width,

222

246

search_key_func=search_key_func)

247

if type(root_key) is not StaticTuple:

248

raise AssertionError('we got a %s instead of a StaticTuple'

249

% (type(root_key),))

223

250

return root_key

224

251

225

252

@classmethod

240

267

node = LeafNode(search_key_func=search_key_func)

241

268

node.set_maximum_size(maximum_size)

242

269

node._key_width = key_width

243

node._items = dict(initial_value)

270

as_st = StaticTuple.from_sequence

271

node._items = dict([(as_st(key), val) for key, val

272

in initial_value.iteritems()])

244

273

node._raw_size = sum([node._key_value_len(key, value)

245

for key,value in initial_value.iteritems()])

274

for key,value in node._items.iteritems()])

246

275

node._len = len(node._items)

247

276

node._compute_search_prefix()

248

277

node._compute_serialised_prefix()

484

513

def iteritems(self, key_filter=None):

485

514

"""Iterate over the entire CHKMap's contents."""

486

515

self._ensure_root()

516

if key_filter is not None:

517

as_st = StaticTuple.from_sequence

518

key_filter = [as_st(key) for key in key_filter]

487

519

return self._root_node.iteritems(self._store, key_filter=key_filter)

488

520

489

521

def key(self):

490

522

"""Return the key for this map."""

491

if type(self._root_node) is tuple:

523

if type(self._root_node) is StaticTuple:

492

524

return self._root_node

493

525

else:

494

526

return self._root_node._key

503

535

:param key: A key to map.

504

536

:param value: The value to assign to key.

505

537

"""

538

key = StaticTuple.from_sequence(key)

506

539

# Need a root object.

507

540

self._ensure_root()

508

541

prefix, node_details = self._root_node.map(self._store, key, value)

519

552

def _node_key(self, node):

520

553

"""Get the key for a node whether it's a tuple or node."""

521

554

if type(node) is tuple:

555

node = StaticTuple.from_sequence(node)

556

if type(node) is StaticTuple:

522

557

return node

523

558

else:

524

559

return node._key

525

560

526

561

def unmap(self, key, check_remap=True):

527

562

"""remove key from the map."""

563

key = StaticTuple.from_sequence(key)

528

564

self._ensure_root()

529

565

if type(self._root_node) is InternalNode:

530

566

unmapped = self._root_node.unmap(self._store, key,

544

580

545

581

:return: The key of the root node.

546

582

"""

547

if type(self._root_node) is tuple:

583

if type(self._root_node) is StaticTuple:

548

584

# Already saved.

549

585

return self._root_node

550

586

keys = list(self._root_node.serialise(self._store))

706

742

:param bytes: The bytes of the node.

707

743

:param key: The key that the serialised node has.

708

744

"""

745

key = static_tuple.expect_static_tuple(key)

709

746

return _deserialise_leaf_node(bytes, key,

710

747

search_key_func=search_key_func)

711

748

881

918

lines.append(serialized[prefix_len:])

882

919

lines.extend(value_lines)

883

920

sha1, _, _ = store.add_lines((None,), (), lines)

884

self._key = ("sha1:" + sha1,)

921

self._key = StaticTuple("sha1:" + sha1,).intern()

885

922

bytes = ''.join(lines)

886

923

if len(bytes) != self._current_size():

887

924

raise AssertionError('Invalid _current_size')

888

_page_cache.add(self._key, bytes)

925

_get_cache().add(self._key, bytes)

889

926

return [self._key]

890

927

891

928

def refs(self):

1004

1041

:param key: The key that the serialised node has.

1005

1042

:return: An InternalNode instance.

1006

1043

"""

1044

key = static_tuple.expect_static_tuple(key)

1007

1045

return _deserialise_internal_node(bytes, key,

1008

1046

search_key_func=search_key_func)

1009

1047

1034

1072

# for whatever we are missing

1035

1073

shortcut = True

1036

1074

for prefix, node in self._items.iteritems():

1037

if node.__class__ is tuple:

1075

if node.__class__ is StaticTuple:

1038

1076

keys[node] = (prefix, None)

1039

1077

else:

1040

1078

yield node, None

1069

1107

# A given key can only match 1 child node, if it isn't

1070

1108

# there, then we can just return nothing

1071

1109

return

1072

if node.__class__ is tuple:

1110

if node.__class__ is StaticTuple:

1073

1111

keys[node] = (search_prefix, [key])

1074

1112

else:

1075

1113

# This is loaded, and the only thing that can match,

1102

1140

# We can ignore this one

1103

1141

continue

1104

1142

node_key_filter = prefix_to_keys[search_prefix]

1105

if node.__class__ is tuple:

1143

if node.__class__ is StaticTuple:

1106

1144

keys[node] = (search_prefix, node_key_filter)

1107

1145

else:

1108

1146

yield node, node_key_filter

1117

1155

if sub_prefix in length_filter:

1118

1156

node_key_filter.extend(prefix_to_keys[sub_prefix])

1119

1157

if node_key_filter: # this key matched something, yield it

1120

if node.__class__ is tuple:

1158

if node.__class__ is StaticTuple:

1121

1159

keys[node] = (prefix, node_key_filter)

1122

1160

else:

1123

1161

yield node, node_key_filter

1126

1164

found_keys = set()

1127

1165

for key in keys:

1128

1166

try:

1129

bytes = _page_cache[key]

1167

bytes = _get_cache()[key]

1130

1168

except KeyError:

1131

1169

continue

1132

1170

else:

1157

1195

prefix, node_key_filter = keys[record.key]

1158

1196

node_and_filters.append((node, node_key_filter))

1159

1197

self._items[prefix] = node

1160

_page_cache.add(record.key, bytes)

1198

_get_cache().add(record.key, bytes)

1161

1199

for info in node_and_filters:

1162

1200

yield info

1163

1201

1255

1293

:return: An iterable of the keys inserted by this operation.

1256

1294

"""

1257

1295

for node in self._items.itervalues():

1258

if type(node) is tuple:

1296

if type(node) is StaticTuple:

1259

1297

# Never deserialised.

1260

1298

continue

1261

1299

if node._key is not None:

1272

1310

lines.append('%s\n' % (self._search_prefix,))

1273

1311

prefix_len = len(self._search_prefix)

1274

1312

for prefix, node in sorted(self._items.items()):

1275

if type(node) is tuple:

1313

if type(node) is StaticTuple:

1276

1314

key = node[0]

1277

1315

else:

1278

1316

key = node._key[0]

1282

1320

% (serialised, self._search_prefix))

1283

1321

lines.append(serialised[prefix_len:])

1284

1322

sha1, _, _ = store.add_lines((None,), (), lines)

1285

self._key = ("sha1:" + sha1,)

1286

_page_cache.add(self._key, ''.join(lines))

1323

self._key = StaticTuple("sha1:" + sha1,).intern()

1324

_get_cache().add(self._key, ''.join(lines))

1287

1325

yield self._key

1288

1326

1289

1327

def _search_key(self, key):

1317

1355

raise AssertionError("unserialised nodes have no refs.")

1318

1356

refs = []

1319

1357

for value in self._items.itervalues():

1320

if type(value) is tuple:

1358

if type(value) is StaticTuple:

1321

1359

refs.append(value)

1322

1360

else:

1323

1361

refs.append(value.key())

1437

1475

1438

1476

def __init__(self, store, new_root_keys, old_root_keys,

1439

1477

search_key_func, pb=None):

1478

# TODO: Should we add a StaticTuple barrier here? It would be nice to

1479

# force callers to use StaticTuple, because there will often be

1480

# lots of keys passed in here. And even if we cast it locally,

1481

# that just means that we will have *both* a StaticTuple and a

1482

# tuple() in memory, referring to the same object. (so a net

1483

# increase in memory, not a decrease.)

1440

1484

self._store = store

1441

1485

self._new_root_keys = new_root_keys

1442

1486

self._old_root_keys = old_root_keys

1444

1488

# All uninteresting chks that we have seen. By the time they are added

1445

1489

# here, they should be either fully ignored, or queued up for

1446

1490

# processing

1491

# TODO: This might grow to a large size if there are lots of merge

1492

# parents, etc. However, it probably doesn't scale to O(history)

1493

# like _processed_new_refs does.

1447

1494

self._all_old_chks = set(self._old_root_keys)

1448

1495

# All items that we have seen from the old_root_keys

1449

1496

self._all_old_items = set()

1450

1497

# These are interesting items which were either read, or already in the

1451

1498

# interesting queue (so we don't need to walk them again)

1499

# TODO: processed_new_refs becomes O(all_chks), consider switching to

1500

# SimpleSet here.

1452

1501

self._processed_new_refs = set()

1453

1502

self._search_key_func = search_key_func

1454

1503

1461

1510

self._state = None

1462

1511

1463

1512

def _read_nodes_from_store(self, keys):

1464

# We chose not to use _page_cache, because we think in terms of records

1465

# to be yielded. Also, we expect to touch each page only 1 time during

1466

# this code. (We may want to evaluate saving the raw bytes into the

1467

# page cache, which would allow a working tree update after the fetch

1468

# to not have to read the bytes again.)

1513

# We chose not to use _get_cache(), because we think in

1514

# terms of records to be yielded. Also, we expect to touch each page

1515

# only 1 time during this code. (We may want to evaluate saving the

1516

# raw bytes into the page cache, which would allow a working tree

1517

# update after the fetch to not have to read the bytes again.)

1518

as_st = StaticTuple.from_sequence

1469

1519

stream = self._store.get_record_stream(keys, 'unordered', True)

1470

1520

for record in stream:

1471

1521

if self._pb is not None:

1478

1528

if type(node) is InternalNode:

1479

1529

# Note we don't have to do node.refs() because we know that

1480

1530

# there are no children that have been pushed into this node

1531

# Note: Using as_st() here seemed to save 1.2MB, which would

1532

# indicate that we keep 100k prefix_refs around while

1533

# processing. They *should* be shorter lived than that...

1534

# It does cost us ~10s of processing time

1535

#prefix_refs = [as_st(item) for item in node._items.iteritems()]

1481

1536

prefix_refs = node._items.items()

1482

1537

items = []

1483

1538

else:

1484

1539

prefix_refs = []

1540

# Note: We don't use a StaticTuple here. Profiling showed a

1541

# minor memory improvement (0.8MB out of 335MB peak 0.2%)

1542

# But a significant slowdown (15s / 145s, or 10%)

1485

1543

items = node._items.items()

1486

1544

yield record, node, prefix_refs, items

1487

1545

1495

1553

if p_r[1] not in all_old_chks]

1496

1554

new_refs = [p_r[1] for p_r in prefix_refs]

1497

1555

all_old_chks.update(new_refs)

1556

# TODO: This might be a good time to turn items into StaticTuple

1557

# instances and possibly intern them. However, this does not

1558

# impact 'initial branch' performance, so I'm not worrying

1559

# about this yet

1498

1560

self._all_old_items.update(items)

1499

1561

# Queue up the uninteresting references

1500

1562

# Don't actually put them in the 'to-read' queue until we have

1553

1615

# current design allows for this, as callers will do the work

1554

1616

# to make the results unique. We might profile whether we

1555

1617

# gain anything by ensuring unique return values for items

1618

# TODO: This might be a good time to cast to StaticTuple, as

1619

# self._new_item_queue will hold the contents of multiple

1620

# records for an extended lifetime

1556

1621

new_items = [item for item in items

1557

1622

if item not in self._all_old_items]

1558

1623

self._new_item_queue.extend(new_items)

1583

1648

if new_items:

1584

1649

yield None, new_items

1585

1650

refs = refs.difference(all_old_chks)

1651

processed_new_refs.update(refs)

1586

1652

while refs:

1653

# TODO: Using a SimpleSet for self._processed_new_refs

1654

# saved as much as 10MB of peak memory. However, it requires

1655

# implementing a non-pyrex version.

1587

1656

next_refs = set()

1588

1657

next_refs_update = next_refs.update

1589

1658

# Inlining _read_nodes_from_store improves 'bzr branch bzr.dev'

1590

1659

# from 1m54s to 1m51s. Consider it.

1591

1660

for record, _, p_refs, items in self._read_nodes_from_store(refs):

1592

items = [item for item in items

1593

if item not in all_old_items]

1661

if all_old_items:

1662

# using the 'if' check saves about 145s => 141s, when

1663

# streaming initial branch of Launchpad data.

1664

items = [item for item in items

1665

if item not in all_old_items]

1594

1666

yield record, items

1595

1667

next_refs_update([p_r[1] for p_r in p_refs])

1668

del p_refs

1669

# set1.difference(set/dict) walks all of set1, and checks if it

1670

# exists in 'other'.

1671

# set1.difference(iterable) walks all of iterable, and does a

1672

# 'difference_update' on a clone of set1. Pick wisely based on the

1673

# expected sizes of objects.

1674

# in our case it is expected that 'new_refs' will always be quite

1675

# small.

1596

1676

next_refs = next_refs.difference(all_old_chks)

1597

1677

next_refs = next_refs.difference(processed_new_refs)

1598

1678

processed_new_refs.update(next_refs)

1605

1685

self._old_queue = []

1606

1686

all_old_chks = self._all_old_chks

1607

1687

for record, _, prefix_refs, items in self._read_nodes_from_store(refs):

1688

# TODO: Use StaticTuple here?

1608

1689

self._all_old_items.update(items)

1609

1690

refs = [r for _,r in prefix_refs if r not in all_old_chks]

1610

1691

self._old_queue.extend(refs)

1660

1741

)

1661

1742

search_key_registry.register('hash-16-way', _search_key_16)

1662

1743

search_key_registry.register('hash-255-way', _search_key_255)

1744

1745

1746

def _check_key(key):

1747

"""Helper function to assert that a key is properly formatted.

1748

1749

This generally shouldn't be used in production code, but it can be helpful

1750

to debug problems.

1751

"""

1752

if type(key) is not StaticTuple:

1753

raise TypeError('key %r is not StaticTuple but %s' % (key, type(key)))

1754

if len(key) != 1:

1755

raise ValueError('key %r should have length 1, not %d' % (key, len(key),))

1756

if type(key[0]) is not str:

1757

raise TypeError('key %r should hold a str, not %r'

1758

% (key, type(key[0])))

1759

if not key[0].startswith('sha1:'):

1760

raise ValueError('key %r should point to a sha1:' % (key,))

1761

1762

Older »