~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/hashcache.py

Committer: Robert Collins
Date: 2006-02-11 11:58:06 UTC
mto: (1534.1.22 integration)
mto: This revision was merged to the branch mainline in revision 1554.
Revision ID: robertc@robertcollins.net-20060211115806-732dabc1e35714ed

Give format3 working trees their own last-revision marker.

files added:
BRANCH.TODO

INSTALL

bzrlib/bzrdir.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/gpg.py

bzrlib/identitymap.py

bzrlib/iterablefile.py

bzrlib/lockable_files.py

bzrlib/lsprof.py

bzrlib/option.py

bzrlib/repository.py

bzrlib/rio.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/transactions.py

bzrlib/transport/ftp.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/win32console.py

generate_docs.py

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/riodemo.py

tools/trace-revisions

files removed:
bzrlib/clone.py

bzrlib/mdiff.py

bzrlib/revfile.py

bzrlib/store/compressed_text.py

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

files renamed:
bzrlib/changeset.py => bzrlib/_changeset.py

bzrlib/merge_core.py => bzrlib/_merge_core.py

bzrlib/selftest/ => bzrlib/tests/

bzrlib/selftest/test_revision_info.py => bzrlib/tests/blackbox/test_revision_info.py

bzrlib/selftest/teststatus.py => bzrlib/tests/blackbox/test_status.py

bzrlib/selftest/blackbox.py => bzrlib/tests/blackbox/test_too_much.py

bzrlib/selftest/versioning.py => bzrlib/tests/blackbox/test_versioning.py

bzrlib/selftest/testbranch.py => bzrlib/tests/branch_implementations/test_branch.py

bzrlib/selftest/test_parent.py => bzrlib/tests/branch_implementations/test_parent.py

bzrlib/selftest/testdiff.py => bzrlib/tests/test_diff.py

bzrlib/selftest/testfetch.py => bzrlib/tests/test_fetch.py

bzrlib/selftest/testgraph.py => bzrlib/tests/test_graph.py

bzrlib/selftest/testhashcache.py => bzrlib/tests/test_hashcache.py

bzrlib/selftest/testinv.py => bzrlib/tests/test_inv.py

bzrlib/selftest/testlog.py => bzrlib/tests/test_log.py

bzrlib/selftest/testmerge.py => bzrlib/tests/test_merge.py

bzrlib/selftest/testmerge3.py => bzrlib/tests/test_merge3.py

bzrlib/selftest/plugins.py => bzrlib/tests/test_plugins.py

bzrlib/selftest/testrevision.py => bzrlib/tests/test_revision.py

bzrlib/selftest/testrevisionnamespaces.py => bzrlib/tests/test_revisionnamespaces.py

bzrlib/selftest/teststore.py => bzrlib/tests/test_store.py

bzrlib/selftest/testtransport.py => bzrlib/tests/test_transport.py

bzrlib/selftest/whitebox.py => bzrlib/tests/test_whitebox.py

bzrlib/selftest/testworkingtree.py => bzrlib/tests/test_workingtree.py

bzrlib/ui.py => bzrlib/ui/__init__.py

bzrlib/xml.py => bzrlib/xml_serializer.py

bzr-man.py => tools/doc_generate/autodoc_man.py

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_xml.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/zsh/_bzr

doc/random.txt

setup.py *

tutorial.txt

Show diffs side-by-side

added added

removed removed

bzrlib/hashcache.py

import os, stat, time

import sha

from bzrlib.osutils import sha_file

from bzrlib.osutils import sha_file, pathjoin, safe_unicode

from bzrlib.trace import mutter, warning

from bzrlib.atomicfile import AtomicFile

from bzrlib.errors import BzrError

FP_MTIME_COLUMN = 1

FP_CTIME_COLUMN = 2

FP_MODE_COLUMN = 5

def _fingerprint(abspath):

"""

needs_write = False

def __init__(self, basedir):

self.basedir = basedir

def __init__(self, root, cache_file_name, mode=None):

"""Create a hash cache in base dir, and set the file mode to mode."""

self.root = safe_unicode(root)

100

self.hit_count = 0

101

self.miss_count = 0

102

self.stat_count = 0

100

104

self.removed_count = 0

101

105

self.update_count = 0

102

106

self._cache = {}

103

107

self._mode = mode

108

self._cache_file_name = safe_unicode(cache_file_name)

104

109

105

110

def cache_file_name(self):

106

return os.sep.join([self.basedir, '.bzr', 'stat-cache'])

107

108

109

111

return self._cache_file_name

110

112

111

113

def clear(self):

112

114

"""Discard all cached information.

116

118

self.needs_write = True

117

119

self._cache = {}

118

120

119

120

121

def scan(self):

121

122

"""Scan all files and remove entries where the cache entry is obsolete.

122

123

124

Obsolete entries are those where the file has been modified or deleted

124

125

since the entry was inserted.

125

126

"""

127

# FIXME optimisation opportunity, on linux [and check other oses]:

128

# rather than iteritems order, stat in inode order.

126

129

prep = [(ce[1][3], path, ce) for (path, ce) in self._cache.iteritems()]

127

130

prep.sort()

128

131

129

132

for inum, path, cache_entry in prep:

130

abspath = os.sep.join([self.basedir, path])

133

abspath = pathjoin(self.root, path)

131

134

fp = _fingerprint(abspath)

132

135

self.stat_count += 1

133

136

143

146

def get_sha1(self, path):

144

147

"""Return the sha1 of a file.

145

148

"""

146

abspath = os.sep.join([self.basedir, path])

149

abspath = pathjoin(self.root, path)

147

150

self.stat_count += 1

148

151

file_fp = _fingerprint(abspath)

149

152

171

174

if stat.S_ISREG(mode):

172

175

digest = sha_file(file(abspath, 'rb', buffering=65000))

173

176

elif stat.S_ISLNK(mode):

174

link_target = os.readlink(abspath)

175

177

digest = sha.new(os.readlink(abspath)).hexdigest()

176

178

else:

177

179

raise BzrError("file %r: unknown file stat mode: %o"%(abspath,mode))

178

180

179

181

now = int(time.time())

180

if file_fp[1] >= now or file_fp[2] >= now:

182

if file_fp[FP_MTIME_COLUMN] >= now or file_fp[FP_CTIME_COLUMN] >= now:

181

183

# changed too recently; can't be cached. we can

182

184

# return the result and it could possibly be cached

183

185

# next time.

186

187

# the point is that we only want to cache when we are sure that any

188

# subsequent modifications of the file can be detected. If a

189

# modification neither changes the inode, the device, the size, nor

190

# the mode, then we can only distinguish it by time; therefore we

191

# need to let sufficient time elapse before we may cache this entry

192

# again. If we didn't do this, then, for example, a very quick 1

193

# byte replacement in the file might go undetected.

184

194

self.danger_count += 1

185

195

if cache_fp:

186

196

self.removed_count += 1

194

204

195

205

def write(self):

196

206

"""Write contents of cache to file."""

197

outf = AtomicFile(self.cache_file_name(), 'wb')

207

outf = AtomicFile(self.cache_file_name(), 'wb', new_mode=self._mode)

198

208

try:

199

209

print >>outf, CACHE_HEADER,

200

210

212

222

finally:

213

223

if not outf.closed:

214

224

outf.abort()

215

216

217

225

218

226

def read(self):

219

227

"""Reinstate cache from file.

228

236

try:

229

237

inf = file(fn, 'rb', buffering=65000)

230

238

except IOError, e:

231

mutter("failed to open %s: %s" % (fn, e))

239

mutter("failed to open %s: %s", fn, e)

232

240

# better write it now so it is valid

233

241

self.needs_write = True

234

242

return

236

244

237

245

hdr = inf.readline()

238

246

if hdr != CACHE_HEADER:

239

mutter('cache header marker not found at top of %s; discarding cache'

240

% fn)

247

mutter('cache header marker not found at top of %s;'

248

' discarding cache', fn)

241

249

self.needs_write = True

242

250

return

243

251

Older »