~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/hashcache.py

Committer: Aaron Bentley
Date: 2006-02-10 20:18:42 UTC
mto: (1558.1.4 Aaron's integration) (1534.9.2 Transactional Tree Transforms) (1185.50.82 bzr-jam-integration) (2027.1.2 revert-subpath-56549)
mto: This revision was merged to the branch mainline in revision 1558.
Revision ID: abentley@panoramicfeedback.com-20060210201842-cd2cec177a6fa1ee

Handled simultaneous renames of parent and child better

files added:
BRANCH.TODO

INSTALL

NEWS.developers

bzrlib/annotate.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/identitymap.py

bzrlib/iterablefile.py

bzrlib/lockable_files.py

bzrlib/lsprof.py

bzrlib/option.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/store

bzrlib/store/text.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_fileid_involved.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/treeshape.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/win32console.py

bzrlib/xml4.py

generate_docs.py

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/riodemo.py

tools/trace-revisions

trash

files removed:
bzrlib/mdiff.py

bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/upgrade.py

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

testsweet.py

files renamed:
bzrlib/store.py => bzrlib/store/__init__.py

bzrlib/weavestore.py => bzrlib/store/weave.py

bzrlib/selftest/ => bzrlib/tests/

bzrlib/selftest/teststatus.py => bzrlib/tests/blackbox/test_status.py

bzrlib/selftest/blackbox.py => bzrlib/tests/blackbox/test_too_much.py

bzrlib/selftest/versioning.py => bzrlib/tests/blackbox/test_versioning.py

bzrlib/selftest/testbranch.py => bzrlib/tests/branch_implementations/test_branch.py

bzrlib/selftest/testdiff.py => bzrlib/tests/test_diff.py

bzrlib/selftest/testfetch.py => bzrlib/tests/test_fetch.py

bzrlib/selftest/testhashcache.py => bzrlib/tests/test_hashcache.py

bzrlib/selftest/testinv.py => bzrlib/tests/test_inv.py

bzrlib/selftest/testlog.py => bzrlib/tests/test_log.py

bzrlib/selftest/testmerge3.py => bzrlib/tests/test_merge3.py

bzrlib/selftest/plugins.py => bzrlib/tests/test_plugins.py

bzrlib/selftest/testrevision.py => bzrlib/tests/test_revision.py

bzrlib/selftest/testrevisionnamespaces.py => bzrlib/tests/test_revisionnamespaces.py

bzrlib/selftest/teststore.py => bzrlib/tests/test_store.py

tools/testweave.py => bzrlib/tests/test_weave.py

bzrlib/selftest/whitebox.py => bzrlib/tests/test_whitebox.py

bzrlib/ui.py => bzrlib/ui/__init__.py

tools/history2weaves.py => bzrlib/upgrade.py

bzrlib/xml.py => bzrlib/xml_serializer.py

bzr-man.py => tools/doc_generate/autodoc_man.py

bzrlib/changeset.py => trash/_changeset.py

bzrlib/merge_core.py => trash/_merge_core.py

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/tests/__init__.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_parent.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_xml.py

bzrlib/textinv.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml5.py

contrib/newinventory.py

contrib/zsh/_bzr

doc/random.txt

setup.py *

tutorial.txt

Show diffs side-by-side

added added

removed removed

bzrlib/hashcache.py

CACHE_HEADER = "### bzr hashcache v5\n"

import os, stat, time

import sha

from bzrlib.osutils import sha_file

from bzrlib.osutils import sha_file, pathjoin

from bzrlib.trace import mutter, warning

from bzrlib.atomicfile import AtomicFile

from bzrlib.errors import BzrError

FP_MTIME_COLUMN = 1

FP_CTIME_COLUMN = 2

FP_MODE_COLUMN = 5

def _fingerprint(abspath):

try:

# we discard any high precision because it's not reliable; perhaps we

# could do better on some systems?

return (fs.st_size, long(fs.st_mtime),

long(fs.st_ctime), fs.st_ino, fs.st_dev)

long(fs.st_ctime), fs.st_ino, fs.st_dev, fs.st_mode)

class HashCache(object):

100

104

self.update_count = 0

101

105

self._cache = {}

102

106

103

104

107

def cache_file_name(self):

105

return os.sep.join([self.basedir, '.bzr', 'stat-cache'])

106

107

108

# FIXME: duplicate path logic here, this should be

109

# something like 'branch.controlfile'.

110

return pathjoin(self.basedir, '.bzr', 'stat-cache')

109

111

110

112

def clear(self):

111

113

"""Discard all cached information.

126

128

prep.sort()

127

129

128

130

for inum, path, cache_entry in prep:

129

abspath = os.sep.join([self.basedir, path])

131

abspath = pathjoin(self.basedir, path)

130

132

fp = _fingerprint(abspath)

131

133

self.stat_count += 1

132

134

139

141

del self._cache[path]

140

142

141

143

142

143

144

def get_sha1(self, path):

144

145

"""Return the sha1 of a file.

145

146

"""

146

abspath = os.sep.join([self.basedir, path])

147

abspath = pathjoin(self.basedir, path)

147

148

self.stat_count += 1

148

149

file_fp = _fingerprint(abspath)

149

150

165

166

return cache_sha1

166

167

168

self.miss_count += 1

168

digest = sha_file(file(abspath, 'rb', buffering=65000))

169

170

171

mode = file_fp[FP_MODE_COLUMN]

172

if stat.S_ISREG(mode):

173

digest = sha_file(file(abspath, 'rb', buffering=65000))

174

elif stat.S_ISLNK(mode):

175

digest = sha.new(os.readlink(abspath)).hexdigest()

176

else:

177

raise BzrError("file %r: unknown file stat mode: %o"%(abspath,mode))

169

178

170

179

now = int(time.time())

171

if file_fp[1] >= now or file_fp[2] >= now:

180

if file_fp[FP_MTIME_COLUMN] >= now or file_fp[FP_CTIME_COLUMN] >= now:

172

181

# changed too recently; can't be cached. we can

173

182

# return the result and it could possibly be cached

174

183

# next time.

184

185

# the point is that we only want to cache when we are sure that any

186

# subsequent modifications of the file can be detected. If a

187

# modification neither changes the inode, the device, the size, nor

188

# the mode, then we can only distinguish it by time; therefore we

189

# need to let sufficient time elapse before we may cache this entry

190

# again. If we didn't do this, then, for example, a very quick 1

191

# byte replacement in the file might go undetected.

175

192

self.danger_count += 1

176

193

if cache_fp:

177

194

self.removed_count += 1

181

198

self.update_count += 1

182

199

self.needs_write = True

183

200

self._cache[path] = (digest, file_fp)

184

185

201

return digest

186

202

187

188

189

190

203

def write(self):

191

204

"""Write contents of cache to file."""

192

205

outf = AtomicFile(self.cache_file_name(), 'wb')

207

220

finally:

208

221

if not outf.closed:

209

222

outf.abort()

210

211

212

223

213

224

def read(self):

214

225

"""Reinstate cache from file.

223

234

try:

224

235

inf = file(fn, 'rb', buffering=65000)

225

236

except IOError, e:

226

mutter("failed to open %s: %s" % (fn, e))

237

mutter("failed to open %s: %s", fn, e)

227

238

# better write it now so it is valid

228

239

self.needs_write = True

229

240

return

231

242

232

243

hdr = inf.readline()

233

244

if hdr != CACHE_HEADER:

234

mutter('cache header marker not found at top of %s; discarding cache'

235

% fn)

245

mutter('cache header marker not found at top of %s;'

246

' discarding cache', fn)

236

247

self.needs_write = True

237

248

return

238

249

245

256

246

257

pos += 3

247

258

fields = l[pos:].split(' ')

248

if len(fields) != 6:

259

if len(fields) != 7:

249

260

warning("bad line in hashcache: %r" % l)

250

261

continue

251

262

Older »