~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/hashcache.py

Committer: John Arbash Meinel
Date: 2006-02-15 15:18:44 UTC
mto: (1185.79.1 bzr-jam-pending)
mto: This revision was merged to the branch mainline in revision 1554.
Revision ID: john@arbash-meinel.com-20060215151844-ce3e3efccd19da3f

Reverting gpg changes; they should not be in mainline. See the gpg_uses_tempfile plugin.

files added:
BRANCH.TODO

INSTALL

NEWS.developers

bzrlib/annotate.py

bzrlib/builtins.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/identitymap.py

bzrlib/iterablefile.py

bzrlib/lockable_files.py

bzrlib/lsprof.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/store

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_fileid_involved.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_parent.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/transactions.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/win32console.py

bzrlib/xml4.py

bzrlib/xml5.py

generate_docs.py

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/riodemo.py

tools/trace-revisions

files removed:
bzrlib/mdiff.py

bzrlib/meta_store.py

bzrlib/plugins/checkperms

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/upgrade.py

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

testsweet.py

files renamed:
bzrlib/changeset.py => bzrlib/_changeset.py

bzrlib/merge_core.py => bzrlib/_merge_core.py

bzrlib/store.py => bzrlib/store/__init__.py

bzrlib/selftest/ => bzrlib/tests/

bzrlib/selftest/teststatus.py => bzrlib/tests/blackbox/test_status.py

bzrlib/selftest/blackbox.py => bzrlib/tests/blackbox/test_too_much.py

bzrlib/selftest/versioning.py => bzrlib/tests/blackbox/test_versioning.py

bzrlib/selftest/testbranch.py => bzrlib/tests/branch_implementations/test_branch.py

bzrlib/selftest/testdiff.py => bzrlib/tests/test_diff.py

bzrlib/selftest/testhashcache.py => bzrlib/tests/test_hashcache.py

bzrlib/selftest/testinv.py => bzrlib/tests/test_inv.py

bzrlib/selftest/testlog.py => bzrlib/tests/test_log.py

bzrlib/selftest/testmerge3.py => bzrlib/tests/test_merge3.py

bzrlib/selftest/plugins.py => bzrlib/tests/test_plugins.py

bzrlib/selftest/testrevision.py => bzrlib/tests/test_revision.py

bzrlib/selftest/testrevisionnamespaces.py => bzrlib/tests/test_revisionnamespaces.py

tools/testweave.py => bzrlib/tests/test_weave.py

bzrlib/selftest/whitebox.py => bzrlib/tests/test_whitebox.py

bzrlib/ui.py => bzrlib/ui/__init__.py

tools/history2weaves.py => bzrlib/upgrade.py

bzrlib/xml.py => bzrlib/xml_serializer.py

bzrlib/newinventory.py => contrib/newinventory.py

bzr-man.py => tools/doc_generate/autodoc_man.py

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/tests/__init__.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_smart_add.py

bzrlib/textinv.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib/zsh/_bzr

doc/index.txt

doc/random.txt

doc/todo-from-arch.txt

setup.py *

tools/weavebench.py

tutorial.txt

Show diffs side-by-side

added added

removed removed

bzrlib/hashcache.py

# TODO: Perhaps return more details on the file to avoid statting it

# again: nonexistent, file type, size, etc

# TODO: Perhaps use a Python pickle instead of a text file; might be faster.

CACHE_HEADER = "### bzr hashcache v5\n"

import os, stat, time

import sha

from bzrlib.osutils import sha_file

from bzrlib.osutils import sha_file, pathjoin

from bzrlib.trace import mutter, warning

from bzrlib.atomicfile import AtomicFile

from bzrlib.errors import BzrError

FP_MTIME_COLUMN = 1

FP_CTIME_COLUMN = 2

FP_MODE_COLUMN = 5

def _fingerprint(abspath):

try:

# we discard any high precision because it's not reliable; perhaps we

# could do better on some systems?

return (fs.st_size, long(fs.st_mtime),

long(fs.st_ctime), fs.st_ino, fs.st_dev)

long(fs.st_ctime), fs.st_ino, fs.st_dev, fs.st_mode)

class HashCache(object):

104

self.update_count = 0

105

self._cache = {}

106

100

107

def cache_file_name(self):

101

return os.sep.join([self.basedir, '.bzr', 'stat-cache'])

102

103

104

108

# FIXME: duplicate path logic here, this should be

109

# something like 'branch.controlfile'.

110

return pathjoin(self.basedir, '.bzr', 'stat-cache')

105

111

106

112

def clear(self):

107

113

"""Discard all cached information.

122

128

prep.sort()

123

129

124

130

for inum, path, cache_entry in prep:

125

abspath = os.sep.join([self.basedir, path])

131

abspath = pathjoin(self.basedir, path)

126

132

fp = _fingerprint(abspath)

127

133

self.stat_count += 1

128

134

135

141

del self._cache[path]

136

142

137

143

138

139

144

def get_sha1(self, path):

140

145

"""Return the sha1 of a file.

141

146

"""

142

abspath = os.sep.join([self.basedir, path])

147

abspath = pathjoin(self.basedir, path)

143

148

self.stat_count += 1

144

149

file_fp = _fingerprint(abspath)

145

150

161

166

return cache_sha1

162

167

163

168

self.miss_count += 1

164

digest = sha_file(file(abspath, 'rb', buffering=65000))

169

170

171

mode = file_fp[FP_MODE_COLUMN]

172

if stat.S_ISREG(mode):

173

digest = sha_file(file(abspath, 'rb', buffering=65000))

174

elif stat.S_ISLNK(mode):

175

digest = sha.new(os.readlink(abspath)).hexdigest()

176

else:

177

raise BzrError("file %r: unknown file stat mode: %o"%(abspath,mode))

165

178

166

179

now = int(time.time())

167

if file_fp[1] >= now or file_fp[2] >= now:

180

if file_fp[FP_MTIME_COLUMN] >= now or file_fp[FP_CTIME_COLUMN] >= now:

168

181

# changed too recently; can't be cached. we can

169

182

# return the result and it could possibly be cached

170

183

# next time.

184

185

# the point is that we only want to cache when we are sure that any

186

# subsequent modifications of the file can be detected. If a

187

# modification neither changes the inode, the device, the size, nor

188

# the mode, then we can only distinguish it by time; therefore we

189

# need to let sufficient time elapse before we may cache this entry

190

# again. If we didn't do this, then, for example, a very quick 1

191

# byte replacement in the file might go undetected.

171

192

self.danger_count += 1

172

193

if cache_fp:

173

194

self.removed_count += 1

177

198

self.update_count += 1

178

199

self.needs_write = True

179

200

self._cache[path] = (digest, file_fp)

180

181

201

return digest

182

202

183

184

185

186

203

def write(self):

187

204

"""Write contents of cache to file."""

188

from atomicfile import AtomicFile

189

190

205

outf = AtomicFile(self.cache_file_name(), 'wb')

191

206

try:

192

207

print >>outf, CACHE_HEADER,

205

220

finally:

206

221

if not outf.closed:

207

222

outf.abort()

208

209

210

223

211

224

def read(self):

212

225

"""Reinstate cache from file.

221

234

try:

222

235

inf = file(fn, 'rb', buffering=65000)

223

236

except IOError, e:

224

mutter("failed to open %s: %s" % (fn, e))

237

mutter("failed to open %s: %s", fn, e)

238

# better write it now so it is valid

239

self.needs_write = True

225

240

return

226

241

227

242

228

243

hdr = inf.readline()

229

244

if hdr != CACHE_HEADER:

230

mutter('cache header marker not found at top of %s; discarding cache'

231

% fn)

245

mutter('cache header marker not found at top of %s;'

246

' discarding cache', fn)

247

self.needs_write = True

232

248

return

233

249

234

250

for l in inf:

240

256

241

257

pos += 3

242

258

fields = l[pos:].split(' ')

243

if len(fields) != 6:

259

if len(fields) != 7:

244

260

warning("bad line in hashcache: %r" % l)

245

261

continue

246

262

Older »