~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/statcache.py

Committer: Martin Pool
Date: 2005-07-04 07:34:19 UTC
Revision ID: mbp@sourcefrog.net-20050704073419-44eb753d5556a4d0

- rename control file to pending-merges

files added:
bzr-man.py

bzrlib/lock.py

bzrlib/meta_store.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/selftest

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/upgrade.py

contrib/bash/bzr

contrib/create_bzr_rollup.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

effbot

effbot/__init__.py

effbot/org

effbot/org/__init__.py

effbot/org/gzip_consumer.py

effbot/org/http_client.py

effbot/org/http_manager.py

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/plugins-no-plugins.patch

patches/progress.diff

plugins

plugins/changeset

plugins/changeset/__init__.py

plugins/changeset/apply_changeset.py

plugins/changeset/common.py

plugins/changeset/gen_changeset.py

plugins/changeset/read_changeset.py

plugins/checkperms

plugins/rsync

plugins/rsync/__init__.py

plugins/rsync/rsync_update.py

files renamed:
contrib/bash/bzr => contrib/bash/bzr.simple

files modified:
.bzrignore

NEWS

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/help.py

bzrlib/inventory.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge_core.py

bzrlib/newinventory.py

bzrlib/osutils.py

bzrlib/remotebranch.py

bzrlib/revision.py

bzrlib/statcache.py

bzrlib/status.py

bzrlib/store.py

bzrlib/tree.py

bzrlib/xml.py

contrib/add-bzr-to-baz

doc/formats.txt

testbzr

Show diffs side-by-side

added added

removed removed

bzrlib/statcache.py

to gradually adjust your clock or don't use bzr over the step.

At the moment this is stored in a simple textfile; it might be nice

to use a tdb instead.

to use a tdb instead to allow faster lookup by file-id.

The cache is represented as a map from file_id to a tuple of (file_id,

sha1, path, size, mtime, ctime, ino, dev).

The SHA-1 is stored in memory as a hexdigest.

File names and file-ids are written out with non-ascii or whitespace

characters given as python-style unicode escapes. (file-ids shouldn't

contain weird characters, but it might happen.)

This version of the file on disk has one line per record, and fields

separated by \0 characters.

"""

# order of fields returned by fingerprint()

CACHE_HEADER = "### bzr statcache v3"

CACHE_HEADER = "### bzr statcache v4"

def fingerprint(abspath):

107

106

108

107

109

108

110

def safe_quote(s):

111

return s.encode('unicode_escape') \

112

.replace('\n', '\\u000a') \

113

.replace(' ', '\\u0020') \

114

.replace('\r', '\\u000d')

115

116

117

109

def _write_cache(basedir, entries):

118

110

from atomicfile import AtomicFile

119

111

120

112

cachefn = os.path.join(basedir, '.bzr', 'stat-cache')

121

113

outf = AtomicFile(cachefn, 'wb')

122

outf.write(CACHE_HEADER + '\n')

123

114

try:

115

outf.write(CACHE_HEADER + '\n')

116

124

117

for entry in entries:

125

118

if len(entry) != 8:

126

119

raise ValueError("invalid statcache entry tuple %r" % entry)

127

outf.write(safe_quote(entry[0])) # file id

128

outf.write(' ')

120

outf.write(entry[0].encode('utf-8')) # file id

121

outf.write('\0')

129

122

outf.write(entry[1]) # hex sha1

130

outf.write(' ')

131

outf.write(safe_quote(entry[2])) # name

123

outf.write('\0')

124

outf.write(entry[2].encode('utf-8')) # name

132

125

for nf in entry[3:]:

133

outf.write(' %d' % nf)

126

outf.write('\0%d' % nf)

134

127

outf.write('\n')

135

128

136

129

outf.commit()

153

146

import re

154

147

cache = {}

155

148

seen_paths = {}

149

from bzrlib.trace import warning

150

151

assert isinstance(basedir, basestring)

156

152

157

153

sha_re = re.compile(r'[a-f0-9]{40}')

158

154

164

160

165

161

line1 = cachefile.readline().rstrip('\r\n')

166

162

if line1 != CACHE_HEADER:

167

mutter('cache header marker not found at top of %s' % cachefn)

163

mutter('cache header marker not found at top of %s; discarding cache'

164

% cachefn)

168

165

return cache

169

166

170

167

for l in cachefile:

171

f = l.split(' ')

168

f = l.split('\0')

172

169

173

file_id = f[0].decode('unicode_escape')

170

file_id = f[0].decode('utf-8')

174

171

if file_id in cache:

175

raise BzrCheckError("duplicated file_id in cache: {%s}" % file_id)

172

warning("duplicated file_id in cache: {%s}" % file_id)

176

173

177

174

text_sha = f[1]

178

175

if len(text_sha) != 40 or not sha_re.match(text_sha):

179

176

raise BzrCheckError("invalid file SHA-1 in cache: %r" % text_sha)

180

177

181

path = f[2].decode('unicode_escape')

178

path = f[2].decode('utf-8')

182

179

if path in seen_paths:

183

raise BzrCheckError("duplicated path in cache: %r" % path)

180

warning("duplicated path in cache: %r" % path)

184

181

seen_paths[path] = True

185

182

186

183

entry = (file_id, text_sha, path) + tuple([long(x) for x in f[3:]])

192

189

193

190

194

191

195

196

192

def _files_from_inventory(inv):

197

193

for path, ie in inv.iter_entries():

198

194

if ie.kind != 'file':

Older »