~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/store.py

Committer: Martin Pool
Date: 2005-08-23 00:27:12 UTC
Revision ID: mbp@sourcefrog.net-20050823002712-2b0f5e12243a6116

- merge aaron's merge improvements 999..1008

abentley@panoramicfeedback.com-20050822154931-a0da28d30681e2c6

files added:
bzrlib/mdiff.py

bzrlib/meta_store.py

bzrlib/plugins/checkperms

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/upgrade.py

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

testsweet.py

files removed:
INSTALL

Makefile

NEWS.developers

bzrlib/annotate.py

bzrlib/builtins.py

bzrlib/clone.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/identitymap.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/store

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_parent.py

bzrlib/tests/test_revision_info.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_store.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/transactions.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/win32console.py

bzrlib/xml4.py

bzrlib/xml5.py

tools/biobench.py

tools/capture_tree.py

tools/riodemo.py

tools/trace-revisions

files renamed:
bzr_man.py => bzr-man.py

contrib/newinventory.py => bzrlib/newinventory.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/__init__.py => bzrlib/store.py

bzrlib/upgrade.py => tools/history2weaves.py

bzrlib/tests/test_weave.py => tools/testweave.py

files modified:
.bzrignore

.rsyncexclude

HACKING

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/missing.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/selftest/__init__.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml.py

contrib/zsh/_bzr

doc/index.txt

doc/random.txt

doc/todo-from-arch.txt

setup.py *

tools/weavebench.py

tutorial.txt

Show diffs side-by-side

added added

removed removed

bzrlib/store.py

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# TODO: Could remember a bias towards whether a particular store is typically

# compressed or not.

"""

Stores are the main data-storage mechanism for Bazaar-NG.

unique ID.

"""

import os

from cStringIO import StringIO

import urllib

from zlib import adler32

import bzrlib

import bzrlib.errors as errors

from bzrlib.errors import BzrError, UnlistableStore, TransportNotPossible

from bzrlib.trace import mutter

import bzrlib.transport as transport

from bzrlib.transport.local import LocalTransport

import os, tempfile, types, osutils, gzip, errno

from stat import ST_SIZE

from StringIO import StringIO

from trace import mutter

######################################################################

# stores

pass

class Store(object):

"""This class represents the abstract storage layout for saving information.

class ImmutableStore(object):

"""Store that holds files indexed by unique names.

Files can be added, but not modified once they are in. Typically

the hash is used as the name, or something else known to be unique,

such as a UUID.

>>> st = ImmutableScratchStore()

>>> st.add(StringIO('hello'), 'aa')

>>> 'aa' in st

True

>>> 'foo' in st

False

You are not allowed to add an id that is already present.

Entries can be retrieved as files, which may then be read.

>>> st.add(StringIO('goodbye'), '123123')

>>> st['123123'].read()

'goodbye'

TODO: Atomic add by writing to a temporary file and renaming.

In bzr 0.0.5 and earlier, files within the store were marked

readonly on disk. This is no longer done but existing stores need

to be accommodated.

"""

def __len__(self):

# Abstract placeholder: no length is computed here; this version always raises.
raise NotImplementedError('Children should define their length')

def get(self, fileid, suffix=None):

"""Returns a file reading from a particular entry.

If suffix is present, retrieve the named suffix for fileid.

"""

# No lookup is performed in this version; the body unconditionally raises.
raise NotImplementedError

def __getitem__(self, fileid):

"""DEPRECATED. Please use .get(fileid) instead."""

# Subscript access is not implemented in this version; it always raises.
raise NotImplementedError

#def __contains__(self, fileid):

# """Deprecated, please use has_id"""

# raise NotImplementedError

def __iter__(self):

# Iteration is not implemented in this version; calling it always raises.
raise NotImplementedError

def add(self, f, fileid):

"""Add a file object f to the store accessible from the given fileid"""

# Nothing is stored by this version; it always raises with the message below.
raise NotImplementedError('Children of Store must define their method of adding entries.')

def has_id(self, fileid, suffix=None):

"""Return True or False for the presence of fileid in the store.

suffix, if present, is a per file suffix, i.e. for digital signature

data."""

# No presence check is performed in this version; the body unconditionally raises.
raise NotImplementedError

def listable(self):

"""Return True if this store is able to be listed."""

# The check is purely "does the object expose an __iter__ attribute".
# NOTE(review): a `def __iter__` that only raises NotImplementedError appears
# earlier in this listing; if it belongs to the same class, this test would
# be true for every instance -- confirm against the real file.
return hasattr(self, "__iter__")

def copy_multi(self, other, ids, pb=None, permit_failure=False):

def __init__(self, basedir):

# Remember the directory passed in; _path() and __repr__() read it back
# from self._basedir.
self._basedir = basedir

def _path(self, id):

# Map an entry id to a path directly under self._basedir.
# NOTE: the parameter name shadows the builtin id(); it is part of the
# signature, so it is left unchanged.

# Ids containing a backslash or a forward slash are rejected with
# ValueError before any path is built.
if '\\' in id or '/' in id:

raise ValueError("invalid store id %r" % id)

return os.path.join(self._basedir, id)

def __repr__(self):

# Formats as ClassName(<repr of self._basedir>), using the runtime class name.
return "%s(%r)" % (self.__class__.__name__, self._basedir)

def add(self, f, fileid, compressed=True):

"""Add contents of a file into the store.

f -- An open file, or file-like object."""

# FIXME: Only works on files that will fit in memory

from bzrlib.atomicfile import AtomicFile

mutter("add store entry %r" % (fileid))

if isinstance(f, types.StringTypes):

content = f

else:

content = f.read()

p = self._path(fileid)

if os.access(p, os.F_OK) or os.access(p + '.gz', os.F_OK):

from bzrlib.errors import bailout

raise BzrError("store %r already contains id %r" % (self._basedir, fileid))

fn = p

if compressed:

fn = fn + '.gz'

100

af = AtomicFile(fn, 'wb')

101

try:

102

if compressed:

103

gf = gzip.GzipFile(mode='wb', fileobj=af)

104

gf.write(content)

105

gf.close()

106

else:

107

af.write(content)

108

af.commit()

109

finally:

110

af.close()

111

112

113

def copy_multi(self, other, ids):

114

"""Copy texts for ids from other into self.

115

116

If an id is present in self, it is skipped. A count of copied

117

ids is returned, which may be less than len(ids).

:param other: Another Store object

:param ids: A list of entry ids to be copied

:param pb: A ProgressBar object, if none is given, the default will be created.

:param permit_failure: Allow missing entries to be ignored

100

:return: (n_copied, [failed]) The number of entries copied successfully,

101

followed by a list of entries which could not be copied (because they

102

were missing)

103

118

"""

104

if pb is None:

105

pb = bzrlib.ui.ui_factory.progress_bar()

119

from bzrlib.progress import ProgressBar

120

pb = ProgressBar()

106

121

pb.update('preparing to copy')

107

failed = set()

122

to_copy = [id for id in ids if id not in self]

123

if isinstance(other, ImmutableStore):

124

return self.copy_multi_immutable(other, to_copy, pb)

108

125

count = 0

109

ids = list(ids) # get the list for showing a length.

110

for fileid in ids:

126

for id in to_copy:

111

127

count += 1

112

if self.has_id(fileid):

113

continue

128

pb.update('copy', count, len(to_copy))

129

self.add(other[id], id)

130

assert count == len(to_copy)

131

pb.clear()

132

return count

133

134

135

def copy_multi_immutable(self, other, to_copy, pb):

136

from shutil import copyfile

137

count = 0

138

for id in to_copy:

139

p = self._path(id)

140

other_p = other._path(id)

114

141

try:

115

self._copy_one(fileid, None, other, pb)

116

for suffix in self._suffixes:

117

try:

118

self._copy_one(fileid, suffix, other, pb)

119

except KeyError:

120

pass

121

pb.update('copy', count, len(ids))

122

except KeyError:

123

if permit_failure:

124

failed.add(fileid)

142

copyfile(other_p, p)

143

except IOError, e:

144

if e.errno == errno.ENOENT:

145

copyfile(other_p+".gz", p+".gz")

125

146

else:

126

147

raise

127

assert count == len(ids)

148

149

count += 1

150

pb.update('copy', count, len(to_copy))

151

assert count == len(to_copy)

128

152

pb.clear()

129

return count, failed

130

131

def _copy_one(self, fileid, suffix, other, pb):

132

"""Most generic copy-one object routine.

133

134

Subclasses can override this to provide an optimised

135

copy between their own instances. Such overridden routines

136

should call this if they have no optimised facility for a

137

specific 'other'.

138

"""

139

mutter('Store._copy_one: %r', fileid)

140

f = other.get(fileid, suffix)

141

self.add(f, fileid, suffix)

142

143

144

class TransportStore(Store):

145

"""A TransportStore is a Store superclass for Stores that use Transports."""

146

147

def add(self, f, fileid, suffix=None):

148

"""Add contents of a file into the store.

149

150

f -- A file-like object, or string

151

"""

152

mutter("add store entry %r", fileid)

153

154

names = self._id_to_names(fileid, suffix)

155

if self._transport.has_any(names):

156

raise BzrError("store %r already contains id %r"

157

% (self._transport.base, fileid))

158

159

# Most of the time, just adding the file will work

160

# if we find a time where it fails, (because the dir

161

# doesn't exist), then create the dir, and try again

162

self._add(names[0], f)

163

164

165

def _add(self, relpath, f):

166

"""Actually add the file to the given location.

167

This should be overridden by children.

168

"""

169

raise NotImplementedError('children need to implement this function.')

170

171

def _check_fileid(self, fileid):

172

if not isinstance(fileid, basestring):

173

raise TypeError('Fileids should be a string type: %s %r' % (type(fileid), fileid))

174

if '\\' in fileid or '/' in fileid:

175

raise ValueError("invalid store id %r" % fileid)

176

177

def _id_to_names(self, fileid, suffix):

178

"""Return the names in the expected order"""

179

if suffix is not None:

180

fn = self._relpath(fileid, [suffix])

181

else:

182

fn = self._relpath(fileid)

183

184

fn_gz = fn + '.gz'

185

if self._compressed:

186

return fn_gz, fn

187

else:

188

return fn, fn_gz

189

190

def has_id(self, fileid, suffix=None):

191

"""See Store.has_id."""

192

return self._transport.has_any(self._id_to_names(fileid, suffix))

193

194

def _get_name(self, fileid, suffix=None):

195

"""A special check, which returns the name of an existing file.

196

197

This is similar in spirit to 'has_id', but it is designed

198

to return information about which file the store has.

199

"""

200

for name in self._id_to_names(fileid, suffix=suffix):

201

if self._transport.has(name):

202

return name

203

return None

204

205

def _get(self, filename):

206

"""Return an vanilla file stream for clients to read from.

207

208

This is the body of a template method on 'get', and should be

209

implemented by subclasses.

210

"""

211

raise NotImplementedError

212

213

def get(self, fileid, suffix=None):

214

"""See Store.get()."""

215

names = self._id_to_names(fileid, suffix)

216

for name in names:

217

try:

218

return self._get(name)

219

except errors.NoSuchFile:

220

pass

221

raise KeyError(fileid)

222

223

def __init__(self, a_transport, prefixed=False, compressed=False):

224

assert isinstance(a_transport, transport.Transport)

225

super(TransportStore, self).__init__()

226

self._transport = a_transport

227

self._prefixed = prefixed

228

self._compressed = compressed

229

self._suffixes = set()

230

231

def _iter_files_recursive(self):

232

"""Iterate through the files in the transport."""

233

for quoted_relpath in self._transport.iter_files_recursive():

234

yield urllib.unquote(quoted_relpath)

153

return count

154

155

156

def __contains__(self, fileid):

157

""""""

158

p = self._path(fileid)

159

return (os.access(p, os.R_OK)

160

or os.access(p + '.gz', os.R_OK))

161

162

# TODO: Guard against the same thing being stored twice, compressed and uncompressed

235

163

236

164

def __iter__(self):

237

for relpath in self._iter_files_recursive():

238

# worst case is one of each suffix.

239

name = os.path.basename(relpath)

240

if name.endswith('.gz'):

241

name = name[:-3]

242

skip = False

243

for count in range(len(self._suffixes)):

244

for suffix in self._suffixes:

245

if name.endswith('.' + suffix):

246

skip = True

247

if not skip:

248

yield name

165

for f in os.listdir(self._basedir):

166

if f[-3:] == '.gz':

167

# TODO: case-insensitive?

168

yield f[:-3]

169

else:

170

yield f

249

171

250

172

def __len__(self):

251

return len(list(self.__iter__()))

252

253

def _relpath(self, fileid, suffixes=None):

254

self._check_fileid(fileid)

255

if suffixes:

256

for suffix in suffixes:

257

if not suffix in self._suffixes:

258

raise ValueError("Unregistered suffix %r" % suffix)

259

self._check_fileid(suffix)

260

else:

261

suffixes = []

262

if self._prefixed:

263

path = [hash_prefix(fileid) + fileid]

264

else:

265

path = [fileid]

266

path.extend(suffixes)

267

return transport.urlescape(u'.'.join(path))

268

269

def __repr__(self):

270

if self._transport is None:

271

return "%s(None)" % (self.__class__.__name__)

272

else:

273

return "%s(%r)" % (self.__class__.__name__, self._transport.base)

274

275

__str__ = __repr__

276

277

def listable(self):

278

"""Return True if this store is able to be listed."""

279

return self._transport.listable()

280

281

def register_suffix(self, suffix):

282

"""Register a suffix as being expected in this store."""

283

self._check_fileid(suffix)

284

if suffix == 'gz':

285

raise ValueError('You cannot register the "gz" suffix.')

286

self._suffixes.add(suffix)

173

return len(os.listdir(self._basedir))

174

175

176

def __getitem__(self, fileid):

177

"""Returns a file reading from a particular entry."""

178

p = self._path(fileid)

179

try:

180

return gzip.GzipFile(p + '.gz', 'rb')

181

except IOError, e:

182

if e.errno != errno.ENOENT:

183

raise

184

185

try:

186

return file(p, 'rb')

187

except IOError, e:

188

if e.errno != errno.ENOENT:

189

raise

190

191

raise IndexError(fileid)

192

287

193

288

194

def total_size(self):

289

195

"""Return (count, bytes)

292

198

the content."""

293

199

total = 0

294

200

count = 0

295

for relpath in self._transport.iter_files_recursive():

201

for fid in self:

296

202

count += 1

297

total += self._transport.stat(relpath).st_size

203

p = self._path(fid)

204

try:

205

total += os.stat(p)[ST_SIZE]

206

except OSError:

207

total += os.stat(p + '.gz')[ST_SIZE]

298

208

299

209

return count, total

300

210

301

211

302

def ImmutableMemoryStore():

303

return bzrlib.store.text.TextStore(transport.memory.MemoryTransport())

304

305

306

class CachedStore(Store):

307

"""A store that caches data locally, to avoid repeated downloads.

308

The precacache method should be used to avoid server round-trips for

309

every piece of data.

212

213

214

class ImmutableScratchStore(ImmutableStore):

215

"""Self-destructing test subclass of ImmutableStore.

216

217

The Store only exists for the lifetime of the Python object.

218

Obviously you should not put anything precious in it.

310

219

"""

311

312

def __init__(self, store, cache_dir):

313

super(CachedStore, self).__init__()

314

self.source_store = store

315

# This clones the source store type with a locally bound

316

# transport. FIXME: it assumes a constructor is == cloning.

317

# clonable store - it might be nicer to actually have a clone()

318

# or something. RBC 20051003

319

self.cache_store = store.__class__(LocalTransport(cache_dir))

320

321

def get(self, id):

322

mutter("Cache add %s", id)

323

if id not in self.cache_store:

324

self.cache_store.add(self.source_store.get(id), id)

325

return self.cache_store.get(id)

326

327

def has_id(self, fileid, suffix=None):

328

"""See Store.has_id."""

329

if self.cache_store.has_id(fileid, suffix):

330

return True

331

if self.source_store.has_id(fileid, suffix):

332

# We could asynchronously copy at this time

333

return True

334

return False

335

336

337

def copy_all(store_from, store_to):

338

"""Copy all ids from one store to another."""

339

# TODO: Optional progress indicator

340

if not store_from.listable():

341

raise UnlistableStore(store_from)

342

ids = [f for f in store_from]

343

mutter('copy_all ids: %r', ids)

344

store_to.copy_multi(store_from, ids)

345

346

def hash_prefix(fileid):

347

return "%02x/" % (adler32(fileid) & 0xff)

348

220

def __init__(self):

221

ImmutableStore.__init__(self, tempfile.mkdtemp())

222

223

def __del__(self):

224

for f in os.listdir(self._basedir):

225

fpath = os.path.join(self._basedir, f)

226

# needed on windows, and maybe some other filesystems

227

os.chmod(fpath, 0600)

228

os.remove(fpath)

229

os.rmdir(self._basedir)

230

mutter("%r destroyed" % self)

Older »