~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/store.py

Committer: Martin Pool
Date: 2005-07-07 02:07:03 UTC
Revision ID: mbp@sourcefrog.net-20050707020702-0e24e478b738d4db

- Put files inside an exported tarball into a top-level directory rather than
dumping them into the current directory.

files added:
bzrlib/mdiff.py

bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/statcache.py

bzrlib/upgrade.py

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

plugins/changeset

plugins/changeset/__init__.py

plugins/changeset/apply_changeset.py

plugins/changeset/common.py

plugins/changeset/gen_changeset.py

plugins/changeset/read_changeset.py

plugins/checkperms

testbzr

testsweet.py

files removed:
BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS.developers

bzrlib/annotate.py

bzrlib/builtins.py

bzrlib/clone.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/identitymap.py

bzrlib/intset.py

bzrlib/lsprof.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/plugins/__init__.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/store

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_parent.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_remove.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/transactions.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/emacs

contrib/emacs/bzr-mode.el

doc/split-join-files.txt

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/revfile.txt

notes/schemas.xml

tools

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files renamed:
bzr_man.py => bzr-man.py

contrib/newinventory.py => bzrlib/newinventory.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/__init__.py => bzrlib/store.py

bzrlib/util/effbot/ => effbot/

bzrlib/util/elementtree/ => elementtree/

bzrlib/plugins/ => plugins/

bzrlib/util/urlgrabber/ => urlgrabber/

files modified:
.bzrignore

.rsyncexclude

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py *

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/selftest/__init__.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/workingtree.py

bzrlib/xml.py

contrib/pwk

contrib/zsh/_bzr

doc/index.txt

doc/random.txt

doc/todo-from-arch.txt

setup.py *

Show diffs side-by-side

added added

removed removed

bzrlib/store.py

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# TODO: Could remember a bias towards whether a particular store is typically

# compressed or not.

"""

Stores are the main data-storage mechanism for Bazaar-NG.

unique ID.

"""

import os

from cStringIO import StringIO

import urllib

from zlib import adler32

import bzrlib

import bzrlib.errors as errors

from bzrlib.errors import BzrError, UnlistableStore, TransportNotPossible

from bzrlib.trace import mutter

import bzrlib.transport as transport

from bzrlib.transport.local import LocalTransport

import os, tempfile, types, osutils, gzip, errno

from stat import ST_SIZE

from StringIO import StringIO

from trace import mutter

######################################################################

# stores

pass

class Store(object):

"""This class represents the abstract storage layout for saving information.

class ImmutableStore(object):

"""Store that holds files indexed by unique names.

Files can be added, but not modified once they are in. Typically

the hash is used as the name, or something else known to be unique,

such as a UUID.

>>> st = ImmutableScratchStore()

>>> st.add(StringIO('hello'), 'aa')

>>> 'aa' in st

True

>>> 'foo' in st

False

You are not allowed to add an id that is already present.

Entries can be retrieved as files, which may then be read.

>>> st.add(StringIO('goodbye'), '123123')

>>> st['123123'].read()

'goodbye'

TODO: Atomic add by writing to a temporary file and renaming.

In bzr 0.0.5 and earlier, files within the store were marked

readonly on disk. This is no longer done but existing stores need

to be accommodated.

"""

def __len__(self):

raise NotImplementedError('Children should define their length')

def get(self, fileid, suffix=None):

"""Returns a file reading from a particular entry.

If suffix is present, retrieve the named suffix for fileid.

"""

raise NotImplementedError

def __getitem__(self, fileid):

"""DEPRECATED. Please use .get(fileid) instead."""

raise NotImplementedError

#def __contains__(self, fileid):

# """Deprecated, please use has_id"""

# raise NotImplementedError

def __iter__(self):

raise NotImplementedError

def add(self, f, fileid):

"""Add a file object f to the store accessible from the given fileid"""

raise NotImplementedError('Children of Store must define their method of adding entries.')

def has_id(self, fileid, suffix=None):

"""Return True or false for the presence of fileid in the store.

suffix, if present, is a per file suffix, i.e. for digital signature

data."""

raise NotImplementedError

def listable(self):

"""Return True if this store is able to be listed."""

return hasattr(self, "__iter__")

def copy_multi(self, other, ids, pb=None, permit_failure=False):

def __init__(self, basedir):

self._basedir = basedir

def _path(self, id):

if '\\' in id or '/' in id:

raise ValueError("invalid store id %r" % id)

return os.path.join(self._basedir, id)

def __repr__(self):

return "%s(%r)" % (self.__class__.__name__, self._basedir)

def add(self, f, fileid, compressed=True):

"""Add contents of a file into the store.

f -- An open file, or file-like object."""

# FIXME: Only works on files that will fit in memory

from bzrlib.atomicfile import AtomicFile

mutter("add store entry %r" % (fileid))

if isinstance(f, types.StringTypes):

content = f

else:

content = f.read()

p = self._path(fileid)

if os.access(p, os.F_OK) or os.access(p + '.gz', os.F_OK):

raise BzrError("store %r already contains id %r" % (self._basedir, fileid))

fn = p

if compressed:

fn = fn + '.gz'

af = AtomicFile(fn, 'wb')

100

try:

101

if compressed:

102

gf = gzip.GzipFile(mode='wb', fileobj=af)

103

gf.write(content)

104

gf.close()

105

else:

106

af.write(content)

107

af.commit()

108

finally:

109

af.close()

110

111

112

def copy_multi(self, other, ids):

113

"""Copy texts for ids from other into self.

114

115

If an id is present in self, it is skipped. A count of copied

116

ids is returned, which may be less than len(ids).

:param other: Another Store object

:param ids: A list of entry ids to be copied

:param pb: A ProgressBar object, if none is given, the default will be created.

:param permit_failure: Allow missing entries to be ignored

100

:return: (n_copied, [failed]) The number of entries copied successfully,

101

followed by a list of entries which could not be copied (because they

102

were missing)

103

117

"""

104

if pb is None:

105

pb = bzrlib.ui.ui_factory.progress_bar()

118

from bzrlib.progress import ProgressBar

119

pb = ProgressBar()

106

120

pb.update('preparing to copy')

107

failed = set()

121

to_copy = [id for id in ids if id not in self]

122

if isinstance(other, ImmutableStore):

123

return self.copy_multi_immutable(other, to_copy, pb)

108

124

count = 0

109

ids = list(ids) # get the list for showing a length.

110

for fileid in ids:

125

for id in to_copy:

111

126

count += 1

112

if self.has_id(fileid):

113

continue

127

pb.update('copy', count, len(to_copy))

128

self.add(other[id], id)

129

assert count == len(to_copy)

130

pb.clear()

131

return count

132

133

134

def copy_multi_immutable(self, other, to_copy, pb):

135

from shutil import copyfile

136

count = 0

137

for id in to_copy:

138

p = self._path(id)

139

other_p = other._path(id)

114

140

try:

115

self._copy_one(fileid, None, other, pb)

116

for suffix in self._suffixes:

117

try:

118

self._copy_one(fileid, suffix, other, pb)

119

except KeyError:

120

pass

121

pb.update('copy', count, len(ids))

122

except KeyError:

123

if permit_failure:

124

failed.add(fileid)

141

copyfile(other_p, p)

142

except IOError, e:

143

if e.errno == errno.ENOENT:

144

copyfile(other_p+".gz", p+".gz")

125

145

else:

126

146

raise

127

assert count == len(ids)

147

148

count += 1

149

pb.update('copy', count, len(to_copy))

150

assert count == len(to_copy)

128

151

pb.clear()

129

return count, failed

130

131

def _copy_one(self, fileid, suffix, other, pb):

132

"""Most generic copy-one object routine.

133

134

Subclasses can override this to provide an optimised

135

copy between their own instances. Such overridden routines

136

should call this if they have no optimised facility for a

137

specific 'other'.

138

"""

139

mutter('Store._copy_one: %r', fileid)

140

f = other.get(fileid, suffix)

141

self.add(f, fileid, suffix)

142

143

144

class TransportStore(Store):

145

"""A TransportStore is a Store superclass for Stores that use Transports."""

146

147

def add(self, f, fileid, suffix=None):

148

"""Add contents of a file into the store.

149

150

f -- A file-like object, or string

151

"""

152

mutter("add store entry %r", fileid)

153

154

names = self._id_to_names(fileid, suffix)

155

if self._transport.has_any(names):

156

raise BzrError("store %r already contains id %r"

157

% (self._transport.base, fileid))

158

159

# Most of the time, just adding the file will work

160

# if we find a time where it fails, (because the dir

161

# doesn't exist), then create the dir, and try again

162

self._add(names[0], f)

163

164

165

def _add(self, relpath, f):

166

"""Actually add the file to the given location.

167

This should be overridden by children.

168

"""

169

raise NotImplementedError('children need to implement this function.')

170

171

def _check_fileid(self, fileid):

172

if not isinstance(fileid, basestring):

173

raise TypeError('Fileids should be a string type: %s %r' % (type(fileid), fileid))

174

if '\\' in fileid or '/' in fileid:

175

raise ValueError("invalid store id %r" % fileid)

176

177

def _id_to_names(self, fileid, suffix):

178

"""Return the names in the expected order"""

179

if suffix is not None:

180

fn = self._relpath(fileid, [suffix])

181

else:

182

fn = self._relpath(fileid)

183

184

fn_gz = fn + '.gz'

185

if self._compressed:

186

return fn_gz, fn

187

else:

188

return fn, fn_gz

189

190

def has_id(self, fileid, suffix=None):

191

"""See Store.has_id."""

192

return self._transport.has_any(self._id_to_names(fileid, suffix))

193

194

def _get_name(self, fileid, suffix=None):

195

"""A special check, which returns the name of an existing file.

196

197

This is similar in spirit to 'has_id', but it is designed

198

to return information about which file the store has.

199

"""

200

for name in self._id_to_names(fileid, suffix=suffix):

201

if self._transport.has(name):

202

return name

203

return None

204

205

def _get(self, filename):

206

"""Return an vanilla file stream for clients to read from.

207

208

This is the body of a template method on 'get', and should be

209

implemented by subclasses.

210

"""

211

raise NotImplementedError

212

213

def get(self, fileid, suffix=None):

214

"""See Store.get()."""

215

names = self._id_to_names(fileid, suffix)

216

for name in names:

217

try:

218

return self._get(name)

219

except errors.NoSuchFile:

220

pass

221

raise KeyError(fileid)

222

223

def __init__(self, a_transport, prefixed=False, compressed=False,

224

dir_mode=None, file_mode=None):

225

assert isinstance(a_transport, transport.Transport)

226

super(TransportStore, self).__init__()

227

self._transport = a_transport

228

self._prefixed = prefixed

229

self._compressed = compressed

230

self._suffixes = set()

231

232

# It is okay for these to be None, it just means they

233

# will just use the filesystem defaults

234

self._dir_mode = dir_mode

235

self._file_mode = file_mode

236

237

def _iter_files_recursive(self):

238

"""Iterate through the files in the transport."""

239

for quoted_relpath in self._transport.iter_files_recursive():

240

yield urllib.unquote(quoted_relpath)

152

return count

153

154

155

def __contains__(self, fileid):

156

""""""

157

p = self._path(fileid)

158

return (os.access(p, os.R_OK)

159

or os.access(p + '.gz', os.R_OK))

160

161

# TODO: Guard against the same thing being stored twice, compressed and uncompressed

241

162

242

163

def __iter__(self):

243

for relpath in self._iter_files_recursive():

244

# worst case is one of each suffix.

245

name = os.path.basename(relpath)

246

if name.endswith('.gz'):

247

name = name[:-3]

248

skip = False

249

for count in range(len(self._suffixes)):

250

for suffix in self._suffixes:

251

if name.endswith('.' + suffix):

252

skip = True

253

if not skip:

254

yield name

164

for f in os.listdir(self._basedir):

165

if f[-3:] == '.gz':

166

# TODO: case-insensitive?

167

yield f[:-3]

168

else:

169

yield f

255

170

256

171

def __len__(self):

257

return len(list(self.__iter__()))

258

259

def _relpath(self, fileid, suffixes=None):

260

self._check_fileid(fileid)

261

if suffixes:

262

for suffix in suffixes:

263

if not suffix in self._suffixes:

264

raise ValueError("Unregistered suffix %r" % suffix)

265

self._check_fileid(suffix)

266

else:

267

suffixes = []

268

if self._prefixed:

269

path = [hash_prefix(fileid) + fileid]

270

else:

271

path = [fileid]

272

path.extend(suffixes)

273

return transport.urlescape(u'.'.join(path))

274

275

def __repr__(self):

276

if self._transport is None:

277

return "%s(None)" % (self.__class__.__name__)

278

else:

279

return "%s(%r)" % (self.__class__.__name__, self._transport.base)

280

281

__str__ = __repr__

282

283

def listable(self):

284

"""Return True if this store is able to be listed."""

285

return self._transport.listable()

286

287

def register_suffix(self, suffix):

288

"""Register a suffix as being expected in this store."""

289

self._check_fileid(suffix)

290

if suffix == 'gz':

291

raise ValueError('You cannot register the "gz" suffix.')

292

self._suffixes.add(suffix)

172

return len(os.listdir(self._basedir))

173

174

def __getitem__(self, fileid):

175

"""Returns a file reading from a particular entry."""

176

p = self._path(fileid)

177

try:

178

return gzip.GzipFile(p + '.gz', 'rb')

179

except IOError, e:

180

if e.errno == errno.ENOENT:

181

return file(p, 'rb')

182

else:

183

raise e

293

184

294

185

def total_size(self):

295

186

"""Return (count, bytes)

298

189

the content."""

299

190

total = 0

300

191

count = 0

301

for relpath in self._transport.iter_files_recursive():

192

for fid in self:

302

193

count += 1

303

total += self._transport.stat(relpath).st_size

194

p = self._path(fid)

195

try:

196

total += os.stat(p)[ST_SIZE]

197

except OSError:

198

total += os.stat(p + '.gz')[ST_SIZE]

304

199

305

200

return count, total

306

201

307

202

308

def ImmutableMemoryStore():

309

return bzrlib.store.text.TextStore(transport.memory.MemoryTransport())

310

311

312

def copy_all(store_from, store_to):

313

"""Copy all ids from one store to another."""

314

# TODO: Optional progress indicator

315

if not store_from.listable():

316

raise UnlistableStore(store_from)

317

ids = [f for f in store_from]

318

mutter('copy_all ids: %r', ids)

319

store_to.copy_multi(store_from, ids)

320

321

def hash_prefix(fileid):

322

return "%02x/" % (adler32(fileid) & 0xff)

323

203

204

205

class ImmutableScratchStore(ImmutableStore):

206

"""Self-destructing test subclass of ImmutableStore.

207

208

The Store only exists for the lifetime of the Python object.

209

Obviously you should not put anything precious in it.

210

"""

211

def __init__(self):

212

ImmutableStore.__init__(self, tempfile.mkdtemp())

213

214

def __del__(self):

215

for f in os.listdir(self._basedir):

216

fpath = os.path.join(self._basedir, f)

217

# needed on windows, and maybe some other filesystems

218

os.chmod(fpath, 0600)

219

os.remove(fpath)

220

os.rmdir(self._basedir)

221

mutter("%r destroyed" % self)

Older »