~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/tree.py

Committer: Martin Pool
Date: 2005-07-01 02:36:27 UTC
mto: This revision was merged to the branch mainline in revision 852.
Revision ID: mbp@sourcefrog.net-20050701023627-d8422b67a4c1d6d1

Show profile when converting inventory too.

files added:
.bzrignore

testsweet.py

files removed:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

README

TODO

build-api

bzr-man.py

bzrlib

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/revision.py

bzrlib/selftest

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/ui.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weavestore.py

bzrlib/workingtree.py

bzrlib/xml.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

setup.py

testbzr

testsweet.py

tools

tools/history2revfiles.py

tools/history2weaves.py

tools/http_client.py

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files renamed:
tools/convertfile.py => convertfile.py

tools/convertinv.py => convertinv.py

bzrlib/selftest/test_weave.py => testweave.py

bzrlib/weave.py => weave.py

bzrlib/weavefile.py => weavefile.py

Show diffs side-by-side

added added

removed removed

bzrlib/tree.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Tree classes, representing directory at point in time.

"""

import os

from cStringIO import StringIO

import bzrlib

from bzrlib.trace import mutter, note

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.inventory import Inventory

from bzrlib.osutils import pumpfile, appendpath, fingerprint_file

exporters = {}

class Tree(object):
    """Abstract file tree.

    There are several subclasses:

    * `WorkingTree` exists as files on disk editable by the user.

    * `RevisionTree` is a tree as recorded at some point in the past.

    * `EmptyTree`

    Trees contain an `Inventory` object, and also know how to retrieve
    file texts mentioned in the inventory, either from a working
    directory or from a store.

    It is possible for trees to contain files that are not described
    in their inventory or vice versa; for this use `filenames()`.

    Trees can be compared, etc, regardless of whether they are working
    trees or versioned trees.

    This base class reads `self._inventory` and calls `self.get_file()`
    and `self.get_file_text()` without defining any of them; concrete
    subclasses have to supply those.
    """

    def has_filename(self, filename):
        """True if the tree has given filename."""
        raise NotImplementedError()

    def has_id(self, file_id):
        """Return whatever the inventory's `has_id(file_id)` reports."""
        return self.inventory.has_id(file_id)

    # `file_id in tree` is answered by has_id().
    __contains__ = has_id

    def __iter__(self):
        """Iterate over the tree's inventory."""
        return iter(self.inventory)

    def id2path(self, file_id):
        """Delegate to the inventory's `id2path(file_id)`."""
        return self.inventory.id2path(file_id)

    def _get_inventory(self):
        return self._inventory

    def get_file_by_path(self, path):
        """Look `path` up in the inventory and return `get_file()` for its id."""
        return self.get_file(self._inventory.path2id(path))

    inventory = property(_get_inventory,
                         doc="Inventory of this Tree")

    def _check_retrieved(self, ie, f):
        """Check the file object `f` against inventory entry `ie`.

        `f` is fingerprinted and then rewound to offset 0.  The size is
        compared only when the entry records one; the SHA-1 is always
        compared.

        :raises BzrError: if the size or the SHA-1 does not match.
        """
        fp = fingerprint_file(f)
        f.seek(0)

        # NOTE(review): the messages below read `self._store`, which none of
        # the classes visible in this file assign (RevisionTree sets
        # `_weave_store`) -- confirm that users of this check provide it.
        if ie.text_size is not None:
            if ie.text_size != fp['size']:
                raise BzrError("mismatched size for file %r in %r" % (ie.file_id, self._store),
                        ["inventory expects %d bytes" % ie.text_size,
                         "file is actually %d bytes" % fp['size'],
                         "store is probably damaged/corrupt"])

        if ie.text_sha1 != fp['sha1']:
            raise BzrError("wrong SHA-1 for file %r in %r" % (ie.file_id, self._store),
                    ["inventory expects %s" % ie.text_sha1,
                     "file is actually %s" % fp['sha1'],
                     "store is probably damaged/corrupt"])

    def print_file(self, file_id):
        """Print file with id `file_id` to stdout."""
        import sys
        sys.stdout.write(self.get_file_text(file_id))

    def export(self, dest, format='dir', root=None):
        """Export this tree.

        The exporter is looked up by `format` in the module-level
        `exporters` table and called as `exporter(self, dest, root)`.

        :raises BzrCommandError: if no exporter is registered for `format`.
        """
        try:
            exporter = exporters[format]
        except KeyError:
            from bzrlib.errors import BzrCommandError
            raise BzrCommandError("export format %r not supported" % format)
        exporter(self, dest, root)

110

111

112

113

class RevisionTree(Tree):
    """Tree viewing a previous revision.

    File texts are fetched from the weave store given to the constructor.

    TODO: Some kind of `__repr__` method, but a good one
    probably means knowing the branch and revision number,
    or at least passing a description to the constructor.
    """

    def __init__(self, weave_store, inv, revision_id):
        self._revision_id = revision_id
        self._inventory = inv
        self._weave_store = weave_store

    def get_weave(self, file_id):
        """Return the weave the store holds for `file_id`."""
        store = self._weave_store
        return store.get_weave(file_id)

    def get_file_text(self, file_id):
        """Return the text recorded for `file_id` in this revision.

        :raises BzrCheckError: if the text's length differs from the
            size recorded in the inventory entry.
        """
        entry = self._inventory[file_id]
        w = self.get_weave(file_id)
        text = w.get_text(w.lookup(entry.text_version))
        if len(text) == entry.text_size:
            return text
        raise BzrCheckError('mismatched size on revision %s of file %s: '
                            '%d vs %d bytes'
                            % (self._revision_id, file_id, len(text),
                               entry.text_size))

    def get_file(self, file_id):
        """Return the file's text wrapped in a `StringIO`."""
        text = self.get_file_text(file_id)
        return StringIO(text)

    def get_file_size(self, file_id):
        """Return the size recorded in the inventory entry."""
        entry = self._inventory[file_id]
        return entry.text_size

    def get_file_sha1(self, file_id):
        """Return the recorded SHA-1 for a file entry, None for other kinds."""
        entry = self._inventory[file_id]
        if entry.kind != "file":
            return None
        return entry.text_sha1

    def has_filename(self, filename):
        """True when the inventory maps `filename` to a (truthy) file id."""
        found_id = self.inventory.path2id(filename)
        return bool(found_id)

    def list_files(self):
        """Yield `(path, 'V', kind, file_id)` for every inventory entry."""
        # Only versioned files are reported, hence the constant 'V'.
        for relpath, entry in self.inventory.iter_entries():
            yield relpath, 'V', entry.kind, entry.file_id

162

163

164

class EmptyTree(Tree):
    """Tree backed by a freshly constructed `Inventory`; it lists no files."""

    def __init__(self):
        self._inventory = Inventory()

    def has_filename(self, filename):
        """No filename is ever present."""
        return False

    def list_files(self):
        """Generator that yields nothing."""
        return
        yield None  # never reached; its presence makes this a generator

    def __contains__(self, file_id):
        inv = self._inventory
        return file_id in inv

    def get_file_sha1(self, file_id):
        """Return None; the entry is asserted to be the root directory."""
        entry_kind = self._inventory[file_id].kind
        assert entry_kind == "root_directory"
        return None

181

182

183

184

185

######################################################################

186

# diff

187

188

# TODO: Merge these two functions into a single one that can operate

189

# on either a whole tree or a set of files.

190

191

# TODO: Return the diff in order by filename, not by category or in

192

# random order. Can probably be done by lock-stepping through the

193

# filenames from both trees.

194

195

196

def file_status(filename, old_tree, new_tree):
    """Return single-letter status, old and new names for a file.

    The complexity here is in deciding how to represent renames;
    many complex cases are possible.

    Results produced by the code below:

    * ``('I', None, None)`` -- versioned in neither tree, ignored by
      `new_tree`.
    * ``('?', None, None)`` -- versioned in neither tree, not ignored.
    * ``('X', old_path, new_path)`` -- the name is gone from the new
      inventory but the id that used to own it is still there.
    * ``('D', old_path, None)`` -- the name is gone and so is that id.

    NOTE(review): when the name exists in the new inventory the function
    returns a bare string (``'A'``, ``'D'`` or ``'wtf?'``) instead of a
    3-tuple.  That looks unfinished, but it is kept as-is because
    callers may depend on it.
    """
    old_inv = old_tree.inventory
    new_inv = new_tree.inventory
    new_id = new_inv.path2id(filename)
    old_id = old_inv.path2id(filename)

    if not (new_id or old_id):
        # easy: doesn't exist in either; not versioned at all
        if new_tree.is_ignored(filename):
            return 'I', None, None
        return '?', None, None

    if not new_id:
        # There is no longer a file of this name, but we can describe
        # what happened to the file that used to have this name: it was
        # either renamed or deleted entirely.
        assert old_id
        if new_inv.has_id(old_id):
            return 'X', old_inv.id2path(old_id), new_inv.id2path(old_id)
        return 'D', old_inv.id2path(old_id), None

    # From here on there is a file of this name in the new inventory.

    # if the file_id is new in this revision, it is added
    if not old_inv.has_id(new_id):
        return 'A'

    # if there used to be a file of this name, but that ID has now
    # disappeared, it is deleted
    if old_id and not new_inv.has_id(old_id):
        return 'D'

    return 'wtf?'

237

238

239

240

def find_renames(old_inv, new_inv):
    """Yield `(old_path, new_path)` for ids whose path differs.

    Ids are taken from iterating `old_inv`; ids that are not in
    `new_inv` are skipped.
    """
    for fid in old_inv:
        if fid in new_inv:
            before = old_inv.id2path(fid)
            after = new_inv.id2path(fid)
            if before != after:
                yield (before, after)

248

249

250

251

######################################################################

252

# export

253

254

def dir_exporter(tree, dest, root):
    """Export this tree to a new directory.

    `dest` should not exist, and will be created holding the
    contents of this tree.

    :param tree: tree to export; its `inventory` is walked with
        `iter_entries()` and file contents come from `tree.get_file()`.
    :param dest: path of the directory to create.
    :param root: not used by this exporter; it is part of the call
        signature `Tree.export` uses for every exporter.
    :raises BzrError: for an inventory entry that is neither a
        directory nor a file.

    TODO: To handle subdirectories we need to create the
    directories first.

    :note: If the export fails, the destination directory will be
    left in a half-assed state.
    """
    import os
    os.mkdir(dest)
    mutter('export version %r' % tree)
    inv = tree.inventory
    for dp, ie in inv.iter_entries():
        kind = ie.kind
        fullpath = appendpath(dest, dp)
        if kind == 'directory':
            os.mkdir(fullpath)
        elif kind == 'file':
            # Fetch the source first so a failed lookup does not leave an
            # empty file behind, then make sure the output handle is
            # closed even if the copy fails.
            source = tree.get_file(ie.file_id)
            outfile = open(fullpath, 'wb')
            try:
                pumpfile(source, outfile)
            finally:
                outfile.close()
        else:
            raise BzrError("don't know how to export {%s} of kind %r" % (ie.file_id, kind))
        mutter("  export {%s} kind %s to %s" % (ie.file_id, kind, fullpath))
exporters['dir'] = dir_exporter

281

282

try:

283

import tarfile

284

except ImportError:

285

pass

286

else:

287

def get_root_name(dest):
    """Get just the root name for a tarball.

    The directory part of `dest` is dropped, then the first matching
    tarball suffix is stripped.  A name with none of the known suffixes
    is returned unchanged (minus its directory part), so the result is
    always a string.

    >>> get_root_name('mytar.tar')
    'mytar'
    >>> get_root_name('mytar.tar.bz2')
    'mytar'
    >>> get_root_name('tar.tar.tar.tgz')
    'tar.tar.tar'
    >>> get_root_name('bzr-0.0.5.tar.gz')
    'bzr-0.0.5'
    >>> get_root_name('a/long/path/mytar.tgz')
    'mytar'
    >>> get_root_name('../parent/../dir/other.tbz2')
    'other'
    >>> get_root_name('archive.zip')
    'archive.zip'
    """
    endings = ['.tar', '.tar.gz', '.tgz', '.tar.bz2', '.tbz2']
    dest = os.path.basename(dest)
    for end in endings:
        if dest.endswith(end):
            return dest[:-len(end)]
    # No recognised suffix: fall back to the bare file name instead of
    # implicitly returning None, which tar_exporter would go on to pass
    # to os.path.join().
    return dest

308

309

def tar_exporter(tree, dest, root, compression=None):
    """Export this tree to a new tar file.

    `dest` will be created holding the contents of this tree; if it
    already exists, it will be clobbered, like with "tar -c".

    :param tree: tree to export; its `inventory` is walked with
        `iter_entries()` and file contents come from `tree.get_file()`.
    :param dest: path of the tar file to write.
    :param root: directory name every member is placed under; when None
        it is derived from `dest` with `get_root_name()`.
    :param compression: suffix for the tarfile write mode ('gz', 'bz2');
        None or '' opens the archive with plain 'w:'.
    :raises BzrError: if tarfile reports a CompressionError when opening
        `dest`, or for an inventory entry that is neither a directory
        nor a file.
    """
    import sys
    from time import time
    now = time()
    compression = str(compression or '')
    if root is None:
        root = get_root_name(dest)
    try:
        ball = tarfile.open(dest, 'w:' + compression)
    except tarfile.CompressionError:
        # sys.exc_info() fetches the active exception without relying on
        # version-specific `except ... , e` / `as e` syntax.
        raise BzrError(str(sys.exc_info()[1]))
    # Permission bits, written via int(..., 8) so the octal values parse
    # the same on every Python version.
    dir_mode = int('755', 8)   # rwxr-xr-x
    file_mode = int('644', 8)  # rw-r--r--
    try:
        mutter('export version %r' % tree)
        inv = tree.inventory
        for dp, ie in inv.iter_entries():
            mutter("  export {%s} kind %s to %s" % (ie.file_id, ie.kind, dest))
            item = tarfile.TarInfo(os.path.join(root, dp))
            # TODO: would be cool to actually set it to the timestamp of the
            # revision it was last changed
            item.mtime = now
            if ie.kind == 'directory':
                item.type = tarfile.DIRTYPE
                fileobj = None
                item.name += '/'
                item.size = 0
                item.mode = dir_mode
            elif ie.kind == 'file':
                item.type = tarfile.REGTYPE
                fileobj = tree.get_file(ie.file_id)
                item.size = _find_file_size(fileobj)
                item.mode = file_mode
            else:
                raise BzrError("don't know how to export {%s} of kind %r" %
                               (ie.file_id, ie.kind))

            ball.addfile(item, fileobj)
    finally:
        # Release the archive handle even when an entry fails part-way.
        ball.close()
exporters['tar'] = tar_exporter

350

351

def tgz_exporter(tree, dest, root):
    """Export `tree` through `tar_exporter` with 'gz' compression."""
    tar_exporter(tree, dest, root, 'gz')
exporters['tgz'] = tgz_exporter

354

355

def tbz_exporter(tree, dest, root):
    """Export `tree` through `tar_exporter` with 'bz2' compression."""
    tar_exporter(tree, dest, root, 'bz2')
exporters['tbz2'] = tbz_exporter

358

359

360

def _find_file_size(fileobj):

361

offset = fileobj.tell()

362

try:

363

fileobj.seek(0, 2)

364

size = fileobj.tell()

365

except TypeError:

366

# gzip doesn't accept second argument to seek()

367

fileobj.seek(0)

368

size = 0

369

while True:

370

nread = len(fileobj.read())

371

if nread == 0:

372

break

373

size += nread

374

fileobj.seek(offset)

375

return size

Older »