~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/branch.py

Committer: Robert Collins
Date: 2005-10-17 08:15:09 UTC
mto: This revision was merged to the branch mainline in revision 1459.
Revision ID: robertc@lifelesslap.robertcollins.net-20051017081509-f108fef422640aba

gpg signing of content

files added:
.rsyncexclude

HACKING

Makefile

NEWS

NEWS.developers

TODO

bzr-man.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/clone.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revfile.py

bzrlib/revisionspec.py

bzrlib/selftest

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_conflicts.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_revision_info.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_upgrade.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testannotate.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testconfig.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testgpg.py

bzrlib/selftest/testgraph.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testidentitymap.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/testrevprops.py

bzrlib/selftest/testsampler.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/testtestament.py

bzrlib/selftest/testtransactions.py

bzrlib/selftest/testtransport.py

bzrlib/selftest/testworkingtree.py

bzrlib/selftest/treeshape.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store

bzrlib/store/compressed_text.py

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/testament.py

bzrlib/textinv.py

bzrlib/transactions.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/ui.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/newinventory.py

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/ignore.txt

doc/quotes.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/split-join-files.txt

doc/switch-in-branch.txt

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/revfile.txt

notes/schemas.xml

patches

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

tools

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
bzrlib/tests.py

doc/faq.txt

doc/quickref.txt

doc/roadmap.txt

doc/testing.txt

doc/work-order.txt

files renamed:
bzrlib/store.py => bzrlib/store/__init__.py

files modified:
.bzrignore

README

build-api

bzr *

bzrlib/__init__.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/inventory.py

bzrlib/osutils.py

bzrlib/revision.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/xml.py

doc/Makefile

doc/bitkeeper.txt

doc/darcs.txt

doc/formats.txt

doc/index.txt

doc/interrupted.txt

doc/merge.txt

doc/purpose.txt

doc/python.txt

doc/random.txt

doc/svk.txt

doc/tagging.txt

doc/thanks.txt

doc/todo-from-arch.txt

notes/performance.txt

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/branch.py

#! /usr/bin/env python

# -*- coding: UTF-8 -*-

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

from sets import Set

import sys

import os

import errno

from warnings import warn

from cStringIO import StringIO

import sys, os, os.path, random, time, sha, sets, types, re, shutil, tempfile

import traceback, socket, fnmatch, difflib, time

from binascii import hexlify

import bzrlib

from inventory import Inventory

from trace import mutter, note

from tree import Tree, EmptyTree, RevisionTree, WorkingTree

from inventory import InventoryEntry, Inventory

from osutils import isdir, quotefn, isfile, uuid, sha_file, username, chomp, \

format_date, compact_date, pumpfile, user_email, rand_bytes, splitpath, \

joinpath, sha_string, file_kind, local_time_offset

from store import ImmutableStore

from revision import Revision

from errors import bailout

from textui import show_status

from diff import diff_trees

BZR_BRANCH_FORMAT = "Bazaar-NG branch, format 0.0.4\n"

from bzrlib.inventory import InventoryEntry

import bzrlib.inventory as inventory

from bzrlib.trace import mutter, note

from bzrlib.osutils import (isdir, quotefn, compact_date, rand_bytes,

rename, splitpath, sha_file, appendpath,

file_kind)

import bzrlib.errors as errors

from bzrlib.errors import (BzrError, InvalidRevisionNumber, InvalidRevisionId,

NoSuchRevision, HistoryMissing, NotBranchError,

DivergedBranches, LockError, UnlistableStore,

UnlistableBranch, NoSuchFile)

from bzrlib.textui import show_status

from bzrlib.revision import Revision

from bzrlib.delta import compare_trees

from bzrlib.tree import EmptyTree, RevisionTree

from bzrlib.inventory import Inventory

from bzrlib.store import copy_all

from bzrlib.store.compressed_text import CompressedTextStore

from bzrlib.store.text import TextStore

from bzrlib.store.weave import WeaveStore

import bzrlib.transactions as transactions

from bzrlib.transport import Transport, get_transport

import bzrlib.xml5

import bzrlib.ui

BZR_BRANCH_FORMAT_4 = "Bazaar-NG branch, format 0.0.4\n"

BZR_BRANCH_FORMAT_5 = "Bazaar-NG branch, format 5\n"

BZR_BRANCH_FORMAT_6 = "Bazaar-NG branch, format 6\n"

## TODO: Maybe include checks for common corruption of newlines, etc?

# TODO: Some operations like log might retrieve the same revisions

# repeatedly to calculate deltas. We could perhaps have a weakref

# cache in memory to make this faster. In general anything can be

# cached in memory between lock and unlock operations.

def find_branch(*ignored, **ignored_too):

# XXX: leave this here for about one release, then remove it

raise NotImplementedError('find_branch() is not supported anymore, '

'please use one of the new branch constructors')

######################################################################

# branch objects

class Branch:

class Branch(object):

"""Branch holding a history of revisions.

:todo: Perhaps use different stores for different classes of object,

so that we can keep track of how much space each one uses,

or garbage-collect them.

:todo: Add a RemoteBranch subclass. For the basic case of read-only

HTTP access this should be very easy by,

just redirecting controlfile access into HTTP requests.

We would need a RemoteStore working similarly.

:todo: Keep the on-disk branch locked while the object exists.

:todo: mkdir() method.

"""

def __init__(self, base, init=False):

base

Base directory/url of the branch.

"""

base = None

def __init__(self, *ignored, **ignored_too):

raise NotImplementedError('The Branch class is abstract')

@staticmethod

def open_downlevel(base):

"""Open a branch which may be of an old format.

Only local branches are supported."""

return _Branch(get_transport(base), relax_version_check=True)

@staticmethod

def open(base):

"""Open an existing branch, rooted at 'base' (url)"""

t = get_transport(base)

mutter("trying to open %r with transport %r", base, t)

return _Branch(t)

@staticmethod

def open_containing(url):

"""Open an existing branch which contains url.

100

This probes for a branch at url, and searches upwards from there.

101

102

Basically we keep looking up until we find the control directory or

103

run into the root. If there isn't one, raises NotBranchError.

104

"""

105

t = get_transport(url)

106

while True:

107

try:

108

return _Branch(t)

109

except NotBranchError:

110

pass

111

new_t = t.clone('..')

112

if new_t.base == t.base:

113

# reached the root, whatever that may be

114

raise NotBranchError('%s is not in a branch' % url)

115

t = new_t

116

117

@staticmethod

118

def initialize(base):

119

"""Create a new branch, rooted at 'base' (url)"""

120

t = get_transport(base)

121

return _Branch(t, init=True)

122

123

def setup_caching(self, cache_root):

124

"""Subclasses that care about caching should override this, and set

125

up cached stores located under cache_root.

126

"""

127

self.cache_root = cache_root

128

129

130

class _Branch(Branch):

131

"""A branch stored in the actual filesystem.

132

133

Note that it's "local" in the context of the filesystem; it doesn't

134

really matter if it's on an nfs/smb/afs/coda/... share, as long as

135

it's writable, and can be accessed via the normal filesystem API.

136

137

_lock_mode

138

None, or 'r' or 'w'

139

140

_lock_count

141

If _lock_mode is true, a positive count of the number of times the

142

lock has been taken.

143

144

_lock

145

Lock object from bzrlib.lock.

146

"""

147

# We actually expect this class to be somewhat short-lived; part of its

148

# purpose is to try to isolate what bits of the branch logic are tied to

149

# filesystem access, so that in a later step, we can extricate them to

150

# a separate ("storage") class.

151

_lock_mode = None

152

_lock_count = None

153

_lock = None

154

_inventory_weave = None

155

156

# Map some sort of prefix into a namespace

157

# stuff like "revno:10", "revid:", etc.

158

# This should match a prefix with a function which accepts

159

REVISION_NAMESPACES = {}

160

161

def push_stores(self, branch_to):

162

"""Copy the content of this branch's stores to branch_to."""

163

if (self._branch_format != branch_to._branch_format

164

or self._branch_format != 4):

165

from bzrlib.fetch import greedy_fetch

166

mutter("falling back to fetch logic to push between %s(%s) and %s(%s)",

167

self, self._branch_format, branch_to, branch_to._branch_format)

168

greedy_fetch(to_branch=branch_to, from_branch=self,

169

revision=self.last_revision())

170

return

171

172

store_pairs = ((self.text_store, branch_to.text_store),

173

(self.inventory_store, branch_to.inventory_store),

174

(self.revision_store, branch_to.revision_store))

175

try:

176

for from_store, to_store in store_pairs:

177

copy_all(from_store, to_store)

178

except UnlistableStore:

179

raise UnlistableBranch(from_store)

180

181

def __init__(self, transport, init=False,

182

relax_version_check=False):

183

"""Create new branch object at a particular location.

184

:param base: Base directory for the branch.

:param init: If True, create new control files in a previously

185

transport -- A Transport object, defining how to access files.

186

(If a string, transport.transport() will be used to

187

create a Transport object)

188

189

init -- If True, create new control files in a previously

190

unversioned directory. If False, the branch must already

191

be versioned.

192

193

relax_version_check -- If true, the usual check for the branch

194

version is not applied. This is intended only for

195

upgrade/recovery type use; it's not guaranteed that

196

all operations will work on old format branches.

197

198

In the test suite, creation of new trees is tested using the

199

`ScratchBranch` class.

200

"""

self.base = os.path.realpath(base)

201

assert isinstance(transport, Transport), \

202

"%r is not a Transport" % transport

203

self._transport = transport

204

if init:

205

self._make_control()

else:

if not isdir(self.controlfilename('.')):

bailout("not a bzr branch: %s" % quotefn(base),

['use "bzr init" to initialize a new working tree',

'current bzr can only operate from top-of-tree'])

self._check_format()

self.text_store = ImmutableStore(self.controlfilename('text-store'))

self.revision_store = ImmutableStore(self.controlfilename('revision-store'))

self.inventory_store = ImmutableStore(self.controlfilename('inventory-store'))

206

self._check_format(relax_version_check)

207

208

def get_store(name, compressed=True, prefixed=False):

209

# FIXME: This approach of assuming stores are all entirely compressed

210

# or entirely uncompressed is tidy, but breaks upgrade from

211

# some existing branches where there's a mixture; we probably

212

# still want the option to look for both.

213

relpath = self._rel_controlfilename(name)

214

if compressed:

215

store = CompressedTextStore(self._transport.clone(relpath),

216

prefixed=prefixed)

217

else:

218

store = TextStore(self._transport.clone(relpath),

219

prefixed=prefixed)

220

#if self._transport.should_cache():

221

# cache_path = os.path.join(self.cache_root, name)

222

# os.mkdir(cache_path)

223

# store = bzrlib.store.CachedStore(store, cache_path)

224

return store

225

def get_weave(name, prefixed=False):

226

relpath = self._rel_controlfilename(name)

227

ws = WeaveStore(self._transport.clone(relpath), prefixed=prefixed)

228

if self._transport.should_cache():

229

ws.enable_cache = True

230

return ws

231

232

if self._branch_format == 4:

233

self.inventory_store = get_store('inventory-store')

234

self.text_store = get_store('text-store')

235

self.revision_store = get_store('revision-store')

236

elif self._branch_format == 5:

237

self.control_weaves = get_weave([])

238

self.weave_store = get_weave('weaves')

239

self.revision_store = get_store('revision-store', compressed=False)

240

elif self._branch_format == 6:

241

self.control_weaves = get_weave([])

242

self.weave_store = get_weave('weaves', prefixed=True)

243

self.revision_store = get_store('revision-store', compressed=False,

244

prefixed=True)

245

self._transaction = None

246

247

def __str__(self):

return '%s(%r)' % (self.__class__.__name__, self.base)

248

return '%s(%r)' % (self.__class__.__name__, self._transport.base)

249

250

251

__repr__ = __str__

252

253

def _rel(self, name):

100

"""Return filename relative to branch top"""

101

return os.path.join(self.base, name)

254

def __del__(self):

255

if self._lock_mode or self._lock:

256

# XXX: This should show something every time, and be suitable for

257

# headless operation and embedding

258

warn("branch %r was not explicitly unlocked" % self)

259

self._lock.unlock()

260

261

# TODO: It might be best to do this somewhere else,

262

# but it is nice for a Branch object to automatically

263

# cache its information.

264

# Alternatively, we could have the Transport objects cache requests

265

# See the earlier discussion about how major objects (like Branch)

266

# should never expect their __del__ function to run.

267

if hasattr(self, 'cache_root') and self.cache_root is not None:

268

try:

269

import shutil

270

shutil.rmtree(self.cache_root)

271

except:

272

pass

273

self.cache_root = None

274

275

def _get_base(self):

276

if self._transport:

277

return self._transport.base

278

return None

279

280

base = property(_get_base, doc="The URL for the root of this branch.")

281

282

def _finish_transaction(self):

283

"""Exit the current transaction."""

284

if self._transaction is None:

285

raise errors.LockError('Branch %s is not in a transaction' %

286

self)

287

transaction = self._transaction

288

self._transaction = None

289

transaction.finish()

290

291

def get_transaction(self):

292

"""Return the current active transaction.

293

294

If no transaction is active, this returns a passthrough object

295

for which all data is immediately flushed and no caching happens.

296

"""

297

if self._transaction is None:

298

return transactions.PassThroughTransaction()

299

else:

300

return self._transaction

301

302

def _set_transaction(self, new_transaction):

303

"""Set a new active transaction."""

304

if self._transaction is not None:

305

raise errors.LockError('Branch %s is in a transaction already.' %

306

self)

307

self._transaction = new_transaction

308

309

def lock_write(self):

310

mutter("lock write: %s (%s)", self, self._lock_count)

311

# TODO: Upgrade locking to support using a Transport,

312

# and potentially a remote locking protocol

313

if self._lock_mode:

314

if self._lock_mode != 'w':

315

raise LockError("can't upgrade to a write lock from %r" %

316

self._lock_mode)

317

self._lock_count += 1

318

else:

319

self._lock = self._transport.lock_write(

320

self._rel_controlfilename('branch-lock'))

321

self._lock_mode = 'w'

322

self._lock_count = 1

323

self._set_transaction(transactions.PassThroughTransaction())

324

325

def lock_read(self):

326

mutter("lock read: %s (%s)", self, self._lock_count)

327

if self._lock_mode:

328

assert self._lock_mode in ('r', 'w'), \

329

"invalid lock mode %r" % self._lock_mode

330

self._lock_count += 1

331

else:

332

self._lock = self._transport.lock_read(

333

self._rel_controlfilename('branch-lock'))

334

self._lock_mode = 'r'

335

self._lock_count = 1

336

self._set_transaction(transactions.ReadOnlyTransaction())

337

# 5K may be excessive, but hey, it's a knob.

338

self.get_transaction().set_cache_size(5000)

339

340

def unlock(self):

341

mutter("unlock: %s (%s)", self, self._lock_count)

342

if not self._lock_mode:

343

raise LockError('branch %r is not locked' % (self))

344

345

if self._lock_count > 1:

346

self._lock_count -= 1

347

else:

348

self._finish_transaction()

349

self._lock.unlock()

350

self._lock = None

351

self._lock_mode = self._lock_count = None

352

353

def abspath(self, name):

354

"""Return absolute filename for something in the branch

102

355

356

XXX: Robert Collins 20051017 what is this used for? why is it a branch

357

method and not a tree method.

358

"""

359

return self._transport.abspath(name)

360

361

def _rel_controlfilename(self, file_or_path):

362

if isinstance(file_or_path, basestring):

363

file_or_path = [file_or_path]

364

return [bzrlib.BZRDIR] + file_or_path

103

365

104

366

def controlfilename(self, file_or_path):

105

367

"""Return location relative to branch."""

106

if isinstance(file_or_path, types.StringTypes):

107

file_or_path = [file_or_path]

108

return os.path.join(self.base, bzrlib.BZRDIR, *file_or_path)

368

return self._transport.abspath(self._rel_controlfilename(file_or_path))

109

369

110

370

111

371

def controlfile(self, file_or_path, mode='r'):

112

"""Open a control file for this branch"""

113

return file(self.controlfilename(file_or_path), mode)

114

372

"""Open a control file for this branch.

373

374

There are two classes of file in the control directory: text

375

and binary. binary files are untranslated byte streams. Text

376

control files are stored with Unix newlines and in UTF-8, even

377

if the platform or locale defaults are different.

378

379

Controlfiles should almost never be opened in write mode but

380

rather should be atomically copied and replaced using atomicfile.

381

"""

382

import codecs

383

384

relpath = self._rel_controlfilename(file_or_path)

385

#TODO: codecs.open() buffers linewise, so it was overloaded with

386

# a much larger buffer, do we need to do the same for getreader/getwriter?

387

if mode == 'rb':

388

return self._transport.get(relpath)

389

elif mode == 'wb':

390

raise BzrError("Branch.controlfile(mode='wb') is not supported, use put_controlfiles")

391

elif mode == 'r':

392

return codecs.getreader('utf-8')(self._transport.get(relpath), errors='replace')

393

elif mode == 'w':

394

raise BzrError("Branch.controlfile(mode='w') is not supported, use put_controlfiles")

395

else:

396

raise BzrError("invalid controlfile mode %r" % mode)

397

398

def put_controlfile(self, path, f, encode=True):

399

"""Write an entry as a controlfile.

400

401

:param path: The path to put the file, relative to the .bzr control

402

directory

403

:param f: A file-like or string object whose contents should be copied.

404

:param encode: If true, encode the contents as utf-8

405

"""

406

self.put_controlfiles([(path, f)], encode=encode)

407

408

def put_controlfiles(self, files, encode=True):

409

"""Write several entries as controlfiles.

410

411

:param files: A list of [(path, file)] pairs, where the path is the directory

412

underneath the bzr control directory

413

:param encode: If true, encode the contents as utf-8

414

"""

415

import codecs

416

ctrl_files = []

417

for path, f in files:

418

if encode:

419

if isinstance(f, basestring):

420

f = f.encode('utf-8', 'replace')

421

else:

422

f = codecs.getwriter('utf-8')(f, errors='replace')

423

path = self._rel_controlfilename(path)

424

ctrl_files.append((path, f))

425

self._transport.put_multi(ctrl_files)

115

426

116

427

def _make_control(self):

117

os.mkdir(self.controlfilename([]))

118

self.controlfile('README', 'w').write(

428

from bzrlib.inventory import Inventory

429

from bzrlib.weavefile import write_weave_v5

430

from bzrlib.weave import Weave

431

432

# Create an empty inventory

433

sio = StringIO()

434

# if we want per-tree root ids then this is the place to set

435

# them; they're not needed for now and so omitted for

436

# simplicity.

437

bzrlib.xml5.serializer_v5.write_inventory(Inventory(), sio)

438

empty_inv = sio.getvalue()

439

sio = StringIO()

440

bzrlib.weavefile.write_weave_v5(Weave(), sio)

441

empty_weave = sio.getvalue()

442

443

dirs = [[], 'revision-store', 'weaves']

444

files = [('README',

119

445

"This is a Bazaar-NG control directory.\n"

120

"Do not change any files in this directory.")

121

self.controlfile('branch-format', 'w').write(BZR_BRANCH_FORMAT)

122

for d in ('text-store', 'inventory-store', 'revision-store'):

123

os.mkdir(self.controlfilename(d))

124

for f in ('revision-history', 'merged-patches',

125

'pending-merged-patches', 'branch-name'):

126

self.controlfile(f, 'w').write('')

127

mutter('created control directory in ' + self.base)

128

Inventory().write_xml(self.controlfile('inventory','w'))

129

130

131

def _check_format(self):

446

"Do not change any files in this directory.\n"),

447

('branch-format', BZR_BRANCH_FORMAT_6),

448

('revision-history', ''),

449

('branch-name', ''),

450

('branch-lock', ''),

451

('pending-merges', ''),

452

('inventory', empty_inv),

453

('inventory.weave', empty_weave),

454

('ancestry.weave', empty_weave)

455

]

456

cfn = self._rel_controlfilename

457

self._transport.mkdir_multi([cfn(d) for d in dirs])

458

self.put_controlfiles(files)

459

mutter('created control directory in ' + self._transport.base)

460

461

def _check_format(self, relax_version_check):

132

462

"""Check this branch format is supported.

133

463

134

The current tool only supports the current unstable format.

464

The format level is stored, as an integer, in

465

self._branch_format for code that needs to check it later.

135

466

136

467

In the future, we might need different in-memory Branch

137

468

classes to support downlevel branches. But not yet.

138

"""

139

# read in binary mode to detect newline weirdness.

140

fmt = self.controlfile('branch-format', 'rb').read()

141

if fmt != BZR_BRANCH_FORMAT:

142

bailout('sorry, branch format %r not supported' % fmt,

143

['use a different bzr version',

144

'or remove the .bzr directory and "bzr init" again'])

145

469

"""

470

try:

471

fmt = self.controlfile('branch-format', 'r').read()

472

except NoSuchFile:

473

raise NotBranchError(self.base)

474

mutter("got branch format %r", fmt)

475

if fmt == BZR_BRANCH_FORMAT_6:

476

self._branch_format = 6

477

elif fmt == BZR_BRANCH_FORMAT_5:

478

self._branch_format = 5

479

elif fmt == BZR_BRANCH_FORMAT_4:

480

self._branch_format = 4

481

482

if (not relax_version_check

483

and self._branch_format not in (5, 6)):

484

raise errors.UnsupportedFormatError(

485

'sorry, branch format %r not supported' % fmt,

486

['use a different bzr version',

487

'or remove the .bzr directory'

488

' and "bzr init" again'])

489

490

def get_root_id(self):

491

"""Return the id of this branch's root"""

492

inv = self.read_working_inventory()

493

return inv.root.file_id

494

495

def set_root_id(self, file_id):

496

inv = self.read_working_inventory()

497

orig_root_id = inv.root.file_id

498

del inv._byid[inv.root.file_id]

499

inv.root.file_id = file_id

500

inv._byid[inv.root.file_id] = inv.root

501

for fid in inv:

502

entry = inv[fid]

503

if entry.parent_id in (None, orig_root_id):

504

entry.parent_id = inv.root.file_id

505

self._write_inventory(inv)

146

506

147

507

def read_working_inventory(self):

148

508

"""Read the working inventory."""

149

before = time.time()

150

inv = Inventory.read_xml(self.controlfile('inventory', 'r'))

151

mutter("loaded inventory of %d items in %f"

152

% (len(inv), time.time() - before))

153

return inv

154

509

self.lock_read()

510

try:

511

# ElementTree does its own conversion from UTF-8, so open in

512

# binary.

513

f = self.controlfile('inventory', 'rb')

514

return bzrlib.xml5.serializer_v5.read_inventory(f)

515

finally:

516

self.unlock()

517

155

518

156

519

def _write_inventory(self, inv):

157

520

"""Update the working inventory.

159

522

That is to say, the inventory describing changes underway, that

160

523

will be committed to the next revision.

161

524

"""

162

## TODO: factor out to atomicfile? is rename safe on windows?

163

tmpfname = self.controlfilename('inventory.tmp')

164

tmpf = file(tmpfname, 'w')

165

inv.write_xml(tmpf)

166

tmpf.close()

167

os.rename(tmpfname, self.controlfilename('inventory'))

525

from cStringIO import StringIO

526

self.lock_write()

527

try:

528

sio = StringIO()

529

bzrlib.xml5.serializer_v5.write_inventory(inv, sio)

530

sio.seek(0)

531

# Transport handles atomicity

532

self.put_controlfile('inventory', sio)

533

finally:

534

self.unlock()

535

168

536

mutter('wrote working inventory')

169

170

537

171

538

inventory = property(read_working_inventory, _write_inventory, None,

172

539

"""Inventory for the working copy.""")

173

540

174

175

def add(self, files, verbose=False):

541

def add(self, files, ids=None):

176

542

"""Make files versioned.

177

543

544

Note that the command line normally calls smart_add instead,

545

which can automatically recurse.

546

178

547

This puts the files in the Added state, so that they will be

179

548

recorded by the next commit.

180

549

181

:todo: Perhaps have an option to add the ids even if the files do

182

not (yet) exist.

183

184

:todo: Perhaps return the ids of the files? But then again it

185

is easy to retrieve them if they're needed.

186

187

:todo: Option to specify file id.

188

189

:todo: Adding a directory should optionally recurse down and

190

add all non-ignored children. Perhaps do that in a

191

higher-level method.

192

193

>>> b = ScratchBranch(files=['foo'])

194

>>> 'foo' in b.unknowns()

195

True

196

>>> b.show_status()

197

? foo

198

>>> b.add('foo')

199

>>> 'foo' in b.unknowns()

200

False

201

>>> bool(b.inventory.path2id('foo'))

202

True

203

>>> b.show_status()

204

A foo

205

206

>>> b.add('foo')

207

Traceback (most recent call last):

208

...

209

BzrError: ('foo is already versioned', [])

210

211

>>> b.add(['nothere'])

212

Traceback (most recent call last):

213

BzrError: ('cannot add: not a regular file or directory: nothere', [])

550

files

551

List of paths to add, relative to the base of the tree.

552

553

ids

554

If set, use these instead of automatically generated ids.

555

Must be the same length as the list of files, but may

556

contain None for ids that are to be autogenerated.

557

558

TODO: Perhaps have an option to add the ids even if the files do

559

not (yet) exist.

560

561

TODO: Perhaps yield the ids and paths as they're added.

214

562

"""

215

216

563

# TODO: Re-adding a file that is removed in the working copy

217

564

# should probably put it back with the previous ID.

218

if isinstance(files, types.StringTypes):

565

if isinstance(files, basestring):

566

assert(ids is None or isinstance(ids, basestring))

219

567

files = [files]

220

221

inv = self.read_working_inventory()

222

for f in files:

223

if is_control_file(f):

224

bailout("cannot add control file %s" % quotefn(f))

225

226

fp = splitpath(f)

227

228

if len(fp) == 0:

229

bailout("cannot add top-level %r" % f)

230

231

fullpath = os.path.normpath(self._rel(f))

232

233

if isfile(fullpath):

234

kind = 'file'

235

elif isdir(fullpath):

236

kind = 'directory'

237

else:

238

bailout('cannot add: not a regular file or directory: %s' % quotefn(f))

239

240

if len(fp) > 1:

241

parent_name = joinpath(fp[:-1])

242

mutter("lookup parent %r" % parent_name)

243

parent_id = inv.path2id(parent_name)

244

if parent_id == None:

245

bailout("cannot add: parent %r is not versioned"

246

% joinpath(fp[:-1]))

247

else:

248

parent_id = None

249

250

file_id = _gen_file_id(fp[-1])

251

inv.add(InventoryEntry(file_id, fp[-1], kind=kind, parent_id=parent_id))

252

if verbose:

253

show_status('A', kind, quotefn(f))

254

255

mutter("add file %s file_id:{%s} kind=%r parent_id={%s}"

256

% (f, file_id, kind, parent_id))

257

self._write_inventory(inv)

258

568

if ids is not None:

569

ids = [ids]

570

571

if ids is None:

572

ids = [None] * len(files)

573

else:

574

assert(len(ids) == len(files))

575

576

self.lock_write()

577

try:

578

inv = self.read_working_inventory()

579

for f,file_id in zip(files, ids):

580

if is_control_file(f):

581

raise BzrError("cannot add control file %s" % quotefn(f))

582

583

fp = splitpath(f)

584

585

if len(fp) == 0:

586

raise BzrError("cannot add top-level %r" % f)

587

588

fullpath = os.path.normpath(self.abspath(f))

589

590

try:

591

kind = file_kind(fullpath)

592

except OSError:

593

# maybe something better?

594

raise BzrError('cannot add: not a regular file, symlink or directory: %s' % quotefn(f))

595

596

if not InventoryEntry.versionable_kind(kind):

597

raise BzrError('cannot add: not a versionable file ('

598

'i.e. regular file, symlink or directory): %s' % quotefn(f))

599

600

if file_id is None:

601

file_id = gen_file_id(f)

602

inv.add_path(f, kind=kind, file_id=file_id)

603

604

mutter("add file %s file_id:{%s} kind=%r" % (f, file_id, kind))

605

606

self._write_inventory(inv)

607

finally:

608

self.unlock()

609

610

611

def print_file(self, file, revno):
    """Print `file`, as it was in revision number `revno`, to stdout.

    The path is looked up in the inventory of that revision's tree.
    Raises BzrError when the path has no file id in that revision.
    The branch is read-locked while the tree is consulted and is
    always unlocked afterwards.
    """
    self.lock_read()
    try:
        revision_id = self.get_rev_id(revno)
        rev_tree = self.revision_tree(revision_id)
        # use inventory as it was in that revision
        found_id = rev_tree.inventory.path2id(file)
        if found_id:
            rev_tree.print_file(found_id)
        else:
            raise BzrError("%r is not present in revision %s" % (file, revno))
    finally:
        self.unlock()

259

623

260

624

261

625

def remove(self, files, verbose=False):

263

627

264

628

This does not remove their text. This does not run on

265

629

266

:todo: Refuse to remove modified files unless --force is given?

267

268

>>> b = ScratchBranch(files=['foo'])

269

>>> b.add('foo')

270

>>> b.inventory.has_filename('foo')

271

True

272

>>> b.remove('foo')

273

>>> b.working_tree().has_filename('foo')

274

True

275

>>> b.inventory.has_filename('foo')

276

False

277

278

>>> b = ScratchBranch(files=['foo'])

279

>>> b.add('foo')

280

>>> b.commit('one')

281

>>> b.remove('foo')

282

>>> b.commit('two')

283

>>> b.inventory.has_filename('foo')

284

False

285

>>> b.basis_tree().has_filename('foo')

286

False

287

>>> b.working_tree().has_filename('foo')

288

True

289

290

:todo: Do something useful with directories.

291

292

:todo: Should this remove the text or not? Tough call; not

630

TODO: Refuse to remove modified files unless --force is given?

631

632

TODO: Do something useful with directories.

633

634

TODO: Should this remove the text or not? Tough call; not

293

635

removing may be useful and the user can just use rm, and

294

636

is the opposite of add. Removing it is consistent with most

295

637

other tools. Maybe an option.

296

638

"""

297

639

## TODO: Normalize names

298

640

## TODO: Remove nested loops; better scalability

299

300

if isinstance(files, types.StringTypes):

641

if isinstance(files, basestring):

301

642

files = [files]

302

303

tree = self.working_tree()

304

inv = tree.inventory

305

306

# do this before any modifications

307

for f in files:

308

fid = inv.path2id(f)

309

if not fid:

310

bailout("cannot remove unversioned file %s" % quotefn(f))

311

mutter("remove inventory entry %s {%s}" % (quotefn(f), fid))

312

if verbose:

313

# having remove it, it must be either ignored or unknown

314

if tree.is_ignored(f):

315

new_status = 'I'

316

else:

317

new_status = '?'

318

show_status(new_status, inv[fid].kind, quotefn(f))

319

del inv[fid]

320

643

644

self.lock_write()

645

646

try:

647

tree = self.working_tree()

648

inv = tree.inventory

649

650

# do this before any modifications

651

for f in files:

652

fid = inv.path2id(f)

653

if not fid:

654

raise BzrError("cannot remove unversioned file %s" % quotefn(f))

655

mutter("remove inventory entry %s {%s}" % (quotefn(f), fid))

656

if verbose:

657

# having removed it, it must be either ignored or unknown

658

if tree.is_ignored(f):

659

new_status = 'I'

660

else:

661

new_status = '?'

662

show_status(new_status, inv[fid].kind, quotefn(f))

663

del inv[fid]

664

665

self._write_inventory(inv)

666

finally:

667

self.unlock()

668

669

# FIXME: this doesn't need to be a branch method

670

def set_inventory(self, new_inventory_list):
    """Build a fresh inventory from `new_inventory_list` and write it out.

    Each item is a (path, file_id, parent, kind) tuple.  Only the
    basename of `path` is used as the entry name, and items whose
    basename is empty are skipped.  `kind` must be 'directory', 'file'
    or 'symlink'; anything else raises BzrError.
    """
    from bzrlib.inventory import Inventory, InventoryEntry
    new_inv = Inventory(self.get_root_id())
    for path, file_id, parent, kind in new_inventory_list:
        entry_name = os.path.basename(path)
        if entry_name == "":
            continue
        # fixme, there should be a factory function inv,add_??
        if kind == 'directory':
            entry_class = inventory.InventoryDirectory
        elif kind == 'file':
            entry_class = inventory.InventoryFile
        elif kind == 'symlink':
            entry_class = inventory.InventoryLink
        else:
            raise BzrError("unknown kind %r" % kind)
        new_inv.add(entry_class(file_id, entry_name, parent))
    self._write_inventory(new_inv)

322

687

323

324

688

def unknowns(self):

325

689

"""Return all unknown files.

326

690

340

704

return self.working_tree().unknowns()

341

705

342

706

343

def commit(self, message, timestamp=None, timezone=None,

344

committer=None,

345

verbose=False):

346

"""Commit working copy as a new revision.

347

348

The basic approach is to add all the file texts into the

349

store, then the inventory, then make a new revision pointing

350

to that inventory and store that.

351

352

This is not quite safe if the working copy changes during the

353

commit; for the moment that is simply not allowed. A better

354

approach is to make a temporary copy of the files before

355

computing their hashes, and then add those hashes in turn to

356

the inventory. This should mean at least that there are no

357

broken hash pointers. There is no way we can get a snapshot

358

of the whole directory at an instant. This would also have to

359

be robust against files disappearing, moving, etc. So the

360

whole thing is a bit hard.

361

362

:param timestamp: if not None, seconds-since-epoch for a

363

postdated/predated commit.

364

"""

365

366

## TODO: Show branch names

367

368

# TODO: Don't commit if there are no changes, unless forced?

369

370

# First walk over the working inventory; and both update that

371

# and also build a new revision inventory. The revision

372

# inventory needs to hold the text-id, sha1 and size of the

373

# actual file versions committed in the revision. (These are

374

# not present in the working inventory.) We also need to

375

# detect missing/deleted files, and remove them from the

376

# working inventory.

377

378

work_inv = self.read_working_inventory()

379

inv = Inventory()

380

basis = self.basis_tree()

381

basis_inv = basis.inventory

382

missing_ids = []

383

for path, entry in work_inv.iter_entries():

384

## TODO: Cope with files that have gone missing.

385

386

## TODO: Check that the file kind has not changed from the previous

387

## revision of this file (if any).

388

389

entry = entry.copy()

390

391

p = self._rel(path)

392

file_id = entry.file_id

393

mutter('commit prep file %s, id %r ' % (p, file_id))

394

395

if not os.path.exists(p):

396

mutter(" file is missing, removing from inventory")

397

if verbose:

398

show_status('D', entry.kind, quotefn(path))

399

missing_ids.append(file_id)

400

continue

401

402

# TODO: Handle files that have been deleted

403

404

# TODO: Maybe a special case for empty files? Seems a

405

# waste to store them many times.

406

407

inv.add(entry)

408

409

if basis_inv.has_id(file_id):

410

old_kind = basis_inv[file_id].kind

411

if old_kind != entry.kind:

412

bailout("entry %r changed kind from %r to %r"

413

% (file_id, old_kind, entry.kind))

414

415

if entry.kind == 'directory':

416

if not isdir(p):

417

bailout("%s is entered as directory but not a directory" % quotefn(p))

418

elif entry.kind == 'file':

419

if not isfile(p):

420

bailout("%s is entered as file but is not a file" % quotefn(p))

421

422

content = file(p, 'rb').read()

423

424

entry.text_sha1 = sha_string(content)

425

entry.text_size = len(content)

426

427

old_ie = basis_inv.has_id(file_id) and basis_inv[file_id]

428

if (old_ie

429

and (old_ie.text_size == entry.text_size)

430

and (old_ie.text_sha1 == entry.text_sha1)):

431

## assert content == basis.get_file(file_id).read()

432

entry.text_id = basis_inv[file_id].text_id

433

mutter(' unchanged from previous text_id {%s}' %

434

entry.text_id)

435

436

else:

437

entry.text_id = _gen_file_id(entry.name)

438

self.text_store.add(content, entry.text_id)

439

mutter(' stored with text_id {%s}' % entry.text_id)

440

if verbose:

441

if not old_ie:

442

state = 'A'

443

elif (old_ie.name == entry.name

444

and old_ie.parent_id == entry.parent_id):

445

state = 'R'

446

else:

447

state = 'M'

448

449

show_status(state, entry.kind, quotefn(path))

450

451

for file_id in missing_ids:

452

# have to do this later so we don't mess up the iterator.

453

# since parents may be removed before their children we

454

# have to test.

455

456

# FIXME: There's probably a better way to do this; perhaps

457

# the workingtree should know how to filter itself.

458

if work_inv.has_id(file_id):

459

del work_inv[file_id]

460

461

462

inv_id = rev_id = _gen_revision_id(time.time())

463

464

inv_tmp = tempfile.TemporaryFile()

465

inv.write_xml(inv_tmp)

466

inv_tmp.seek(0)

467

self.inventory_store.add(inv_tmp, inv_id)

468

mutter('new inventory_id is {%s}' % inv_id)

469

470

self._write_inventory(work_inv)

471

472

if timestamp == None:

473

timestamp = time.time()

474

475

if committer == None:

476

committer = username()

477

478

if timezone == None:

479

timezone = local_time_offset()

480

481

mutter("building commit log message")

482

rev = Revision(timestamp=timestamp,

483

timezone=timezone,

484

committer=committer,

485

precursor = self.last_patch(),

486

message = message,

487

inventory_id=inv_id,

488

revision_id=rev_id)

489

490

rev_tmp = tempfile.TemporaryFile()

491

rev.write_xml(rev_tmp)

492

rev_tmp.seek(0)

493

self.revision_store.add(rev_tmp, rev_id)

494

mutter("new revision_id is {%s}" % rev_id)

495

496

## XXX: Everything up to here can simply be orphaned if we abort

497

## the commit; it will leave junk files behind but that doesn't

498

## matter.

499

500

## TODO: Read back the just-generated changeset, and make sure it

501

## applies and recreates the right state.

502

503

## TODO: Also calculate and store the inventory SHA1

504

mutter("committing patch r%d" % (self.revno() + 1))

505

506

mutter("append to revision-history")

507

self.controlfile('revision-history', 'at').write(rev_id + '\n')

508

509

mutter("done!")

707

def append_revision(self, *revision_ids):
    """Append `revision_ids`, in the order given, to the revision history.

    Each id is logged with mutter() first.  Then, under the write
    lock, the current history is read, extended and written back to the
    'revision-history' control file as newline-joined ids.
    """
    for new_id in revision_ids:
        mutter("add {%s} to revision-history" % new_id)
    self.lock_write()
    try:
        history = self.revision_history()
        history.extend(revision_ids)
        contents = '\n'.join(history)
        self.put_controlfile('revision-history', contents)
    finally:
        self.unlock()

717

718

def has_revision(self, revision_id):
    """Tell whether this branch has a copy of the revision.

    None (the null revision) is always reported as present; any other
    id is looked up in the revision store.

    This does not necessarily imply the revision is merged
    or on the mainline.
    """
    if revision_id is None:
        return True
    return self.revision_store.has_id(revision_id)

725

726

def get_revision_xml_file(self, revision_id):
    """Return the revision store's entry for `revision_id`.

    The value is whatever revision_store.get() returns; callers in this
    class treat it as a readable XML file object.

    Raises InvalidRevisionId when `revision_id` is empty or not a
    string, and NoSuchRevision when the store lookup fails with
    IndexError or KeyError.
    """
    if not (revision_id and isinstance(revision_id, basestring)):
        raise InvalidRevisionId(revision_id)

    self.lock_read()
    try:
        store = self.revision_store
        try:
            return store.get(revision_id)
        except (IndexError, KeyError):
            raise bzrlib.errors.NoSuchRevision(self, revision_id)
    finally:
        self.unlock()

739

740

# NOTE(review): this spot was marked "#deprecated" and used to bind
# get_revision_xml as an alias of get_revision_xml_file.  That binding was
# dead: the def below rebinds the same name straight away, so only the
# definition is kept.
def get_revision_xml(self, revision_id):
    """Return the stored XML for `revision_id`, read fully into memory.

    Delegates to get_revision_xml_file() and returns the result of
    calling read() on what it returns; any exception raised there
    propagates unchanged.
    """
    return self.get_revision_xml_file(revision_id).read()

510

745

511

746

512

747

def get_revision(self, revision_id):

513

748

"""Return the Revision object for a named revision"""

514

r = Revision.read_xml(self.revision_store[revision_id])

749

xml_file = self.get_revision_xml_file(revision_id)

750

751

try:

752

r = bzrlib.xml5.serializer_v5.read_revision(xml_file)

753

except SyntaxError, e:

754

raise bzrlib.errors.BzrError('failed to unpack revision_xml',

755

[revision_id,

756

str(e)])

757

515

758

assert r.revision_id == revision_id

516

759

return r

517

760

518

519

def get_inventory(self, inventory_id):

520

"""Get Inventory object by hash.

521

522

:todo: Perhaps for this and similar methods, take a revision

523

parameter which can be either an integer revno or a

524

string hash."""

525

i = Inventory.read_xml(self.inventory_store[inventory_id])

526

return i

527

761

def get_revision_delta(self, revno):
    """Return the delta introduced by revision number `revno`.

    The comparison is against the mainline predecessor, or against an
    empty tree when `revno` is 1.  Raises InvalidRevisionNumber when
    `revno` is outside 1..len(revision_history()).
    """
    assert isinstance(revno, int)
    history = self.revision_history()
    if revno < 1 or revno > len(history):
        raise InvalidRevisionNumber(revno)

    # revno is 1-based; list is 0-based
    new_tree = self.revision_tree(history[revno-1])
    if revno != 1:
        old_tree = self.revision_tree(history[revno-2])
    else:
        old_tree = EmptyTree()

    return compare_trees(old_tree, new_tree)

781

782

def get_revision_sha1(self, revision_id):
    """Return the hash of the stored form of revision `revision_id`.

    The hash is computed by sha_file() over what
    get_revision_xml_file() returns.
    """
    # In the future, revision entries will be signed. At that
    # point, it is probably best *not* to include the signature
    # in the revision hash. Because that lets you re-sign
    # the revision, (add signatures/remove signatures) and still
    # have all hash pointers stay consistent.
    # But for now, just hash the contents.
    xml_file = self.get_revision_xml_file(revision_id)
    return bzrlib.osutils.sha_file(xml_file)

791

792

def get_ancestry(self, revision_id):
    """Return the revision ids integrated by `revision_id`.

    The result is a list whose first element is always None, followed
    by the names of every weave version the inventory weave reports as
    included by the revision.  The ordering is not guaranteed: treat
    the result as a set.
    """
    if revision_id is None:
        return [None]
    weave = self.get_inventory_weave()
    to_name = weave.idx_to_name
    included = weave.inclusions([weave.lookup(revision_id)])
    return [None] + [to_name(idx) for idx in included]

803

804

def get_inventory_weave(self):
    """Return the 'inventory' weave from control_weaves.

    The weave is fetched under the transaction returned by
    get_transaction().
    """
    fetch_weave = self.control_weaves.get_weave
    return fetch_weave('inventory', self.get_transaction())

807

808

def get_inventory(self, revision_id):
    """Return the Inventory object recorded for `revision_id`.

    The XML is obtained from get_inventory_xml() and parsed with the
    v5 serializer's read_inventory_from_string().
    """
    inventory_xml = self.get_inventory_xml(revision_id)
    serializer = bzrlib.xml5.serializer_v5
    return serializer.read_inventory_from_string(inventory_xml)

812

813

def get_inventory_xml(self, revision_id):
    """Return the inventory XML stored for `revision_id`.

    The value is whatever the inventory weave's get_text() returns for
    the version looked up under `revision_id`.  get_inventory() passes
    it to read_inventory_from_string(), so it is presumably XML text
    rather than a file object.

    Raises HistoryMissing when the weave lookup fails with IndexError.
    """
    try:
        assert isinstance(revision_id, basestring), type(revision_id)
        weave = self.get_inventory_weave()
        version = weave.lookup(revision_id)
        return weave.get_text(version)
    except IndexError:
        raise bzrlib.errors.HistoryMissing(self, 'inventory', revision_id)

821

822

def get_inventory_sha1(self, revision_id):
    """Return the inventory sha1 recorded on revision `revision_id`.

    This is the `inventory_sha1` attribute of the Revision object
    returned by get_revision().
    """
    revision = self.get_revision(revision_id)
    return revision.inventory_sha1

528

826

529

827

def get_revision_inventory(self, revision_id):

530

828

"""Return inventory of a past revision."""

829

# TODO: Unify this with get_inventory()

830

# bzr 0.0.6 and later imposes the constraint that the inventory_id

831

# must be the same as its revision, so this is trivial.

531

832

if revision_id == None:

532

return Inventory()

833

return Inventory(self.get_root_id())

533

834

else:

534

return self.get_inventory(self.get_revision(revision_id).inventory_id)

535

835

return self.get_inventory(revision_id)

536

836

537

837

def revision_history(self):

538

"""Return sequence of revision hashes on to this branch.

838

"""Return sequence of revision hashes on to this branch."""

839

self.lock_read()

840

try:

841

transaction = self.get_transaction()

842

history = transaction.map.find_revision_history()

843

if history is not None:

844

mutter("cache hit for revision-history in %s", self)

845

return list(history)

846

history = [l.rstrip('\r\n') for l in

847

self.controlfile('revision-history', 'r').readlines()]

848

transaction.map.add_revision_history(history)

849

# this call is disabled because revision_history is

850

# not really an object yet, and the transaction is for objects.

851

# transaction.register_clean(history, precious=True)

852

return list(history)

853

finally:

854

self.unlock()

539

855

540

>>> ScratchBranch().revision_history()

541

[]

542

"""

543

return [chomp(l) for l in self.controlfile('revision-history').readlines()]

856

def common_ancestor(self, other, self_revno=None, other_revno=None):
    """Find the latest position at which both histories hold the same id.

    Only the first `self_revno` revisions of this branch and the first
    `other_revno` revisions of `other` are considered; each defaults to
    the full length of the respective history.  Returns a
    (revno, revision_id) pair, or (None, None) if no position matches.

    >>> from bzrlib.commit import commit
    >>> sb = ScratchBranch(files=['foo', 'foo~'])
    >>> sb.common_ancestor(sb) == (None, None)
    True
    >>> commit(sb, "Committing first revision", verbose=False)
    >>> sb.common_ancestor(sb)[0]
    1
    >>> clone = sb.clone()
    >>> commit(sb, "Committing second revision", verbose=False)
    >>> sb.common_ancestor(sb)[0]
    2
    >>> sb.common_ancestor(clone)[0]
    1
    >>> commit(clone, "Committing divergent second revision",
    ...               verbose=False)
    >>> sb.common_ancestor(clone)[0]
    1
    >>> sb.common_ancestor(clone) == clone.common_ancestor(sb)
    True
    >>> sb.common_ancestor(sb) != clone.common_ancestor(clone)
    True
    >>> clone2 = sb.clone()
    >>> sb.common_ancestor(clone2)[0]
    2
    >>> sb.common_ancestor(clone2, self_revno=1)[0]
    1
    >>> sb.common_ancestor(clone2, other_revno=1)[0]
    1
    """
    own_history = self.revision_history()
    their_history = other.revision_history()
    if self_revno is None:
        self_revno = len(own_history)
    if other_revno is None:
        other_revno = len(their_history)
    # Walk the shared index range from the newest position to the oldest.
    newest = min(self_revno, other_revno) - 1
    for idx in range(newest, -1, -1):
        if own_history[idx] == their_history[idx]:
            return idx + 1, own_history[idx]
    return None, None

544

899

545

900

546

901

def revno(self):

548

903

549

904

That is equivalent to the number of revisions committed to

550

905

this branch.

551

552

>>> b = ScratchBranch()

553

>>> b.revno()

554

555

>>> b.commit('no foo')

556

>>> b.revno()

557

558

906

"""

559

907

return len(self.revision_history())

560

908

561

909

562

def last_patch(self):

910

def last_revision(self):

563

911

"""Return last patch hash, or None if no history.

564

565

>>> ScratchBranch().last_patch() == None

566

True

567

912

"""

568

913

ph = self.revision_history()

569

914

if ph:

570

915

return ph[-1]

571

572

573

def lookup_revision(self, revno):

574

"""Return revision hash for revision number."""

916

else:

917

return None

918

919

920

def missing_revisions(self, other, stop_revision=None, diverged_ok=False):
    """Return a list of new revisions that would perfectly fit.

    If self and other have not diverged, return a list of the revisions
    present in other, but missing from self.  `stop_revision`, when
    given, is a revno in `other` at which the list stops; it must be an
    int no larger than other's history length, else NoSuchRevision is
    raised.  `diverged_ok` is accepted but not consulted here.

    >>> from bzrlib.commit import commit
    >>> bzrlib.trace.silent = True
    >>> br1 = ScratchBranch()
    >>> br2 = ScratchBranch()
    >>> br1.missing_revisions(br2)
    []
    >>> commit(br2, "lala!", rev_id="REVISION-ID-1")
    >>> br1.missing_revisions(br2)
    [u'REVISION-ID-1']
    >>> br2.missing_revisions(br1)
    []
    >>> commit(br1, "lala!", rev_id="REVISION-ID-1")
    >>> br1.missing_revisions(br2)
    []
    >>> commit(br2, "lala!", rev_id="REVISION-ID-2A")
    >>> br1.missing_revisions(br2)
    [u'REVISION-ID-2A']
    >>> commit(br1, "lala!", rev_id="REVISION-ID-2B")
    >>> br1.missing_revisions(br2)
    Traceback (most recent call last):
    DivergedBranches: These branches have diverged.
    """
    # FIXME: If the branches have diverged, but the latest
    # revision in this branch is completely merged into the other,
    # then we should still be able to pull.
    mine = self.revision_history()
    mine_len = len(mine)
    theirs = other.revision_history()
    theirs_len = len(theirs)

    # Only the last position both histories have is compared.
    last_shared = min(mine_len, theirs_len) - 1
    if last_shared >= 0 and mine[last_shared] != theirs[last_shared]:
        raise DivergedBranches(self, other)

    if stop_revision is None:
        return theirs[mine_len:theirs_len]

    assert isinstance(stop_revision, int)
    if stop_revision > theirs_len:
        raise bzrlib.errors.NoSuchRevision(self, stop_revision)
    return theirs[mine_len:stop_revision]

967

968

def update_revisions(self, other, stop_revision=None):
    """Pull in new perfect-fit revisions from `other`.

    `stop_revision` is a revision id in `other`; it defaults to
    other.last_revision().  Nothing is done when that revision is
    already in this branch's history.  Otherwise the revision is
    fetched, and any revisions reported by missing_revisions() are
    fetched and appended to this branch's history.
    """
    from bzrlib.fetch import greedy_fetch
    from bzrlib.revision import get_intervening_revisions
    if stop_revision is None:
        stop_revision = other.last_revision()
    if stop_revision is not None:
        if stop_revision in self.revision_history():
            return
    greedy_fetch(to_branch=self, from_branch=other,
                 revision=stop_revision)
    stop_revno = other.revision_id_to_revno(stop_revision)
    pullable_revs = self.missing_revisions(other, stop_revno)
    if not pullable_revs:
        return
    greedy_fetch(to_branch=self,
                 from_branch=other,
                 revision=pullable_revs[-1])
    self.append_revision(*pullable_revs)

986

987

def commit(self, *args, **kw):
    """Commit on this branch by delegating to bzrlib.commit.Commit.

    All positional and keyword arguments are forwarded unchanged after
    the branch itself; nothing is returned.
    """
    from bzrlib.commit import Commit
    committer = Commit()
    committer.commit(self, *args, **kw)

990

991

def revision_id_to_revno(self, revision_id):
    """Given a revision id, return its revno.

    None maps to 0.  Any other id maps to its 1-based position in
    revision_history(); NoSuchRevision is raised if it is not there.
    """
    if revision_id is None:
        return 0
    history = self.revision_history()
    try:
        position = history.index(revision_id)
    except ValueError:
        raise bzrlib.errors.NoSuchRevision(self, revision_id)
    return position + 1

1000

1001

def get_rev_id(self, revno, history=None):

1002

"""Find the revision id of the specified revno."""

575

1003

if revno == 0:

576

1004

return None

577

578

try:

579

# list is 0-based; revisions are 1-based

580

return self.revision_history()[revno-1]

581

except IndexError:

582

bailout("no such revision %s" % revno)

583

1005

if history is None:

1006

history = self.revision_history()

1007

elif revno <= 0 or revno > len(history):

1008

raise bzrlib.errors.NoSuchRevision(self, revno)

1009

return history[revno - 1]

584

1010

585

1011

def revision_tree(self, revision_id):

586

1012

"""Return Tree for a revision on this branch.

587

1013

588

1014

`revision_id` may be None for the null revision, in which case

589

1015

an `EmptyTree` is returned."""

590

1016

# TODO: refactor this to use an existing revision object

1017

# so we don't need to read it in twice.

591

1018

if revision_id == None:

592

1019

return EmptyTree()

593

1020

else:

594

1021

inv = self.get_revision_inventory(revision_id)

595

return RevisionTree(self.text_store, inv)

596

1022

return RevisionTree(self.weave_store, inv, revision_id)

597

1023

598

1024

def working_tree(self):

599

1025

"""Return a `Tree` for the working copy."""

600

return WorkingTree(self.base, self.read_working_inventory())

1026

from bzrlib.workingtree import WorkingTree

1027

# TODO: In the future, WorkingTree should utilize Transport

1028

# RobertCollins 20051003 - I don't think it should - working trees are

1029

# much more complex to keep consistent than our careful .bzr subset.

1030

# instead, we should say that working trees are local only, and optimise

1031

# for that.

1032

return WorkingTree(self.base, branch=self)

601

1033

602

1034

603

1035

def basis_tree(self):

604

1036

"""Return `Tree` object for last revision.

605

1037

606

1038

If there are no revisions yet, return an `EmptyTree`.

607

608

>>> b = ScratchBranch(files=['foo'])

609

>>> b.basis_tree().has_filename('foo')

610

False

611

>>> b.working_tree().has_filename('foo')

612

True

613

>>> b.add('foo')

614

>>> b.commit('add foo')

615

>>> b.basis_tree().has_filename('foo')

616

True

617

"""

618

r = self.last_patch()

619

if r == None:

620

return EmptyTree()

621

else:

622

return RevisionTree(self.text_store, self.get_revision_inventory(r))

623

624

625

626

def write_log(self, show_timezone='original'):

627

"""Write out human-readable log of commits to this branch

628

629

:param utc: If true, show dates in universal time, not local time."""

630

## TODO: Option to choose either original, utc or local timezone

631

revno = 1

632

precursor = None

633

for p in self.revision_history():

634

print '-' * 40

635

print 'revno:', revno

636

## TODO: Show hash if --id is given.

637

##print 'revision-hash:', p

638

rev = self.get_revision(p)

639

print 'committer:', rev.committer

640

print 'timestamp: %s' % (format_date(rev.timestamp, rev.timezone or 0,

641

show_timezone))

642

643

## opportunistic consistency check, same as check_patch_chaining

644

if rev.precursor != precursor:

645

bailout("mismatched precursor!")

646

647

print 'message:'

648

if not rev.message:

649

print ' (no message)'

650

else:

651

for l in rev.message.split('\n'):

652

print ' ' + l

653

654

revno += 1

655

precursor = p

656

657

658

659

def show_status(branch, show_all=False):

660

"""Display single-line status for non-ignored working files.

661

662

The list is show sorted in order by file name.

663

664

>>> b = ScratchBranch(files=['foo', 'foo~'])

665

>>> b.show_status()

666

? foo

667

>>> b.add('foo')

668

>>> b.show_status()

669

A foo

670

>>> b.commit("add foo")

671

>>> b.show_status()

672

>>> os.unlink(b._rel('foo'))

673

>>> b.show_status()

674

D foo

675

676

677

:todo: Get state for single files.

678

679

:todo: Perhaps show a slash at the end of directory names.

680

681

"""

682

683

# We have to build everything into a list first so that it can

684

# sorted by name, incorporating all the different sources.

685

686

# FIXME: Rather than getting things in random order and then sorting,

687

# just step through in order.

688

689

# Interesting case: the old ID for a file has been removed,

690

# but a new file has been created under that name.

691

692

old = branch.basis_tree()

693

old_inv = old.inventory

694

new = branch.working_tree()

695

new_inv = new.inventory

696

697

for fs, fid, oldname, newname, kind in diff_trees(old, new):

698

if fs == 'R':

699

show_status(fs, kind,

700

oldname + ' => ' + newname)

701

elif fs == 'A' or fs == 'M':

702

show_status(fs, kind, newname)

703

elif fs == 'D':

704

show_status(fs, kind, oldname)

705

elif fs == '.':

706

if show_all:

707

show_status(fs, kind, newname)

708

elif fs == 'I':

709

if show_all:

710

show_status(fs, kind, newname)

711

elif fs == '?':

712

show_status(fs, kind, newname)

713

else:

714

bailout("wierd file state %r" % ((fs, fid),))

715

716

717

718

class ScratchBranch(Branch):

1039

"""

1040

return self.revision_tree(self.last_revision())

1041

1042

1043

def rename_one(self, from_rel, to_rel):

1044

"""Rename one file.

1045

1046

This can change the directory or the filename or both.

1047

"""

1048

self.lock_write()

1049

try:

1050

tree = self.working_tree()

1051

inv = tree.inventory

1052

if not tree.has_filename(from_rel):

1053

raise BzrError("can't rename: old working file %r does not exist" % from_rel)

1054

if tree.has_filename(to_rel):

1055

raise BzrError("can't rename: new working file %r already exists" % to_rel)

1056

1057

file_id = inv.path2id(from_rel)

1058

if file_id == None:

1059

raise BzrError("can't rename: old name %r is not versioned" % from_rel)

1060

1061

if inv.path2id(to_rel):

1062

raise BzrError("can't rename: new name %r is already versioned" % to_rel)

1063

1064

to_dir, to_tail = os.path.split(to_rel)

1065

to_dir_id = inv.path2id(to_dir)

1066

if to_dir_id == None and to_dir != '':

1067

raise BzrError("can't determine destination directory id for %r" % to_dir)

1068

1069

mutter("rename_one:")

1070

mutter(" file_id {%s}" % file_id)

1071

mutter(" from_rel %r" % from_rel)

1072

mutter(" to_rel %r" % to_rel)

1073

mutter(" to_dir %r" % to_dir)

1074

mutter(" to_dir_id {%s}" % to_dir_id)

1075

1076

inv.rename(file_id, to_dir_id, to_tail)

1077

1078

from_abs = self.abspath(from_rel)

1079

to_abs = self.abspath(to_rel)

1080

try:

1081

rename(from_abs, to_abs)

1082

except OSError, e:

1083

raise BzrError("failed to rename %r to %r: %s"

1084

% (from_abs, to_abs, e[1]),

1085

["rename rolled back"])

1086

1087

self._write_inventory(inv)

1088

finally:

1089

self.unlock()

1090

1091

1092

def move(self, from_paths, to_name):

1093

"""Rename files.

1094

1095

to_name must exist as a versioned directory.

1096

1097

If to_name exists and is a directory, the files are moved into

1098

it, keeping their old names. If it is a directory,

1099

1100

Note that to_name is only the last component of the new name;

1101

this doesn't change the directory.

1102

1103

This returns a list of (from_path, to_path) pairs for each

1104

entry that is moved.

1105

"""

1106

result = []

1107

self.lock_write()

1108

try:

1109

## TODO: Option to move IDs only

1110

assert not isinstance(from_paths, basestring)

1111

tree = self.working_tree()

1112

inv = tree.inventory

1113

to_abs = self.abspath(to_name)

1114

if not isdir(to_abs):

1115

raise BzrError("destination %r is not a directory" % to_abs)

1116

if not tree.has_filename(to_name):

1117

raise BzrError("destination %r not in working directory" % to_abs)

1118

to_dir_id = inv.path2id(to_name)

1119

if to_dir_id == None and to_name != '':

1120

raise BzrError("destination %r is not a versioned directory" % to_name)

1121

to_dir_ie = inv[to_dir_id]

1122

if to_dir_ie.kind not in ('directory', 'root_directory'):

1123

raise BzrError("destination %r is not a directory" % to_abs)

1124

1125

to_idpath = inv.get_idpath(to_dir_id)

1126

1127

for f in from_paths:

1128

if not tree.has_filename(f):

1129

raise BzrError("%r does not exist in working tree" % f)

1130

f_id = inv.path2id(f)

1131

if f_id == None:

1132

raise BzrError("%r is not versioned" % f)

1133

name_tail = splitpath(f)[-1]

1134

dest_path = appendpath(to_name, name_tail)

1135

if tree.has_filename(dest_path):

1136

raise BzrError("destination %r already exists" % dest_path)

1137

if f_id in to_idpath:

1138

raise BzrError("can't move %r to a subdirectory of itself" % f)

1139

1140

# OK, so there's a race here, it's possible that someone will

1141

# create a file in this interval and then the rename might be

1142

# left half-done. But we should have caught most problems.

1143

1144

for f in from_paths:

1145

name_tail = splitpath(f)[-1]

1146

dest_path = appendpath(to_name, name_tail)

1147

result.append((f, dest_path))

1148

inv.rename(inv.path2id(f), to_dir_id, name_tail)

1149

try:

1150

rename(self.abspath(f), self.abspath(dest_path))

1151

except OSError, e:

1152

raise BzrError("failed to rename %r to %r: %s" % (f, dest_path, e[1]),

1153

["rename rolled back"])

1154

1155

self._write_inventory(inv)

1156

finally:

1157

self.unlock()

1158

1159

return result

1160

1161

1162

def revert(self, filenames, old_tree=None, backups=True):
    """Restore selected files to the versions from a previous tree.

    filenames
        Paths to restore.  Each must be versioned in the working
        inventory (else NotVersionedError) and its file id must be
        present in `old_tree` (else BzrError).  All paths are checked
        before any file is touched.

    old_tree
        Tree to take the old contents from; defaults to basis_tree().

    backups
        If true (default) backups are made of files before
        they're overwritten.  If false, no backup is made.
    """
    from bzrlib.errors import NotVersionedError, BzrError
    from bzrlib.atomicfile import AtomicFile
    from bzrlib.osutils import backup_file

    inv = self.read_working_inventory()
    if old_tree is None:
        old_tree = self.basis_tree()
    old_inv = old_tree.inventory

    nids = []
    for fn in filenames:
        file_id = inv.path2id(fn)
        if not file_id:
            raise NotVersionedError("not a versioned file", fn)
        if not old_inv.has_id(file_id):
            raise BzrError("file not present in old tree", fn, file_id)
        nids.append((fn, file_id))

    # TODO: Rename back if it was previously at a different location

    # TODO: If given a directory, restore the entire contents from
    # the previous version.

    # TODO: Make a backup to a temporary file.

    # TODO: If the file previously didn't exist, delete it?
    for fn, file_id in nids:
        # Honour the caller's choice; previously a backup was always made.
        if backups:
            backup_file(fn)

        f = AtomicFile(fn, 'wb')
        try:
            f.write(old_tree.get_file(file_id).read())
            f.commit()
        finally:
            f.close()

1204

1205

1206

def pending_merges(self):
    """Return a list of pending merges.

    These are revisions that have been merged into the working
    directory but not yet committed.  The list holds the lines of the
    'pending-merges' control file with their trailing newlines removed;
    it is empty when that file does not exist.
    """
    if self._transport.has(self._rel_controlfilename('pending-merges')):
        lines = self.controlfile('pending-merges', 'r').readlines()
        return [line.rstrip('\n') for line in lines]
    return []

1219

1220

1221

def add_pending_merge(self, *revision_ids):
    """Record each of revision_ids as a pending merge.

    Ids already in the pending list (or repeated in the arguments) are
    added only once.  The list is written back only if it grew.
    """
    # TODO: Perhaps should check at this point that the
    # history of the revision is actually present?
    merges = self.pending_merges()
    count_before = len(merges)
    for rev_id in revision_ids:
        if rev_id not in merges:
            merges.append(rev_id)
    if len(merges) != count_before:
        self.set_pending_merges(merges)

1233

1234

def set_pending_merges(self, rev_list):
    """Replace the recorded pending merges with rev_list.

    The entries are joined with newlines and stored in the
    'pending-merges' control file while the write lock is held.
    """
    self.lock_write()
    try:
        contents = '\n'.join(rev_list)
        self.put_controlfile('pending-merges', contents)
    finally:
        self.unlock()

1240

1241

1242

def get_parent(self):
    """Return the parent location of the branch.

    This is the default location for push/pull/missing.  The usual
    pattern is that the user can override it by specifying a
    location.

    The control files 'parent', 'pull' and 'x-pull' are tried in that
    order.  The contents of the first one that can be read are
    returned with leading and trailing newlines stripped; None is
    returned when none of them exists.
    """
    import errno
    import sys
    for name in ('parent', 'pull', 'x-pull'):
        try:
            return self.controlfile(name, 'r').read().strip('\n')
        except IOError:
            # A missing file only means "try the next name"; any other
            # I/O failure is passed on to the caller.
            if sys.exc_info()[1].errno != errno.ENOENT:
                raise
    return None

1258

1259

1260

def set_parent(self, url):
    """Record url as the parent location of this branch.

    The url followed by a newline is written to the 'parent' control
    file through an AtomicFile, with the write lock held throughout.
    """
    # TODO: Maybe delete old location files?
    from bzrlib.atomicfile import AtomicFile
    self.lock_write()
    try:
        parent_file = AtomicFile(self.controlfilename('parent'))
        try:
            parent_file.write(url + '\n')
            parent_file.commit()
        finally:
            # close() runs whether or not the commit happened.
            parent_file.close()
    finally:
        self.unlock()

1273

1274

def check_revno(self, revno):
    """Check whether a revno corresponds to any revision.

    Zero (the NULL revision) is considered valid and is accepted
    without further checks; every other value is handed to
    check_real_revno.
    """
    if revno == 0:
        return
    self.check_real_revno(revno)

1281

1282

def check_real_revno(self, revno):
    """Check whether a revno corresponds to a real revision.

    Zero (the NULL revision) is considered invalid.

    Raises InvalidRevisionNumber when revno is below 1 or above the
    value returned by self.revno().
    """
    if not (1 <= revno <= self.revno()):
        raise InvalidRevisionNumber(revno)

1289

1290

1291

1292

1293

1294

class ScratchBranch(_Branch):
    """Special test class: a branch that cleans up after itself.

    >>> b = ScratchBranch()
    >>> isdir(b.base)
    True
    >>> bd = b.base
    >>> b._transport.__del__()
    >>> isdir(bd)
    False
    """

    def __init__(self, files=[], dirs=[], transport=None):
        """Make a test branch.

        This creates a temporary directory and runs init-tree in it.

        If any files are listed, they are created in the working copy.
        Directories named in dirs are made first, through the
        transport.

        When a transport is passed in, the branch is set up on it
        without init=True; otherwise a new ScratchTransport is created
        and the branch is initialised on that.
        """
        if transport is not None:
            super(ScratchBranch, self).__init__(transport)
        else:
            transport = bzrlib.transport.local.ScratchTransport()
            super(ScratchBranch, self).__init__(transport, init=True)

        for dirname in dirs:
            self._transport.mkdir(dirname)

        for filename in files:
            self._transport.put(filename, 'content of %s' % filename)

    def clone(self):
        """Return a ScratchBranch on a copy of this branch's directory.

        >>> orig = ScratchBranch(files=["file1", "file2"])
        >>> clone = orig.clone()
        >>> if os.name != 'nt':
        ...     os.path.samefile(orig.base, clone.base)
        ... else:
        ...     orig.base == clone.base
        ...
        False
        >>> os.path.isfile(os.path.join(clone.base, "file1"))
        True
        """
        from shutil import copytree
        from tempfile import mkdtemp
        # mkdtemp is used only to pick a fresh name: the directory is
        # removed again straight away and copytree then creates it.
        target = mkdtemp()
        os.rmdir(target)
        copytree(self.base, target, symlinks=True)
        scratch = bzrlib.transport.local.ScratchTransport(target)
        return ScratchBranch(transport=scratch)

745

1346

746

1347

747

1348

######################################################################

756

1357

## mutter('check %r for control file' % ((head, tail), ))

757

1358

if tail == bzrlib.BZRDIR:

758

1359

return True

1360

if filename == head:

1361

break

759

1362

filename = head

760

1363

return False

761

1364

762

1365

763

1366

764

def _gen_revision_id(when):
    """Return new revision-id.

    The id is user_email() and compact_date(when), each followed by
    '-', and then the hex form of 8 bytes from rand_bytes.
    """
    prefix = '%s-%s-' % (user_email(), compact_date(when))
    return prefix + hexlify(rand_bytes(8))

769

770

771

def gen_file_id(name):
    """Return new file id.

    This should probably generate proper UUIDs, but for the moment we
    cope with just randomness because running uuidgen every time is
    slow.

    The id joins three parts with '-': the cleaned-up last component
    of name, compact_date() of the current time, and the hex form of
    8 bytes from rand_bytes.
    """
    import re
    from binascii import hexlify
    from time import time

    # get last component: whatever follows the final '/', and within
    # that whatever follows the final backslash
    basename = name.split('/')[-1].split('\\')[-1]

    # make it not a hidden file
    basename = basename.lstrip('.')

    # remove any weird characters; we don't escape them but rather
    # just pull them out
    basename = re.sub(r'[^\w.]', '', basename)

    suffix = hexlify(rand_bytes(8))
    return '-'.join((basename, compact_date(time()), suffix))

1394

1395

1396

def gen_root_id():
    """Return a new tree-root file id.

    The id is generated by gen_file_id from the name 'TREE_ROOT'.
    """
    root_id = gen_file_id('TREE_ROOT')
    return root_id

782

1399

783

1400

Older »