~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/commit.py

Committer: mbp at sourcefrog
Date: 2005-03-24 00:44:18 UTC
Revision ID: mbp@sourcefrog.net-20050324004418-b4a050f656c07f5f

show space usage for various stores in the info command

files added:
bzrlib/tests.py

doc/faq.txt

doc/quickref.txt

doc/roadmap.txt

doc/testing.txt

doc/work-order.txt

files removed:
.rsyncexclude

HACKING

Makefile

TODO

bzr-man.py

bzrlib/atomicfile.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/intset.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/newinventory.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/revisionspec.py

bzrlib/selftest

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_revision_info.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testgraph.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testremotebranch.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/ui.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/ignore.txt

doc/quotes.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/split-join-files.txt

doc/switch-in-branch.txt

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/revfile.txt

notes/schemas.xml

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

testsweet.py

tools

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/history2weaves.py

tools/http_client.py

tools/testweave.py

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files renamed:
bzrlib/util/elementtree/ => elementtree/

files modified:
.bzrignore

NEWS

README

build-api

bzrlib/__init__.py

bzrlib/add.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/osutils.py

bzrlib/revision.py

bzrlib/store.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/xml.py

doc/Makefile

doc/bitkeeper.txt

doc/formats.txt

doc/index.txt

doc/interrupted.txt

doc/merge.txt

doc/python.txt

doc/random.txt

doc/svk.txt

doc/tagging.txt

doc/todo-from-arch.txt

elementtree/ElementTree.py

notes/performance.txt

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/commit.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

def commit(branch, message,
           timestamp=None,
           timezone=None,
           committer=None,
           verbose=True,
           specific_files=None,
           rev_id=None,
           allow_pointless=True):
    """Commit working copy as a new revision.

    The basic approach is to add all the file texts into the
    store, then the inventory, then make a new revision pointing
    to that inventory and store that.

    This is not quite safe if the working copy changes during the
    commit; for the moment that is simply not allowed.  A better
    approach is to make a temporary copy of the files before
    computing their hashes, and then add those hashes in turn to
    the inventory.  This should mean at least that there are no
    broken hash pointers.  There is no way we can get a snapshot
    of the whole directory at an instant.  This would also have to
    be robust against files disappearing, moving, etc.  So the
    whole thing is a bit hard.

    The branch is write-locked for the duration of the commit and is
    always unlocked again, even if the commit fails part-way.

    This raises PointlessCommit if there are no changes, no new merges,
    and allow_pointless is false.

    message
        Log message for the revision.  Characters that cannot be
        represented in well-formed XML are replaced by their
        'unicode_escape' form before the revision is stored.

    timestamp
        If not None, seconds-since-epoch for a postdated/predated
        commit.  Defaults to the current time.

    timezone
        If None (default), local_time_offset() is used.

    committer
        If None (default), username(branch) is used.

    verbose
        Passed through to _gather_commit, which prints per-file
        changes when it is true.

    specific_files
        If true, commit only those files.

    rev_id
        If set, use this as the new revision id.
        Useful for test or import commands that need to tightly
        control what revisions are assigned.  If you duplicate
        a revision id that exists elsewhere it is your own fault.
        If null (default), a time/random revision id is generated.

    allow_pointless
        If false, refuse (with PointlessCommit) to commit when nothing
        changed and there are no pending merges.
    """

    import re
    import tempfile
    import time

    from bzrlib.osutils import local_time_offset, username
    from bzrlib.errors import PointlessCommit
    from bzrlib.revision import Revision, RevisionReference
    from bzrlib.trace import mutter, note
    from bzrlib.xml import serializer_v4

    branch.lock_write()

    try:
        # First walk over the working inventory; and both update that
        # and also build a new revision inventory.  The revision
        # inventory needs to hold the text-id, sha1 and size of the
        # actual file versions committed in the revision.  (These are
        # not present in the working inventory.)  We also need to
        # detect missing/deleted files, and remove them from the
        # working inventory.
        #
        # Progress messages ("looking for changes...", "committed rN")
        # are deliberately not emitted here; that should be done at a
        # higher level / through logging.

        work_tree = branch.working_tree()
        work_inv = work_tree.inventory
        basis = branch.basis_tree()
        basis_inv = basis.inventory

        pending_merges = branch.pending_merges()

        missing_ids, new_inv, any_changes = \
                     _gather_commit(branch,
                                    work_tree,
                                    work_inv,
                                    basis_inv,
                                    specific_files,
                                    verbose)

        if not (any_changes or allow_pointless or pending_merges):
            raise PointlessCommit()

        for file_id in missing_ids:
            # Any files that have been deleted are now removed from the
            # working inventory.  Files that were not selected for commit
            # are left as they were in the working inventory and omitted
            # from the revision inventory.

            # have to do this later so we don't mess up the iterator.
            # since parents may be removed before their children we
            # have to test.

            # FIXME: There's probably a better way to do this; perhaps
            # the workingtree should know how to filter itself.
            if work_inv.has_id(file_id):
                del work_inv[file_id]

        if rev_id is None:
            rev_id = _gen_revision_id(branch, time.time())
        # The inventory is stored under the same id as the revision.
        inv_id = rev_id

        inv_tmp = tempfile.TemporaryFile()

        serializer_v4.write_inventory(new_inv, inv_tmp)
        inv_tmp.seek(0)
        branch.inventory_store.add(inv_tmp, inv_id)
        mutter('new inventory_id is {%s}' % inv_id)

        # We could also just sha hash the inv_tmp file
        # however, in the case that branch.inventory_store.add()
        # ever actually does anything special
        inv_sha1 = branch.get_inventory_sha1(inv_id)

        branch._write_inventory(work_inv)

        if timestamp is None:
            timestamp = time.time()

        if committer is None:
            committer = username(branch)

        if timezone is None:
            timezone = local_time_offset()

        mutter("building commit log message")
        # Python strings can include characters that can't be
        # represented in well-formed XML; escape characters that
        # aren't listed in the XML specification
        # (http://www.w3.org/TR/REC-xml/#NT-Char).
        if isinstance(message, unicode):
            char_pattern = u'[^\x09\x0A\x0D\u0020-\uD7FF\uE000-\uFFFD]'
        else:
            # Use a regular 'str' as pattern to avoid having re.subn
            # return 'unicode' results.
            #
            # Tab (\x09) must be listed with its backslash: XML allows
            # it, so it has to stay out of the "escape this" set, the
            # same as in the unicode pattern above.
            char_pattern = '[^\x09\x0A\x0D\x20-\xFF]'
        message, escape_count = re.subn(
            char_pattern,
            lambda match: match.group(0).encode('unicode_escape'),
            message)
        if escape_count:
            note("replaced %d control characters in message", escape_count)
        rev = Revision(timestamp=timestamp,
                       timezone=timezone,
                       committer=committer,
                       message=message,
                       inventory_id=inv_id,
                       inventory_sha1=inv_sha1,
                       revision_id=rev_id)

        # Parents: the previous revision on this branch (if any) first,
        # followed by every pending merge.
        rev.parents = []
        precursor_id = branch.last_patch()
        if precursor_id:
            precursor_sha1 = branch.get_revision_sha1(precursor_id)
            rev.parents.append(RevisionReference(precursor_id, precursor_sha1))
        for merge_rev in pending_merges:
            rev.parents.append(RevisionReference(merge_rev))

        rev_tmp = tempfile.TemporaryFile()
        serializer_v4.write_revision(rev, rev_tmp)
        rev_tmp.seek(0)
        branch.revision_store.add(rev_tmp, rev_id)
        mutter("new revision_id is {%s}" % rev_id)

        ## XXX: Everything up to here can simply be orphaned if we abort
        ## the commit; it will leave junk files behind but that doesn't
        ## matter.

        ## TODO: Read back the just-generated changeset, and make sure it
        ## applies and recreates the right state.

        mutter("committing patch r%d" % (branch.revno() + 1))

        branch.append_revision(rev_id)

        branch.set_pending_merges([])
    finally:
        branch.unlock()

206

207

208

209

def _gen_revision_id(branch, when):
    """Build a fresh revision id for a commit on `branch`.

    The id has the form '<user email>-<compact date>-<random hex>',
    where the email comes from user_email(branch), the date part from
    compact_date(when), and the suffix is the hex form of 8 random
    bytes.
    """
    from binascii import hexlify
    from bzrlib.osutils import rand_bytes, compact_date, user_email

    prefix = '%s-%s-' % (user_email(branch), compact_date(when))
    random_suffix = hexlify(rand_bytes(8))
    return prefix + random_suffix

217

218

219

def _gather_commit(branch, work_tree, work_inv, basis_inv, specific_files,
                   verbose):
    """Build inventory preparatory to commit.

    Returns missing_ids, new_inv, any_changes.

    This adds any changed files into the text store, and sets their
    text-id, sha and size in the returned inventory appropriately.

    branch
        Used to resolve absolute paths and to reach the text store.

    work_tree, work_inv
        The working tree and its inventory; every entry of work_inv is
        visited.

    basis_inv
        Inventory of the basis revision, used to detect unchanged files
        and to carry over entries excluded by specific_files.

    specific_files
        If true, only entries inside one of these paths are committed;
        other entries keep their basis state (or are omitted if they
        are not in the basis).

    verbose
        If true, print a line for each deleted, added, modified or
        renamed entry.

    missing_ids
        Returned list of ids of files that have been deleted from
        the working directory; these should be removed from the
        working inventory.

    any_changes
        Returned flag, true if any visited entry was deleted, added or
        differs from its basis entry.

    Raises BzrError if an entry changed kind since the basis, or if the
    thing on disk does not match the kind recorded for the entry.
    """
    from bzrlib.inventory import Inventory
    from bzrlib.osutils import isdir, isfile, sha_string, quotefn, \
         kind_marker, is_inside_any

    from bzrlib.branch import gen_file_id
    from bzrlib.errors import BzrError
    from bzrlib.trace import mutter

    any_changes = False
    inv = Inventory(work_inv.root.file_id)
    missing_ids = []

    for path, entry in work_inv.iter_entries():
        p = branch.abspath(path)
        file_id = entry.file_id
        mutter('commit prep file %s, id %r ' % (p, file_id))

        if specific_files and not is_inside_any(specific_files, path):
            mutter(' skipping file excluded from commit')
            if basis_inv.has_id(file_id):
                # carry over with previous state
                inv.add(basis_inv[file_id].copy())
            else:
                # omit this from committed inventory
                pass
            continue

        if not work_tree.has_id(file_id):
            if verbose:
                print('deleted %s%s' % (path, kind_marker(entry.kind)))
            any_changes = True
            mutter(" file is missing, removing from inventory")
            missing_ids.append(file_id)
            continue

        # this is present in the new inventory; may be new, modified or
        # unchanged.  old_ie is the basis entry, or False when the file
        # is not in the basis inventory.
        old_ie = basis_inv.has_id(file_id) and basis_inv[file_id]

        # Work on a copy so the working inventory entry is not modified
        # when text_id/sha1/size are filled in below.
        entry = entry.copy()
        inv.add(entry)

        if old_ie:
            old_kind = old_ie.kind
            if old_kind != entry.kind:
                raise BzrError("entry %r changed kind from %r to %r"
                        % (file_id, old_kind, entry.kind))

        if entry.kind == 'directory':
            if not isdir(p):
                raise BzrError("%s is entered as directory but not a directory"
                               % quotefn(p))
        elif entry.kind == 'file':
            if not isfile(p):
                raise BzrError("%s is entered as file but is not a file" % quotefn(p))

            new_sha1 = work_tree.get_file_sha1(file_id)

            if (old_ie
                and old_ie.text_sha1 == new_sha1):
                ## assert content == basis.get_file(file_id).read()
                entry.text_id = old_ie.text_id
                entry.text_sha1 = new_sha1
                entry.text_size = old_ie.text_size
                mutter(' unchanged from previous text_id {%s}' %
                       entry.text_id)
            else:
                # Close the file explicitly rather than relying on
                # garbage collection to release the handle.
                f = open(p, 'rb')
                try:
                    content = f.read()
                finally:
                    f.close()

                # calculate the sha again, just in case the file contents
                # changed since we updated the cache
                entry.text_sha1 = sha_string(content)
                entry.text_size = len(content)

                entry.text_id = gen_file_id(entry.name)
                branch.text_store.add(content, entry.text_id)
                mutter(' stored with text_id {%s}' % entry.text_id)

        if verbose:
            marked = path + kind_marker(entry.kind)
            if not old_ie:
                print('added %s' % marked)
                any_changes = True
            elif old_ie == entry:
                pass                    # unchanged
            elif (old_ie.name == entry.name
                  and old_ie.parent_id == entry.parent_id):
                print('modified %s' % marked)
                any_changes = True
            else:
                print('renamed %s' % marked)
                any_changes = True
        elif old_ie != entry:
            any_changes = True

    return missing_ids, inv, any_changes

333

334

Older »