~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/commit.py

Committer: John Arbash Meinel
Date: 2005-09-17 21:57:11 UTC
mto: (1393.2.1)
mto: This revision was merged to the branch mainline in revision 1396.
Revision ID: john@arbash-meinel.com-20050917215711-9fa31e650a1f2fd8

Got HttpTransport tests to pass. Check for EAGAIN, pass permit_failure around, etc

files added:
HACKING

Makefile

bzr-man.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/delta.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/intset.py

bzrlib/lock.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revisionspec.py

bzrlib/selftest

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testgraph.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testremotebranch.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/testtransport.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/store

bzrlib/store/compressed_text.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/ui.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/weave.py

bzrlib/weavefile.py

contrib/bash/bzr

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

doc/split-join-files.txt

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/revfile.txt

notes/schemas.xml

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testsweet.py

tools

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/history2weaves.py

tools/http_client.py

tools/testweave.py

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
bzrlib/remotebranch.py

bzrlib/statcache.py

bzrlib/tests.py

files renamed:
bzrlib/store.py => bzrlib/store/__init__.py

elementtree/ => bzrlib/util/elementtree/

urlgrabber/ => bzrlib/util/urlgrabber/

contrib/bash/bzr => contrib/bash/bzr.simple

files modified:
.bzrignore

NEWS

README

TODO

build-api

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/help.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/newinventory.py

bzrlib/osutils.py

bzrlib/revfile.py

bzrlib/revision.py

bzrlib/status.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/workingtree.py

bzrlib/xml.py

contrib/add-bzr-to-baz

doc/formats.txt

doc/index.txt

doc/tagging.txt

doc/todo-from-arch.txt

setup.py

testbzr

Show diffs side-by-side

added added

removed removed

bzrlib/commit.py

def commit(branch, message, timestamp=None, timezone=None,

def commit(branch, message,

timestamp=None,

timezone=None,

committer=None,

verbose=False):

verbose=True,

specific_files=None,

rev_id=None,

allow_pointless=True):

"""Commit working copy as a new revision.

The basic approach is to add all the file texts into the

be robust against files disappearing, moving, etc. So the

whole thing is a bit hard.

This raises PointlessCommit if there are no changes, no new merges,

and allow_pointless is false.

timestamp -- if not None, seconds-since-epoch for a

postdated/predated commit.

"""

import os, time, tempfile

from inventory import Inventory

from osutils import isdir, isfile, sha_string, quotefn, \

local_time_offset, username

specific_files

If true, commit only those files.

rev_id

If set, use this as the new revision id.

Useful for test or import commands that need to tightly

control what revisions are assigned. If you duplicate

a revision id that exists elsewhere it is your own fault.

If null (default), a time/random revision id is generated.

"""

import time, tempfile, re

from bzrlib.osutils import local_time_offset, username

from bzrlib.branch import gen_file_id

from bzrlib.errors import BzrError, PointlessCommit

from bzrlib.revision import Revision, RevisionReference

from bzrlib.trace import mutter, note

from bzrlib.xml import serializer_v4

branch.lock_write()

try:

# First walk over the working inventory; and both update that

# and also build a new revision inventory. The revision

# inventory needs to hold the text-id, sha1 and size of the

# actual file versions committed in the revision. (These are

# not present in the working inventory.) We also need to

# detect missing/deleted files, and remove them from the

# working inventory.

work_tree = branch.working_tree()

work_inv = work_tree.inventory

basis = branch.basis_tree()

basis_inv = basis.inventory

if verbose:

# note('looking for changes...')

# print 'looking for changes...'

# disabled; should be done at a higher level

pass

pending_merges = branch.pending_merges()

missing_ids, new_inv, any_changes = \

_gather_commit(branch,

work_tree,

work_inv,

basis_inv,

specific_files,

verbose)

100

101

if not (any_changes or allow_pointless or pending_merges):

102

raise PointlessCommit()

103

104

for file_id in missing_ids:

105

# Any files that have been deleted are now removed from the

106

# working inventory. Files that were not selected for commit

107

# are left as they were in the working inventory and omitted

108

# from the revision inventory.

109

110

# have to do this later so we don't mess up the iterator.

111

# since parents may be removed before their children we

112

# have to test.

113

114

# FIXME: There's probably a better way to do this; perhaps

115

# the workingtree should know how to filter itself.

116

if work_inv.has_id(file_id):

117

del work_inv[file_id]

118

119

if rev_id is None:

120

rev_id = _gen_revision_id(branch, time.time())

121

inv_id = rev_id

122

123

inv_tmp = tempfile.TemporaryFile()

124

125

serializer_v4.write_inventory(new_inv, inv_tmp)

126

inv_tmp.seek(0)

127

branch.inventory_store.add(inv_tmp, inv_id)

128

mutter('new inventory_id is {%s}' % inv_id)

129

130

# We could also just sha hash the inv_tmp file

131

# however, in the case that branch.inventory_store.add()

132

# ever actually does anything special

133

inv_sha1 = branch.get_inventory_sha1(inv_id)

134

135

branch._write_inventory(work_inv)

136

137

if timestamp == None:

138

timestamp = time.time()

139

140

if committer == None:

141

committer = username(branch)

142

143

if timezone == None:

144

timezone = local_time_offset()

145

146

mutter("building commit log message")

147

# Python strings can include characters that can't be

148

# represented in well-formed XML; escape characters that

149

# aren't listed in the XML specification

150

# (http://www.w3.org/TR/REC-xml/#NT-Char).

151

if isinstance(message, unicode):

152

char_pattern = u'[^\x09\x0A\x0D\u0020-\uD7FF\uE000-\uFFFD]'

153

else:

154

# Use a regular 'str' as pattern to avoid having re.subn

155

# return 'unicode' results.

156

char_pattern = '[^x09\x0A\x0D\x20-\xFF]'

157

message, escape_count = re.subn(

158

char_pattern,

159

lambda match: match.group(0).encode('unicode_escape'),

160

message)

161

if escape_count:

162

note("replaced %d control characters in message", escape_count)

163

rev = Revision(timestamp=timestamp,

164

timezone=timezone,

165

committer=committer,

166

message = message,

167

inventory_id=inv_id,

168

inventory_sha1=inv_sha1,

169

revision_id=rev_id)

170

171

rev.parents = []

172

precursor_id = branch.last_patch()

173

if precursor_id:

174

precursor_sha1 = branch.get_revision_sha1(precursor_id)

175

rev.parents.append(RevisionReference(precursor_id, precursor_sha1))

176

for merge_rev in pending_merges:

177

rev.parents.append(RevisionReference(merge_rev))

178

179

rev_tmp = tempfile.TemporaryFile()

180

serializer_v4.write_revision(rev, rev_tmp)

181

rev_tmp.seek(0)

182

branch.revision_store.add(rev_tmp, rev_id)

183

mutter("new revision_id is {%s}" % rev_id)

184

185

## XXX: Everything up to here can simply be orphaned if we abort

186

## the commit; it will leave junk files behind but that doesn't

187

## matter.

188

189

## TODO: Read back the just-generated changeset, and make sure it

190

## applies and recreates the right state.

191

192

## TODO: Also calculate and store the inventory SHA1

193

mutter("committing patch r%d" % (branch.revno() + 1))

194

195

branch.append_revision(rev_id)

196

197

branch.set_pending_merges([])

198

199

if verbose:

200

# disabled; should go through logging

201

# note("commited r%d" % branch.revno())

202

# print ("commited r%d" % branch.revno())

203

pass

204

finally:

205

branch.unlock()

206

207

208

209

def _gen_revision_id(branch, when):

210

"""Return new revision-id."""

211

from binascii import hexlify

212

from bzrlib.osutils import rand_bytes, compact_date, user_email

213

214

s = '%s-%s-' % (user_email(branch), compact_date(when))

215

s += hexlify(rand_bytes(8))

216

return s

217

218

219

def _gather_commit(branch, work_tree, work_inv, basis_inv, specific_files,

220

verbose):

221

"""Build inventory preparatory to commit.

222

223

Returns missing_ids, new_inv, any_changes.

224

225

This adds any changed files into the text store, and sets their

226

text-id, sha and size in the returned inventory appropriately.

227

228

missing_ids

229

Modified to hold a list of files that have been deleted from

230

the working directory; these should be removed from the

231

working inventory.

232

"""

233

from bzrlib.inventory import Inventory

234

from bzrlib.osutils import isdir, isfile, sha_string, quotefn, \

235

local_time_offset, username, kind_marker, is_inside_any

236

from branch import gen_file_id

from errors import BzrError

from revision import Revision

from textui import show_status

from trace import mutter, note

branch._need_writelock()

## TODO: Show branch names

# TODO: Don't commit if there are no changes, unless forced?

# First walk over the working inventory; and both update that

# and also build a new revision inventory. The revision

# inventory needs to hold the text-id, sha1 and size of the

# actual file versions committed in the revision. (These are

# not present in the working inventory.) We also need to

# detect missing/deleted files, and remove them from the

# working inventory.

work_inv = branch.read_working_inventory()

inv = Inventory()

basis = branch.basis_tree()

basis_inv = basis.inventory

237

from bzrlib.branch import gen_file_id

238

from bzrlib.errors import BzrError

239

from bzrlib.revision import Revision

240

from bzrlib.trace import mutter, note

241

242

any_changes = False

243

inv = Inventory(work_inv.root.file_id)

244

missing_ids = []

245

246

for path, entry in work_inv.iter_entries():

## TODO: Cope with files that have gone missing.

247

## TODO: Check that the file kind has not changed from the previous

248

## revision of this file (if any).

249

entry = entry.copy()

250

p = branch.abspath(path)

251

file_id = entry.file_id

252

mutter('commit prep file %s, id %r ' % (p, file_id))

253

if not os.path.exists(p):

254

if specific_files and not is_inside_any(specific_files, path):

255

mutter(' skipping file excluded from commit')

256

if basis_inv.has_id(file_id):

257

# carry over with previous state

258

inv.add(basis_inv[file_id].copy())

259

else:

260

# omit this from committed inventory

261

pass

262

continue

263

264

if not work_tree.has_id(file_id):

265

if verbose:

266

print('deleted %s%s' % (path, kind_marker(entry.kind)))

267

any_changes = True

268

mutter(" file is missing, removing from inventory")

if verbose:

show_status('D', entry.kind, quotefn(path))

269

missing_ids.append(file_id)

270

continue

271

# TODO: Handle files that have been deleted

# TODO: Maybe a special case for empty files? Seems a

# waste to store them many times.

272

# this is present in the new inventory; may be new, modified or

273

# unchanged.

274

old_ie = basis_inv.has_id(file_id) and basis_inv[file_id]

275

276

entry = entry.copy()

277

inv.add(entry)

278

if basis_inv.has_id(file_id):

100

old_kind = basis_inv[file_id].kind

279

if old_ie:

280

old_kind = old_ie.kind

101

281

if old_kind != entry.kind:

102

282

raise BzrError("entry %r changed kind from %r to %r"

103

283

% (file_id, old_kind, entry.kind))

104

284

105

285

if entry.kind == 'directory':

106

286

if not isdir(p):

107

raise BzrError("%s is entered as directory but not a directory" % quotefn(p))

287

raise BzrError("%s is entered as directory but not a directory"

288

% quotefn(p))

108

289

elif entry.kind == 'file':

109

290

if not isfile(p):

110

291

raise BzrError("%s is entered as file but is not a file" % quotefn(p))

111

292

112

content = file(p, 'rb').read()

113

114

entry.text_sha1 = sha_string(content)

115

entry.text_size = len(content)

116

117

old_ie = basis_inv.has_id(file_id) and basis_inv[file_id]

293

new_sha1 = work_tree.get_file_sha1(file_id)

294

118

295

if (old_ie

119

and (old_ie.text_size == entry.text_size)

120

and (old_ie.text_sha1 == entry.text_sha1)):

296

and old_ie.text_sha1 == new_sha1):

121

297

## assert content == basis.get_file(file_id).read()

122

entry.text_id = basis_inv[file_id].text_id

298

entry.text_id = old_ie.text_id

299

entry.text_sha1 = new_sha1

300

entry.text_size = old_ie.text_size

123

301

mutter(' unchanged from previous text_id {%s}' %

124

302

entry.text_id)

125

126

303

else:

304

content = file(p, 'rb').read()

305

306

# calculate the sha again, just in case the file contents

307

# changed since we updated the cache

308

entry.text_sha1 = sha_string(content)

309

entry.text_size = len(content)

310

127

311

entry.text_id = gen_file_id(entry.name)

128

312

branch.text_store.add(content, entry.text_id)

129

313

mutter(' stored with text_id {%s}' % entry.text_id)

130

if verbose:

131

if not old_ie:

132

state = 'A'

133

elif (old_ie.name == entry.name

134

and old_ie.parent_id == entry.parent_id):

135

state = 'M'

136

else:

137

state = 'R'

138

139

show_status(state, entry.kind, quotefn(path))

140

141

for file_id in missing_ids:

142

# have to do this later so we don't mess up the iterator.

143

# since parents may be removed before their children we

144

# have to test.

145

146

# FIXME: There's probably a better way to do this; perhaps

147

# the workingtree should know how to filter itself.

148

if work_inv.has_id(file_id):

149

del work_inv[file_id]

150

151

152

inv_id = rev_id = _gen_revision_id(time.time())

153

154

inv_tmp = tempfile.TemporaryFile()

155

inv.write_xml(inv_tmp)

156

inv_tmp.seek(0)

157

branch.inventory_store.add(inv_tmp, inv_id)

158

mutter('new inventory_id is {%s}' % inv_id)

159

160

branch._write_inventory(work_inv)

161

162

if timestamp == None:

163

timestamp = time.time()

164

165

if committer == None:

166

committer = username()

167

168

if timezone == None:

169

timezone = local_time_offset()

170

171

mutter("building commit log message")

172

rev = Revision(timestamp=timestamp,

173

timezone=timezone,

174

committer=committer,

175

precursor = branch.last_patch(),

176

message = message,

177

inventory_id=inv_id,

178

revision_id=rev_id)

179

180

rev_tmp = tempfile.TemporaryFile()

181

rev.write_xml(rev_tmp)

182

rev_tmp.seek(0)

183

branch.revision_store.add(rev_tmp, rev_id)

184

mutter("new revision_id is {%s}" % rev_id)

185

186

## XXX: Everything up to here can simply be orphaned if we abort

187

## the commit; it will leave junk files behind but that doesn't

188

## matter.

189

190

## TODO: Read back the just-generated changeset, and make sure it

191

## applies and recreates the right state.

192

193

## TODO: Also calculate and store the inventory SHA1

194

mutter("committing patch r%d" % (branch.revno() + 1))

195

196

197

branch.append_revision(rev_id)

198

199

if verbose:

200

note("commited r%d" % branch.revno())

201

202

203

204

def _gen_revision_id(when):

205

"""Return new revision-id."""

206

from binascii import hexlify

207

from osutils import rand_bytes, compact_date, user_email

208

209

s = '%s-%s-' % (user_email(), compact_date(when))

210

s += hexlify(rand_bytes(8))

211

return s

314

315

if verbose:

316

marked = path + kind_marker(entry.kind)

317

if not old_ie:

318

print 'added', marked

319

any_changes = True

320

elif old_ie == entry:

321

pass # unchanged

322

elif (old_ie.name == entry.name

323

and old_ie.parent_id == entry.parent_id):

324

print 'modified', marked

325

any_changes = True

326

else:

327

print 'renamed', marked

328

any_changes = True

329

elif old_ie != entry:

330

any_changes = True

331

332

return missing_ids, inv, any_changes

212

333

213

334

Older »