306
246
if message_callback is None:
307
247
if message is not None:
308
248
if isinstance(message, str):
309
message = message.decode(get_user_encoding())
249
message = message.decode(bzrlib.user_encoding)
310
250
message_callback = lambda x: message
312
252
raise BzrError("The message or message_callback keyword"
313
253
" parameter is required for commit().")
315
255
self.bound_branch = None
256
self.any_entries_changed = False
316
257
self.any_entries_deleted = False
317
if exclude is not None:
318
self.exclude = sorted(
319
minimum_path_selection(exclude))
322
258
self.local = local
323
259
self.master_branch = None
260
self.master_locked = False
324
261
self.recursive = recursive
325
262
self.rev_id = None
326
# self.specific_files is None to indicate no filter, or any iterable to
327
# indicate a filter - [] means no files at all, as per iter_changes.
328
263
if specific_files is not None:
329
264
self.specific_files = sorted(
330
265
minimum_path_selection(specific_files))
332
267
self.specific_files = None
268
self.specific_file_ids = None
334
269
self.allow_pointless = allow_pointless
270
self.revprops = revprops
335
271
self.message_callback = message_callback
336
272
self.timestamp = timestamp
337
273
self.timezone = timezone
338
274
self.committer = committer
339
275
self.strict = strict
340
276
self.verbose = verbose
277
# accumulates an inventory delta to the basis entry, so we can make
278
# just the necessary updates to the workingtree's cached basis.
279
self._basis_delta = []
342
281
self.work_tree.lock_write()
343
operation.add_cleanup(self.work_tree.unlock)
344
self.parents = self.work_tree.get_parent_ids()
345
# We can use record_iter_changes IFF iter_changes is compatible with
346
# the command line parameters, and the repository has fast delta
347
# generation. See bug 347649.
348
self.use_record_iter_changes = (
350
not self.branch.repository._format.supports_tree_reference and
351
(self.branch.repository._format.fast_deltas or
352
len(self.parents) < 2))
353
self.pb = ui.ui_factory.nested_progress_bar()
354
operation.add_cleanup(self.pb.finished)
282
self.pb = bzrlib.ui.ui_factory.nested_progress_bar()
355
283
self.basis_revid = self.work_tree.last_revision()
356
284
self.basis_tree = self.work_tree.basis_tree()
357
285
self.basis_tree.lock_read()
358
operation.add_cleanup(self.basis_tree.unlock)
359
# Cannot commit with conflicts present.
360
if len(self.work_tree.conflicts()) > 0:
361
raise ConflictsInTree
363
# Setup the bound branch variables as needed.
364
self._check_bound_branch(operation, possible_master_transports)
366
# Check that the working tree is up to date
367
old_revno, old_revid, new_revno = self._check_out_of_date_tree()
369
# Complete configuration setup
370
if reporter is not None:
371
self.reporter = reporter
372
elif self.reporter is None:
373
self.reporter = self._select_reporter()
374
if self.config_stack is None:
375
self.config_stack = self.work_tree.get_config_stack()
377
self._set_specific_file_ids()
379
# Setup the progress bar. As the number of files that need to be
380
# committed is unknown, progress is reported as stages.
381
# We keep track of entries separately though and include that
382
# information in the progress bar during the relevant stages.
383
self.pb_stage_name = ""
384
self.pb_stage_count = 0
385
self.pb_stage_total = 5
386
if self.bound_branch:
387
# 2 extra stages: "Uploading data to master branch" and "Merging
388
# tags to master branch"
389
self.pb_stage_total += 2
390
self.pb.show_pct = False
391
self.pb.show_spinner = False
392
self.pb.show_eta = False
393
self.pb.show_count = True
394
self.pb.show_bar = True
396
self._gather_parents()
397
# After a merge, a selected file commit is not supported.
398
# See 'bzr help merge' for an explanation as to why.
399
if len(self.parents) > 1 and self.specific_files is not None:
400
raise errors.CannotCommitSelectedFileMerge(self.specific_files)
401
# Excludes are a form of selected file commit.
402
if len(self.parents) > 1 and self.exclude:
403
raise errors.CannotCommitSelectedFileMerge(self.exclude)
405
# Collect the changes
406
self._set_progress_stage("Collecting changes", counter=True)
408
self.builder = self.branch.get_commit_builder(self.parents,
409
self.config_stack, timestamp, timezone, committer, self.revprops,
411
if not self.builder.supports_record_entry_contents and self.exclude:
413
raise errors.ExcludesUnsupported(self.branch.repository)
415
if self.builder.updates_branch and self.bound_branch:
417
raise AssertionError(
418
"bound branches not supported for commit builders "
419
"that update the branch")
422
self.builder.will_record_deletes()
423
# find the location being committed to
287
# Cannot commit with conflicts present.
288
if len(self.work_tree.conflicts()) > 0:
289
raise ConflictsInTree
291
# Setup the bound branch variables as needed.
292
self._check_bound_branch()
294
# Check that the working tree is up to date
295
old_revno, new_revno = self._check_out_of_date_tree()
297
# Complete configuration setup
298
if reporter is not None:
299
self.reporter = reporter
300
elif self.reporter is None:
301
self.reporter = self._select_reporter()
302
if self.config is None:
303
self.config = self.branch.get_config()
305
# If provided, ensure the specified files are versioned
306
if self.specific_files is not None:
307
# Note: This routine is being called because it raises
308
# PathNotVersionedError as a side effect of finding the IDs. We
309
# later use the ids we found as input to the working tree
310
# inventory iterator, so we only consider those ids rather than
311
# examining the whole tree again.
312
# XXX: Don't we have filter_unversioned to do this more
314
self.specific_file_ids = tree.find_ids_across_trees(
315
specific_files, [self.basis_tree, self.work_tree])
317
# Setup the progress bar. As the number of files that need to be
318
# committed is unknown, progress is reported as stages.
319
# We keep track of entries separately though and include that
320
# information in the progress bar during the relevant stages.
321
self.pb_stage_name = ""
322
self.pb_stage_count = 0
323
self.pb_stage_total = 5
424
324
if self.bound_branch:
425
master_location = self.master_branch.base
427
master_location = self.branch.base
429
# report the start of the commit
430
self.reporter.started(new_revno, self.rev_id, master_location)
432
self._update_builder_with_changes()
433
self._check_pointless()
435
# TODO: Now the new inventory is known, check for conflicts.
436
# ADHB 2006-08-08: If this is done, populate_new_inv should not add
437
# weave lines, because nothing should be recorded until it is known
438
# that commit will succeed.
439
self._set_progress_stage("Saving data locally")
440
self.builder.finish_inventory()
442
# Prompt the user for a commit message if none provided
443
message = message_callback(self)
444
self.message = message
446
# Add revision data to the local branch
447
self.rev_id = self.builder.commit(self.message)
450
mutter("aborting commit write group because of exception:")
451
trace.log_exception_quietly()
455
self._update_branches(old_revno, old_revid, new_revno)
457
# Make the working tree be up to date with the branch. This
458
# includes automatic changes scheduled to be made to the tree, such
459
# as updating its basis and unversioning paths that were missing.
460
self.work_tree.unversion(self.deleted_ids)
461
self._set_progress_stage("Updating the working tree")
462
self.work_tree.update_basis_by_delta(self.rev_id,
463
self.builder.get_basis_delta())
464
self.reporter.completed(new_revno, self.rev_id)
465
self._process_post_hooks(old_revno, new_revno)
468
def _update_branches(self, old_revno, old_revid, new_revno):
469
"""Update the master and local branch to the new revision.
471
This will try to make sure that the master branch is updated
472
before the local branch.
474
:param old_revno: Revision number of master branch before the
476
:param old_revid: Tip of master branch before the commit
477
:param new_revno: Revision number of the new commit
479
if not self.builder.updates_branch:
325
self.pb_stage_total += 1
326
self.pb.show_pct = False
327
self.pb.show_spinner = False
328
self.pb.show_eta = False
329
self.pb.show_count = True
330
self.pb.show_bar = True
332
# After a merge, a selected file commit is not supported.
333
# See 'bzr help merge' for an explanation as to why.
334
self.basis_inv = self.basis_tree.inventory
335
self._gather_parents()
336
if len(self.parents) > 1 and self.specific_files:
337
raise errors.CannotCommitSelectedFileMerge(self.specific_files)
339
# Collect the changes
340
self._set_progress_stage("Collecting changes",
341
entries_title="Directory")
342
self.builder = self.branch.get_commit_builder(self.parents,
343
self.config, timestamp, timezone, committer, revprops, rev_id)
346
# find the location being committed to
347
if self.bound_branch:
348
master_location = self.master_branch.base
350
master_location = self.branch.base
352
# report the start of the commit
353
self.reporter.started(new_revno, self.rev_id, master_location)
355
self._update_builder_with_changes()
356
self._report_and_accumulate_deletes()
357
self._check_pointless()
359
# TODO: Now the new inventory is known, check for conflicts.
360
# ADHB 2006-08-08: If this is done, populate_new_inv should not add
361
# weave lines, because nothing should be recorded until it is known
362
# that commit will succeed.
363
self._set_progress_stage("Saving data locally")
364
self.builder.finish_inventory()
366
# Prompt the user for a commit message if none provided
367
message = message_callback(self)
368
assert isinstance(message, unicode), type(message)
369
self.message = message
370
self._escape_commit_message()
372
# Add revision data to the local branch
373
self.rev_id = self.builder.commit(self.message)
480
379
self._process_pre_hooks(old_revno, new_revno)
482
381
# Upload revision data to the master.
483
382
# this will propagate merged revisions too if needed.
484
383
if self.bound_branch:
485
self._set_progress_stage("Uploading data to master branch")
384
if not self.master_branch.repository.has_same_location(
385
self.branch.repository):
386
self._set_progress_stage("Uploading data to master branch")
387
self.master_branch.repository.fetch(self.branch.repository,
388
revision_id=self.rev_id)
389
# now the master has the revision data
486
390
# 'commit' to the master first so a timeout here causes the
487
391
# local branch to be out of date
488
(new_revno, self.rev_id) = self.master_branch.import_last_revision_info_and_tags(
489
self.branch, new_revno, self.rev_id, lossy=self._lossy)
491
self.branch.fetch(self.master_branch, self.rev_id)
392
self.master_branch.set_last_revision_info(new_revno,
493
395
# and now do the commit locally.
494
396
self.branch.set_last_revision_info(new_revno, self.rev_id)
497
self._process_pre_hooks(old_revno, new_revno)
499
# The commit builder will already have updated the branch,
501
self.branch.set_last_revision_info(old_revno, old_revid)
504
# Merge local tags to remote
505
if self.bound_branch:
506
self._set_progress_stage("Merging tags to master branch")
507
tag_updates, tag_conflicts = self.branch.tags.merge_to(
508
self.master_branch.tags)
510
warning_lines = [' ' + name for name, _, _ in tag_conflicts]
511
note( gettext("Conflicting tags in bound branch:\n{0}".format(
512
"\n".join(warning_lines))) )
398
# Make the working tree up to date with the branch
399
self._set_progress_stage("Updating the working tree")
400
self.work_tree.update_basis_by_delta(self.rev_id,
402
self.reporter.completed(new_revno, self.rev_id)
403
self._process_post_hooks(old_revno, new_revno)
514
408
def _select_reporter(self):
515
409
"""Select the CommitReporter to use."""
661
564
old_revno, old_revid, new_revno, self.rev_id,
662
565
tree_delta, future_tree)
568
"""Cleanup any open locks, progress bars etc."""
569
cleanups = [self._cleanup_bound_branch,
570
self.basis_tree.unlock,
571
self.work_tree.unlock,
573
found_exception = None
574
for cleanup in cleanups:
577
# we want every cleanup to run no matter what.
578
# so we have a catchall here, but we will raise the
579
# last encountered exception up the stack: and
580
# typically this will be useful enough.
583
if found_exception is not None:
584
# don't do a plain raise, because the last exception may have been
585
# trashed, e is our sure-to-work exception even though it loses the
586
# full traceback. XXX: RBC 20060421 perhaps we could check the
587
# exc_info and if its the same one do a plain raise otherwise
588
# 'raise e' as we do now.
591
def _cleanup_bound_branch(self):
592
"""Executed at the end of a try/finally to cleanup a bound branch.
594
If the branch wasn't bound, this is a no-op.
595
If it was, it resets self.branch to the local branch, instead
598
if not self.bound_branch:
600
if self.master_locked:
601
self.master_branch.unlock()
603
def _escape_commit_message(self):
604
"""Replace xml-incompatible control characters."""
605
# FIXME: RBC 20060419 this should be done by the revision
606
# serialiser not by commit. Then we can also add an unescaper
607
# in the deserializer and start roundtripping revision messages
608
# precisely. See repository_implementations/test_repository.py
610
# Python strings can include characters that can't be
611
# represented in well-formed XML; escape characters that
612
# aren't listed in the XML specification
613
# (http://www.w3.org/TR/REC-xml/#NT-Char).
614
self.message, escape_count = re.subn(
615
u'[^\x09\x0A\x0D\u0020-\uD7FF\uE000-\uFFFD]+',
616
lambda match: match.group(0).encode('unicode_escape'),
619
self.reporter.escaped(escape_count, self.message)
664
621
def _gather_parents(self):
665
622
"""Record the parents of a merge for merge detection."""
666
# TODO: Make sure that this list doesn't contain duplicate
623
# TODO: Make sure that this list doesn't contain duplicate
667
624
# entries and the order is preserved when doing this.
668
if self.use_record_iter_changes:
670
self.basis_inv = self.basis_tree.inventory
625
self.parents = self.work_tree.get_parent_ids()
671
626
self.parent_invs = [self.basis_inv]
672
627
for revision in self.parents[1:]:
673
628
if self.branch.repository.has_revision(revision):
680
635
def _update_builder_with_changes(self):
681
636
"""Update the commit builder with the data about what has changed.
683
exclude = self.exclude
638
# Build the revision inventory.
640
# This starts by creating a new empty inventory. Depending on
641
# which files are selected for commit, and what is present in the
642
# current tree, the new inventory is populated. inventory entries
643
# which are candidates for modification have their revision set to
644
# None; inventory entries that are carried over untouched have their
645
# revision set to their prior value.
647
# ESEPARATIONOFCONCERNS: this function is diffing and using the diff
648
# results to create a new inventory at the same time, which results
649
# in bugs like #46635. Any reason not to use/enhance Tree.changes_from?
684
652
specific_files = self.specific_files
685
653
mutter("Selecting files for commit with filter %s", specific_files)
688
if self.use_record_iter_changes:
689
iter_changes = self.work_tree.iter_changes(self.basis_tree,
690
specific_files=specific_files)
691
iter_changes = self._filter_iter_changes(iter_changes)
692
for file_id, path, fs_hash in self.builder.record_iter_changes(
693
self.work_tree, self.basis_revid, iter_changes):
694
self.work_tree._observed_sha1(file_id, path, fs_hash)
696
# Build the new inventory
697
self._populate_from_inventory()
698
self._record_unselected()
699
self._report_and_accumulate_deletes()
701
def _filter_iter_changes(self, iter_changes):
702
"""Process iter_changes.
704
This method reports on the changes in iter_changes to the user, and
705
converts 'missing' entries in the iter_changes iterator to 'deleted'
706
entries. 'missing' entries have their
708
:param iter_changes: An iter_changes to process.
709
:return: A generator of changes.
711
reporter = self.reporter
712
report_changes = reporter.is_verbose()
714
for change in iter_changes:
716
old_path = change[1][0]
717
new_path = change[1][1]
718
versioned = change[3][1]
720
versioned = change[3][1]
721
if kind is None and versioned:
724
reporter.missing(new_path)
725
deleted_ids.append(change[0])
726
# Reset the new path (None) and new versioned flag (False)
727
change = (change[0], (change[1][0], None), change[2],
728
(change[3][0], False)) + change[4:]
729
new_path = change[1][1]
731
elif kind == 'tree-reference':
732
if self.recursive == 'down':
733
self._commit_nested_tree(change[0], change[1][1])
734
if change[3][0] or change[3][1]:
738
reporter.deleted(old_path)
739
elif old_path is None:
740
reporter.snapshot_change(gettext('added'), new_path)
741
elif old_path != new_path:
742
reporter.renamed(gettext('renamed'), old_path, new_path)
745
self.work_tree.branch.repository._format.rich_root_data):
746
# Don't report on changes to '' in non rich root
748
reporter.snapshot_change(gettext('modified'), new_path)
749
self._next_progress_entry()
750
# Unversion IDs that were found to be deleted
751
self.deleted_ids = deleted_ids
753
def _record_unselected(self):
655
# Build the new inventory
656
self._populate_from_inventory(specific_files)
754
658
# If specific files are selected, then all un-selected files must be
755
659
# recorded in their previous state. For more details, see
756
660
# https://lists.ubuntu.com/archives/bazaar/2007q3/028476.html.
757
if self.specific_files or self.exclude:
758
specific_files = self.specific_files or []
759
662
for path, old_ie in self.basis_inv.iter_entries():
760
if self.builder.new_inventory.has_id(old_ie.file_id):
663
if old_ie.file_id in self.builder.new_inventory:
761
664
# already added - skip.
763
if (is_inside_any(specific_files, path)
764
and not is_inside_any(self.exclude, path)):
765
# was inside the selected path, and not excluded - if not
766
# present it has been deleted so skip.
666
if is_inside_any(specific_files, path):
667
# was inside the selected path, if not present it has been
768
# From here down it was either not selected, or was excluded:
769
# We preserve the entry unaltered.
670
if old_ie.kind == 'directory':
671
self._next_progress_entry()
672
# not in final inv yet, was not in the selected files, so is an
673
# entry to be preserved unaltered.
770
674
ie = old_ie.copy()
771
675
# Note: specific file commits after a merge are currently
772
676
# prohibited. This test is for sanity/safety in case it's
773
677
# required after that changes.
774
678
if len(self.parents) > 1:
775
679
ie.revision = None
776
self.builder.record_entry_contents(ie, self.parent_invs, path,
777
self.basis_tree, None)
680
delta, version_recorded = self.builder.record_entry_contents(
681
ie, self.parent_invs, path, self.basis_tree, None)
683
self.any_entries_changed = True
684
if delta: self._basis_delta.append(delta)
779
686
def _report_and_accumulate_deletes(self):
780
if (isinstance(self.basis_inv, Inventory)
781
and isinstance(self.builder.new_inventory, Inventory)):
782
# the older Inventory classes provide a _byid dict, and building a
783
# set from the keys of this dict is substantially faster than even
784
# getting a set of ids from the inventory
786
# <lifeless> set(dict) is roughly the same speed as
787
# set(iter(dict)) and both are significantly slower than
789
deleted_ids = set(self.basis_inv._byid.keys()) - \
790
set(self.builder.new_inventory._byid.keys())
792
deleted_ids = set(self.basis_inv) - set(self.builder.new_inventory)
687
# XXX: Could the list of deleted paths and ids be instead taken from
688
# _populate_from_inventory?
689
deleted_ids = set(self.basis_inv._byid.keys()) - \
690
set(self.builder.new_inventory._byid.keys())
794
692
self.any_entries_deleted = True
795
693
deleted = [(self.basis_tree.id2path(file_id), file_id)