299
265
self.verbose = verbose
301
267
self.work_tree.lock_write()
302
operation.add_cleanup(self.work_tree.unlock)
303
self.parents = self.work_tree.get_parent_ids()
304
# We can use record_iter_changes IFF iter_changes is compatible with
305
# the command line parameters, and the repository has fast delta
306
# generation. See bug 347649.
307
self.use_record_iter_changes = (
309
not self.branch.repository._format.supports_tree_reference and
310
(self.branch.repository._format.fast_deltas or
311
len(self.parents) < 2))
312
268
self.pb = bzrlib.ui.ui_factory.nested_progress_bar()
313
operation.add_cleanup(self.pb.finished)
314
self.basis_revid = self.work_tree.last_revision()
315
269
self.basis_tree = self.work_tree.basis_tree()
316
270
self.basis_tree.lock_read()
317
operation.add_cleanup(self.basis_tree.unlock)
318
# Cannot commit with conflicts present.
319
if len(self.work_tree.conflicts()) > 0:
320
raise ConflictsInTree
322
# Setup the bound branch variables as needed.
323
self._check_bound_branch(operation, possible_master_transports)
325
# Check that the working tree is up to date
326
old_revno, new_revno = self._check_out_of_date_tree()
328
# Complete configuration setup
329
if reporter is not None:
330
self.reporter = reporter
331
elif self.reporter is None:
332
self.reporter = self._select_reporter()
333
if self.config is None:
334
self.config = self.branch.get_config()
336
self._set_specific_file_ids()
338
# Setup the progress bar. As the number of files that need to be
339
# committed in unknown, progress is reported as stages.
340
# We keep track of entries separately though and include that
341
# information in the progress bar during the relevant stages.
342
self.pb_stage_name = ""
343
self.pb_stage_count = 0
344
self.pb_stage_total = 5
345
if self.bound_branch:
346
self.pb_stage_total += 1
347
self.pb.show_pct = False
348
self.pb.show_spinner = False
349
self.pb.show_eta = False
350
self.pb.show_count = True
351
self.pb.show_bar = True
353
self._gather_parents()
354
# After a merge, a selected file commit is not supported.
355
# See 'bzr help merge' for an explanation as to why.
356
if len(self.parents) > 1 and self.specific_files is not None:
357
raise errors.CannotCommitSelectedFileMerge(self.specific_files)
358
# Excludes are a form of selected file commit.
359
if len(self.parents) > 1 and self.exclude:
360
raise errors.CannotCommitSelectedFileMerge(self.exclude)
362
# Collect the changes
363
self._set_progress_stage("Collecting changes", counter=True)
364
self.builder = self.branch.get_commit_builder(self.parents,
365
self.config, timestamp, timezone, committer, self.revprops, rev_id)
368
self.builder.will_record_deletes()
369
# find the location being committed to
370
if self.bound_branch:
371
master_location = self.master_branch.base
373
master_location = self.branch.base
375
# report the start of the commit
376
self.reporter.started(new_revno, self.rev_id, master_location)
378
self._update_builder_with_changes()
379
self._check_pointless()
381
# TODO: Now the new inventory is known, check for conflicts.
382
# ADHB 2006-08-08: If this is done, populate_new_inv should not add
383
# weave lines, because nothing should be recorded until it is known
384
# that commit will succeed.
385
self._set_progress_stage("Saving data locally")
386
self.builder.finish_inventory()
388
# Prompt the user for a commit message if none provided
389
message = message_callback(self)
390
self.message = message
392
# Add revision data to the local branch
393
self.rev_id = self.builder.commit(self.message)
396
mutter("aborting commit write group because of exception:")
397
trace.log_exception_quietly()
398
note("aborting commit write group: %r" % (e,))
402
self._process_pre_hooks(old_revno, new_revno)
404
# Upload revision data to the master.
405
# this will propagate merged revisions too if needed.
406
if self.bound_branch:
407
self._set_progress_stage("Uploading data to master branch")
408
# 'commit' to the master first so a timeout here causes the
409
# local branch to be out of date
410
self.master_branch.import_last_revision_info(
411
self.branch.repository, new_revno, self.rev_id)
413
# and now do the commit locally.
414
self.branch.set_last_revision_info(new_revno, self.rev_id)
416
# Make the working tree be up to date with the branch. This
417
# includes automatic changes scheduled to be made to the tree, such
418
# as updating its basis and unversioning paths that were missing.
419
self.work_tree.unversion(self.deleted_ids)
420
self._set_progress_stage("Updating the working tree")
421
self.work_tree.update_basis_by_delta(self.rev_id,
422
self.builder.get_basis_delta())
423
self.reporter.completed(new_revno, self.rev_id)
424
self._process_post_hooks(old_revno, new_revno)
272
# Cannot commit with conflicts present.
273
if len(self.work_tree.conflicts()) > 0:
274
raise ConflictsInTree
276
# Setup the bound branch variables as needed.
277
self._check_bound_branch()
279
# Check that the working tree is up to date
280
old_revno, new_revno = self._check_out_of_date_tree()
282
# Complete configuration setup
283
if reporter is not None:
284
self.reporter = reporter
285
elif self.reporter is None:
286
self.reporter = self._select_reporter()
287
if self.config is None:
288
self.config = self.branch.get_config()
290
# If provided, ensure the specified files are versioned
291
if self.specific_files is not None:
293
# is being called because it raises PathNotVerisonedError
294
# as a side effect of finding the IDs. We later use the ids we
295
# found as input to the working tree inventory iterator, so we
296
# only consider those ids rather than examining the whole tree
298
# XXX: Dont we have filter_unversioned to do this more
300
self.specific_file_ids = tree.find_ids_across_trees(
301
specific_files, [self.basis_tree, self.work_tree])
303
# Setup the progress bar. As the number of files that need to be
304
# committed in unknown, progress is reported as stages.
305
# We keep track of entries separately though and include that
306
# information in the progress bar during the relevant stages.
307
self.pb_stage_name = ""
308
self.pb_stage_count = 0
309
self.pb_stage_total = 5
310
if self.bound_branch:
311
self.pb_stage_total += 1
312
self.pb.show_pct = False
313
self.pb.show_spinner = False
314
self.pb.show_eta = False
315
self.pb.show_count = True
316
self.pb.show_bar = True
318
# After a merge, a selected file commit is not supported.
319
# See 'bzr help merge' for an explanation as to why.
320
self.basis_inv = self.basis_tree.inventory
321
self._gather_parents()
322
if len(self.parents) > 1 and self.specific_files:
323
raise errors.CannotCommitSelectedFileMerge(self.specific_files)
325
# Collect the changes
326
self._set_progress_stage("Collecting changes",
327
entries_title="Directory")
328
self.builder = self.branch.get_commit_builder(self.parents,
329
self.config, timestamp, timezone, committer, revprops, rev_id)
332
# find the location being committed to
333
if self.bound_branch:
334
master_location = self.master_branch.base
336
master_location = self.branch.base
338
# report the start of the commit
339
self.reporter.started(new_revno, self.rev_id, master_location)
341
self._update_builder_with_changes()
342
self._check_pointless()
344
# TODO: Now the new inventory is known, check for conflicts.
345
# ADHB 2006-08-08: If this is done, populate_new_inv should not add
346
# weave lines, because nothing should be recorded until it is known
347
# that commit will succeed.
348
self._set_progress_stage("Saving data locally")
349
self.builder.finish_inventory()
351
# Prompt the user for a commit message if none provided
352
message = message_callback(self)
353
assert isinstance(message, unicode), type(message)
354
self.message = message
355
self._escape_commit_message()
357
# Add revision data to the local branch
358
self.rev_id = self.builder.commit(self.message)
364
self._process_pre_hooks(old_revno, new_revno)
366
# Upload revision data to the master.
367
# this will propagate merged revisions too if needed.
368
if self.bound_branch:
369
self._set_progress_stage("Uploading data to master branch")
370
self.master_branch.repository.fetch(self.branch.repository,
371
revision_id=self.rev_id)
372
# now the master has the revision data
373
# 'commit' to the master first so a timeout here causes the
374
# local branch to be out of date
375
self.master_branch.set_last_revision_info(new_revno,
378
# and now do the commit locally.
379
self.branch.set_last_revision_info(new_revno, self.rev_id)
381
# Make the working tree up to date with the branch
382
self._set_progress_stage("Updating the working tree")
383
rev_tree = self.builder.revision_tree()
384
self.work_tree.set_parent_trees([(self.rev_id, rev_tree)])
385
self.reporter.completed(new_revno, self.rev_id)
386
self._process_post_hooks(old_revno, new_revno)
425
389
return self.rev_id
427
391
def _select_reporter(self):
581
546
old_revno, old_revid, new_revno, self.rev_id,
582
547
tree_delta, future_tree)
550
"""Cleanup any open locks, progress bars etc."""
551
cleanups = [self._cleanup_bound_branch,
552
self.basis_tree.unlock,
553
self.work_tree.unlock,
555
found_exception = None
556
for cleanup in cleanups:
559
# we want every cleanup to run no matter what.
560
# so we have a catchall here, but we will raise the
561
# last encountered exception up the stack: and
562
# typically this will be useful enough.
565
if found_exception is not None:
566
# don't do a plan raise, because the last exception may have been
567
# trashed, e is our sure-to-work exception even though it loses the
568
# full traceback. XXX: RBC 20060421 perhaps we could check the
569
# exc_info and if its the same one do a plain raise otherwise
570
# 'raise e' as we do now.
573
def _cleanup_bound_branch(self):
574
"""Executed at the end of a try/finally to cleanup a bound branch.
576
If the branch wasn't bound, this is a no-op.
577
If it was, it resents self.branch to the local branch, instead
580
if not self.bound_branch:
582
if self.master_locked:
583
self.master_branch.unlock()
585
def _escape_commit_message(self):
586
"""Replace xml-incompatible control characters."""
587
# FIXME: RBC 20060419 this should be done by the revision
588
# serialiser not by commit. Then we can also add an unescaper
589
# in the deserializer and start roundtripping revision messages
590
# precisely. See repository_implementations/test_repository.py
592
# Python strings can include characters that can't be
593
# represented in well-formed XML; escape characters that
594
# aren't listed in the XML specification
595
# (http://www.w3.org/TR/REC-xml/#NT-Char).
596
self.message, escape_count = re.subn(
597
u'[^\x09\x0A\x0D\u0020-\uD7FF\uE000-\uFFFD]+',
598
lambda match: match.group(0).encode('unicode_escape'),
601
self.reporter.escaped(escape_count, self.message)
584
603
def _gather_parents(self):
585
604
"""Record the parents of a merge for merge detection."""
586
# TODO: Make sure that this list doesn't contain duplicate
605
# TODO: Make sure that this list doesn't contain duplicate
587
606
# entries and the order is preserved when doing this.
588
if self.use_record_iter_changes:
590
self.basis_inv = self.basis_tree.inventory
607
self.parents = self.work_tree.get_parent_ids()
591
608
self.parent_invs = [self.basis_inv]
592
609
for revision in self.parents[1:]:
593
610
if self.branch.repository.has_revision(revision):
600
617
def _update_builder_with_changes(self):
601
618
"""Update the commit builder with the data about what has changed.
603
exclude = self.exclude
620
# Build the revision inventory.
622
# This starts by creating a new empty inventory. Depending on
623
# which files are selected for commit, and what is present in the
624
# current tree, the new inventory is populated. inventory entries
625
# which are candidates for modification have their revision set to
626
# None; inventory entries that are carried over untouched have their
627
# revision set to their prior value.
629
# ESEPARATIONOFCONCERNS: this function is diffing and using the diff
630
# results to create a new inventory at the same time, which results
631
# in bugs like #46635. Any reason not to use/enhance Tree.changes_from?
604
634
specific_files = self.specific_files
605
635
mutter("Selecting files for commit with filter %s", specific_files)
608
if self.use_record_iter_changes:
609
iter_changes = self.work_tree.iter_changes(self.basis_tree,
610
specific_files=specific_files)
611
iter_changes = self._filter_iter_changes(iter_changes)
612
for file_id, path, fs_hash in self.builder.record_iter_changes(
613
self.work_tree, self.basis_revid, iter_changes):
614
self.work_tree._observed_sha1(file_id, path, fs_hash)
616
# Build the new inventory
617
self._populate_from_inventory()
618
self._record_unselected()
619
self._report_and_accumulate_deletes()
621
def _filter_iter_changes(self, iter_changes):
622
"""Process iter_changes.
624
This method reports on the changes in iter_changes to the user, and
625
converts 'missing' entries in the iter_changes iterator to 'deleted'
626
entries. 'missing' entries have their
628
:param iter_changes: An iter_changes to process.
629
:return: A generator of changes.
631
reporter = self.reporter
632
report_changes = reporter.is_verbose()
634
for change in iter_changes:
636
old_path = change[1][0]
637
new_path = change[1][1]
638
versioned = change[3][1]
640
versioned = change[3][1]
641
if kind is None and versioned:
644
reporter.missing(new_path)
645
deleted_ids.append(change[0])
646
# Reset the new path (None) and new versioned flag (False)
647
change = (change[0], (change[1][0], None), change[2],
648
(change[3][0], False)) + change[4:]
649
elif kind == 'tree-reference':
650
if self.recursive == 'down':
651
self._commit_nested_tree(change[0], change[1][1])
652
if change[3][0] or change[3][1]:
656
reporter.deleted(old_path)
657
elif old_path is None:
658
reporter.snapshot_change('added', new_path)
659
elif old_path != new_path:
660
reporter.renamed('renamed', old_path, new_path)
663
self.work_tree.branch.repository._format.rich_root_data):
664
# Don't report on changes to '' in non rich root
666
reporter.snapshot_change('modified', new_path)
667
self._next_progress_entry()
668
# Unversion IDs that were found to be deleted
669
self.deleted_ids = deleted_ids
671
def _record_unselected(self):
637
# Check and warn about old CommitBuilders
638
if not self.builder.record_root_entry:
639
symbol_versioning.warn('CommitBuilders should support recording'
640
' the root entry as of bzr 0.10.', DeprecationWarning,
642
self.builder.new_inventory.add(self.basis_inv.root.copy())
644
# Build the new inventory
645
self._populate_from_inventory(specific_files)
672
647
# If specific files are selected, then all un-selected files must be
673
648
# recorded in their previous state. For more details, see
674
649
# https://lists.ubuntu.com/archives/bazaar/2007q3/028476.html.
675
if self.specific_files or self.exclude:
676
specific_files = self.specific_files or []
677
651
for path, old_ie in self.basis_inv.iter_entries():
678
652
if old_ie.file_id in self.builder.new_inventory:
679
# already added - skip.
681
if (is_inside_any(specific_files, path)
682
and not is_inside_any(self.exclude, path)):
683
# was inside the selected path, and not excluded - if not
684
# present it has been deleted so skip.
686
# From here down it was either not selected, or was excluded:
687
# We preserve the entry unaltered.
654
if is_inside_any(specific_files, path):
656
if old_ie.kind == 'directory':
657
self._next_progress_entry()
688
658
ie = old_ie.copy()
689
659
# Note: specific file commits after a merge are currently
690
660
# prohibited. This test is for sanity/safety in case it's
691
661
# required after that changes.
692
662
if len(self.parents) > 1:
693
663
ie.revision = None
694
self.builder.record_entry_contents(ie, self.parent_invs, path,
695
self.basis_tree, None)
664
if self.builder.record_entry_contents(ie, self.parent_invs, path,
666
self.any_entries_changed = True
697
def _report_and_accumulate_deletes(self):
698
if (isinstance(self.basis_inv, Inventory)
699
and isinstance(self.builder.new_inventory, Inventory)):
700
# the older Inventory classes provide a _byid dict, and building a
701
# set from the keys of this dict is substantially faster than even
702
# getting a set of ids from the inventory
704
# <lifeless> set(dict) is roughly the same speed as
705
# set(iter(dict)) and both are significantly slower than
707
deleted_ids = set(self.basis_inv._byid.keys()) - \
708
set(self.builder.new_inventory._byid.keys())
710
deleted_ids = set(self.basis_inv) - set(self.builder.new_inventory)
668
# note that deletes have occurred
669
if set(self.basis_inv._byid.keys()) - set(self.builder.new_inventory._byid.keys()):
712
670
self.any_entries_deleted = True
713
deleted = [(self.basis_tree.id2path(file_id), file_id)
714
for file_id in deleted_ids]
716
# XXX: this is not quite directory-order sorting
717
for path, file_id in deleted:
718
self.builder.record_delete(path, file_id)
719
self.reporter.deleted(path)
671
# Report what was deleted.
672
if self.any_entries_deleted and self.reporter.is_verbose():
673
for path, ie in self.basis_inv.iter_entries():
674
if ie.file_id not in self.builder.new_inventory:
675
self.reporter.deleted(path)
721
def _check_strict(self):
722
# XXX: when we use iter_changes this would likely be faster if
723
# iter_changes would check for us (even in the presence of
677
def _populate_from_inventory(self, specific_files):
678
"""Populate the CommitBuilder by walking the working tree inventory."""
726
680
# raise an exception as soon as we find a single unknown.
727
681
for unknown in self.work_tree.unknowns():
728
682
raise StrictCommitFailed()
730
def _populate_from_inventory(self):
731
"""Populate the CommitBuilder by walking the working tree inventory."""
732
# Build the revision inventory.
734
# This starts by creating a new empty inventory. Depending on
735
# which files are selected for commit, and what is present in the
736
# current tree, the new inventory is populated. inventory entries
737
# which are candidates for modification have their revision set to
738
# None; inventory entries that are carried over untouched have their
739
# revision set to their prior value.
741
# ESEPARATIONOFCONCERNS: this function is diffing and using the diff
742
# results to create a new inventory at the same time, which results
743
# in bugs like #46635. Any reason not to use/enhance Tree.changes_from?
746
specific_files = self.specific_files
747
exclude = self.exclude
748
684
report_changes = self.reporter.is_verbose()
750
# A tree of paths that have been deleted. E.g. if foo/bar has been
751
# deleted, then we have {'foo':{'bar':{}}}
753
# XXX: Note that entries may have the wrong kind because the entry does
754
# not reflect the status on disk.
686
deleted_paths = set()
755
687
work_inv = self.work_tree.inventory
756
# NB: entries will include entries within the excluded ids/paths
757
# because iter_entries_by_dir has no 'exclude' facility today.
688
assert work_inv.root is not None
758
689
entries = work_inv.iter_entries_by_dir(
759
690
specific_file_ids=self.specific_file_ids, yield_parents=True)
691
if not self.builder.record_root_entry:
760
693
for path, existing_ie in entries:
761
694
file_id = existing_ie.file_id
762
695
name = existing_ie.name
763
696
parent_id = existing_ie.parent_id
764
697
kind = existing_ie.kind
698
if kind == 'directory':
699
self._next_progress_entry()
765
700
# Skip files that have been deleted from the working tree.
766
# The deleted path ids are also recorded so they can be explicitly
769
path_segments = splitpath(path)
770
deleted_dict = deleted_paths
771
for segment in path_segments:
772
deleted_dict = deleted_dict.get(segment, None)
774
# We either took a path not present in the dict
775
# (deleted_dict was None), or we've reached an empty
776
# child dir in the dict, so are now a sub-path.
780
if deleted_dict is not None:
781
# the path has a deleted parent, do not add it.
783
if exclude and is_inside_any(exclude, path):
784
# Skip excluded paths. Excluded paths are processed by
785
# _update_builder_with_changes.
787
content_summary = self.work_tree.path_content_summary(path)
788
kind = content_summary[0]
789
# Note that when a filter of specific files is given, we must only
790
# skip/record deleted files matching that filter.
791
if not specific_files or is_inside_any(specific_files, path):
792
if kind == 'missing':
793
if not deleted_paths:
794
# path won't have been split yet.
795
path_segments = splitpath(path)
796
deleted_dict = deleted_paths
797
for segment in path_segments:
798
deleted_dict = deleted_dict.setdefault(segment, {})
799
self.reporter.missing(path)
800
self._next_progress_entry()
801
deleted_ids.append(file_id)
803
# TODO: have the builder do the nested commit just-in-time IF and
805
if kind == 'tree-reference':
806
# enforce repository nested tree policy.
807
if (not self.work_tree.supports_tree_reference() or
808
# repository does not support it either.
809
not self.branch.repository._format.supports_tree_reference):
811
content_summary = (kind, None, None, None)
812
elif self.recursive == 'down':
813
nested_revision_id = self._commit_nested_tree(
815
content_summary = (kind, None, None, nested_revision_id)
817
nested_revision_id = self.work_tree.get_reference_revision(file_id)
818
content_summary = (kind, None, None, nested_revision_id)
701
# The deleted files/directories are also recorded so they
702
# can be explicitly unversioned later. Note that when a
703
# filter of specific files is given, we must only skip/record
704
# deleted files matching that filter.
705
if is_inside_any(deleted_paths, path):
707
if not self.work_tree.has_filename(path):
708
deleted_paths.add(path)
709
self.reporter.missing(path)
710
deleted_ids.append(file_id)
713
kind = self.work_tree.kind(file_id)
714
# TODO: specific_files filtering before nested tree processing
715
if kind == 'tree-reference' and self.recursive == 'down':
716
self._commit_nested_tree(file_id, path)
717
except errors.NoSuchFile:
820
720
# Record an entry for this item
821
721
# Note: I don't particularly want to have the existing_ie