/brz/remove-bazaar

To get this branch, use:
bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/transform.py

  • Committer: mbp at sourcefrog
  • Date: 2011-04-11 01:23:58 UTC
  • mfrom: (5777 +trunk)
  • mto: This revision was merged to the branch mainline in revision 5802.
  • Revision ID: mbp@sourcefrog.net-20110411012358-gl07rdtxydlq7fh1
merge news

Show diffs side-by-side

added added

removed removed

Lines of Context:
1
 
# Copyright (C) 2006-2010 Canonical Ltd
 
1
# Copyright (C) 2006-2011 Canonical Ltd
2
2
#
3
3
# This program is free software; you can redistribute it and/or modify
4
4
# it under the terms of the GNU General Public License as published by
19
19
from stat import S_ISREG, S_IEXEC
20
20
import time
21
21
 
22
 
from bzrlib.lazy_import import lazy_import
23
 
lazy_import(globals(), """
 
22
from bzrlib import (
 
23
    errors,
 
24
    lazy_import,
 
25
    registry,
 
26
    trace,
 
27
    tree,
 
28
    )
 
29
lazy_import.lazy_import(globals(), """
24
30
from bzrlib import (
25
31
    annotate,
26
32
    bencode,
33
39
    osutils,
34
40
    revision as _mod_revision,
35
41
    ui,
 
42
    urlutils,
36
43
    )
37
44
""")
38
45
from bzrlib.errors import (DuplicateKey, MalformedTransform, NoSuchFile,
40
47
                           ExistingLimbo, ImmortalLimbo, NoFinalPath,
41
48
                           UnableCreateSymlink)
42
49
from bzrlib.filters import filtered_output_bytes, ContentFilterContext
43
 
from bzrlib.inventory import InventoryEntry
44
50
from bzrlib.osutils import (
45
51
    delete_any,
46
52
    file_kind,
47
53
    has_symlinks,
48
 
    lexists,
49
54
    pathjoin,
50
55
    sha_file,
51
56
    splitpath,
52
57
    supports_executable,
53
 
)
 
58
    )
54
59
from bzrlib.progress import ProgressPhase
55
60
from bzrlib.symbol_versioning import (
56
 
        deprecated_function,
57
 
        deprecated_in,
58
 
        )
59
 
from bzrlib.trace import mutter, warning
60
 
from bzrlib import tree
61
 
import bzrlib.ui
62
 
import bzrlib.urlutils as urlutils
 
61
    deprecated_function,
 
62
    deprecated_in,
 
63
    deprecated_method,
 
64
    )
63
65
 
64
66
 
65
67
ROOT_PARENT = "root-parent"
66
68
 
67
 
 
68
69
def unique_add(map, key, value):
69
70
    if key in map:
70
71
        raise DuplicateKey(key=key)
71
72
    map[key] = value
72
73
 
73
74
 
 
75
 
74
76
class _TransformResults(object):
75
77
    def __init__(self, modified_paths, rename_count):
76
78
        object.__init__(self)
100
102
        self._new_parent = {}
101
103
        # mapping of trans_id with new contents -> new file_kind
102
104
        self._new_contents = {}
 
105
        # mapping of trans_id => (sha1 of content, stat_value)
 
106
        self._observed_sha1s = {}
103
107
        # Set of trans_ids whose contents will be removed
104
108
        self._removed_contents = set()
105
109
        # Mapping of trans_id -> new execute-bit value
124
128
            self._new_root = self.trans_id_tree_file_id(root_id)
125
129
        else:
126
130
            self._new_root = None
127
 
        # Indictor of whether the transform has been applied
 
131
        # Indicator of whether the transform has been applied
128
132
        self._done = False
129
133
        # A progress bar
130
134
        self._pb = pb
315
319
 
316
320
    def delete_contents(self, trans_id):
317
321
        """Schedule the contents of a path entry for deletion"""
318
 
        # Ensure that the object exists in the WorkingTree, this will raise an
319
 
        # exception if there is a problem
320
 
        self.tree_kind(trans_id)
321
 
        self._removed_contents.add(trans_id)
 
322
        kind = self.tree_kind(trans_id)
 
323
        if kind is not None:
 
324
            self._removed_contents.add(trans_id)
322
325
 
323
326
    def cancel_deletion(self, trans_id):
324
327
        """Cancel a scheduled deletion"""
389
392
        changed_kind = set(self._removed_contents)
390
393
        changed_kind.intersection_update(self._new_contents)
391
394
        changed_kind.difference_update(new_ids)
392
 
        changed_kind = (t for t in changed_kind if self.tree_kind(t) !=
393
 
                        self.final_kind(t))
 
395
        changed_kind = (t for t in changed_kind
 
396
                        if self.tree_kind(t) != self.final_kind(t))
394
397
        new_ids.update(changed_kind)
395
398
        return sorted(FinalPaths(self).get_paths(new_ids))
396
399
 
397
400
    def final_kind(self, trans_id):
398
401
        """Determine the final file kind, after any changes applied.
399
402
 
400
 
        Raises NoSuchFile if the file does not exist/has no contents.
401
 
        (It is conceivable that a path would be created without the
402
 
        corresponding contents insertion command)
 
403
        :return: None if the file does not exist/has no contents.  (It is
 
404
            conceivable that a path would be created without the corresponding
 
405
            contents insertion command)
403
406
        """
404
407
        if trans_id in self._new_contents:
405
408
            return self._new_contents[trans_id]
406
409
        elif trans_id in self._removed_contents:
407
 
            raise NoSuchFile(None)
 
410
            return None
408
411
        else:
409
412
            return self.tree_kind(trans_id)
410
413
 
523
526
        for trans_id in self._removed_id:
524
527
            file_id = self.tree_file_id(trans_id)
525
528
            if file_id is not None:
 
529
                # XXX: This seems like something that should go via a different
 
530
                #      indirection.
526
531
                if self._tree.inventory[file_id].kind == 'directory':
527
532
                    parents.append(trans_id)
528
533
            elif self.tree_kind(trans_id) == 'directory':
532
537
            # ensure that all children are registered with the transaction
533
538
            list(self.iter_tree_children(parent_id))
534
539
 
 
540
    @deprecated_method(deprecated_in((2, 3, 0)))
535
541
    def has_named_child(self, by_parent, parent_id, name):
536
 
        try:
537
 
            children = by_parent[parent_id]
538
 
        except KeyError:
539
 
            children = []
540
 
        for child in children:
 
542
        return self._has_named_child(
 
543
            name, parent_id, known_children=by_parent.get(parent_id, []))
 
544
 
 
545
    def _has_named_child(self, name, parent_id, known_children):
 
546
        """Does a parent already have a name child.
 
547
 
 
548
        :param name: The searched for name.
 
549
 
 
550
        :param parent_id: The parent for which the check is made.
 
551
 
 
552
        :param known_children: The already known children. This should have
 
553
            been recently obtained from `self.by_parent().get(parent_id)`
 
554
            (or will be if None is passed).
 
555
        """
 
556
        if known_children is None:
 
557
            known_children = self.by_parent().get(parent_id, [])
 
558
        for child in known_children:
541
559
            if self.final_name(child) == name:
542
560
                return True
543
 
        try:
544
 
            path = self._tree_id_paths[parent_id]
545
 
        except KeyError:
 
561
        parent_path = self._tree_id_paths.get(parent_id, None)
 
562
        if parent_path is None:
 
563
            # No parent... no children
546
564
            return False
547
 
        childpath = joinpath(path, name)
548
 
        child_id = self._tree_path_ids.get(childpath)
 
565
        child_path = joinpath(parent_path, name)
 
566
        child_id = self._tree_path_ids.get(child_path, None)
549
567
        if child_id is None:
550
 
            return lexists(self._tree.abspath(childpath))
 
568
            # Not known by the tree transform yet, check the filesystem
 
569
            return osutils.lexists(self._tree.abspath(child_path))
551
570
        else:
552
 
            if self.final_parent(child_id) != parent_id:
553
 
                return False
554
 
            if child_id in self._removed_contents:
555
 
                # XXX What about dangling file-ids?
556
 
                return False
557
 
            else:
558
 
                return True
 
571
            raise AssertionError('child_id is missing: %s, %s, %s'
 
572
                                 % (name, parent_id, child_id))
 
573
 
 
574
    def _available_backup_name(self, name, target_id):
 
575
        """Find an available backup name.
 
576
 
 
577
        :param name: The basename of the file.
 
578
 
 
579
        :param target_id: The directory trans_id where the backup should 
 
580
            be placed.
 
581
        """
 
582
        known_children = self.by_parent().get(target_id, [])
 
583
        return osutils.available_backup_name(
 
584
            name,
 
585
            lambda base: self._has_named_child(
 
586
                base, target_id, known_children))
559
587
 
560
588
    def _parent_loops(self):
561
589
        """No entry should be its own ancestor"""
596
624
        """
597
625
        conflicts = []
598
626
        for trans_id in self._new_id.iterkeys():
599
 
            try:
600
 
                kind = self.final_kind(trans_id)
601
 
            except NoSuchFile:
 
627
            kind = self.final_kind(trans_id)
 
628
            if kind is None:
602
629
                conflicts.append(('versioning no contents', trans_id))
603
630
                continue
604
 
            if not InventoryEntry.versionable_kind(kind):
 
631
            if not inventory.InventoryEntry.versionable_kind(kind):
605
632
                conflicts.append(('versioning bad kind', trans_id, kind))
606
633
        return conflicts
607
634
 
618
645
            if self.final_file_id(trans_id) is None:
619
646
                conflicts.append(('unversioned executability', trans_id))
620
647
            else:
621
 
                try:
622
 
                    non_file = self.final_kind(trans_id) != "file"
623
 
                except NoSuchFile:
624
 
                    non_file = True
625
 
                if non_file is True:
 
648
                if self.final_kind(trans_id) != "file":
626
649
                    conflicts.append(('non-file executability', trans_id))
627
650
        return conflicts
628
651
 
630
653
        """Check for overwrites (not permitted on Win32)"""
631
654
        conflicts = []
632
655
        for trans_id in self._new_contents:
633
 
            try:
634
 
                self.tree_kind(trans_id)
635
 
            except NoSuchFile:
 
656
            if self.tree_kind(trans_id) is None:
636
657
                continue
637
658
            if trans_id not in self._removed_contents:
638
659
                conflicts.append(('overwrite', trans_id,
645
666
        if (self._new_name, self._new_parent) == ({}, {}):
646
667
            return conflicts
647
668
        for children in by_parent.itervalues():
648
 
            name_ids = [(self.final_name(t), t) for t in children]
649
 
            if not self._case_sensitive_target:
650
 
                name_ids = [(n.lower(), t) for n, t in name_ids]
 
669
            name_ids = []
 
670
            for child_tid in children:
 
671
                name = self.final_name(child_tid)
 
672
                if name is not None:
 
673
                    # Keep children only if they still exist in the end
 
674
                    if not self._case_sensitive_target:
 
675
                        name = name.lower()
 
676
                    name_ids.append((name, child_tid))
651
677
            name_ids.sort()
652
678
            last_name = None
653
679
            last_trans_id = None
654
680
            for name, trans_id in name_ids:
655
 
                try:
656
 
                    kind = self.final_kind(trans_id)
657
 
                except NoSuchFile:
658
 
                    kind = None
 
681
                kind = self.final_kind(trans_id)
659
682
                file_id = self.final_file_id(trans_id)
660
683
                if kind is None and file_id is None:
661
684
                    continue
680
703
        return conflicts
681
704
 
682
705
    def _parent_type_conflicts(self, by_parent):
683
 
        """parents must have directory 'contents'."""
 
706
        """Children must have a directory parent"""
684
707
        conflicts = []
685
708
        for parent_id, children in by_parent.iteritems():
686
709
            if parent_id is ROOT_PARENT:
687
710
                continue
688
 
            if not self._any_contents(children):
 
711
            no_children = True
 
712
            for child_id in children:
 
713
                if self.final_kind(child_id) is not None:
 
714
                    no_children = False
 
715
                    break
 
716
            if no_children:
689
717
                continue
690
 
            for child in children:
691
 
                try:
692
 
                    self.final_kind(child)
693
 
                except NoSuchFile:
694
 
                    continue
695
 
            try:
696
 
                kind = self.final_kind(parent_id)
697
 
            except NoSuchFile:
698
 
                kind = None
 
718
            # There is at least a child, so we need an existing directory to
 
719
            # contain it.
 
720
            kind = self.final_kind(parent_id)
699
721
            if kind is None:
 
722
                # The directory will be deleted
700
723
                conflicts.append(('missing parent', parent_id))
701
724
            elif kind != "directory":
 
725
                # Meh, we need a *directory* to put something in it
702
726
                conflicts.append(('non-directory parent', parent_id))
703
727
        return conflicts
704
728
 
705
 
    def _any_contents(self, trans_ids):
706
 
        """Return true if any of the trans_ids, will have contents."""
707
 
        for trans_id in trans_ids:
708
 
            try:
709
 
                kind = self.final_kind(trans_id)
710
 
            except NoSuchFile:
711
 
                continue
712
 
            return True
713
 
        return False
714
 
 
715
729
    def _set_executability(self, path, trans_id):
716
730
        """Set the executability of versioned files """
717
731
        if supports_executable():
739
753
        return trans_id
740
754
 
741
755
    def new_file(self, name, parent_id, contents, file_id=None,
742
 
                 executable=None):
 
756
                 executable=None, sha1=None):
743
757
        """Convenience method to create files.
744
758
 
745
759
        name is the name of the file to create.
752
766
        trans_id = self._new_entry(name, parent_id, file_id)
753
767
        # TODO: rather than scheduling a set_executable call,
754
768
        # have create_file create the file with the right mode.
755
 
        self.create_file(contents, trans_id)
 
769
        self.create_file(contents, trans_id, sha1=sha1)
756
770
        if executable is not None:
757
771
            self.set_executability(executable, trans_id)
758
772
        return trans_id
781
795
        self.create_symlink(target, trans_id)
782
796
        return trans_id
783
797
 
 
798
    def new_orphan(self, trans_id, parent_id):
 
799
        """Schedule an item to be orphaned.
 
800
 
 
801
        When a directory is about to be removed, its children, if they are not
 
802
        versioned, are moved out of the way: they don't have a parent anymore.
 
803
 
 
804
        :param trans_id: The trans_id of the existing item.
 
805
        :param parent_id: The parent trans_id of the item.
 
806
        """
 
807
        raise NotImplementedError(self.new_orphan)
 
808
 
 
809
    def _get_potential_orphans(self, dir_id):
 
810
        """Find the potential orphans in a directory.
 
811
 
 
812
        A directory can't be safely deleted if there are versioned files in it.
 
813
        If all the contained files are unversioned then they can be orphaned.
 
814
 
 
815
        The 'None' return value means that the directory contains at least one
 
816
        versioned file and should not be deleted.
 
817
 
 
818
        :param dir_id: The directory trans id.
 
819
 
 
820
        :return: A list of the orphan trans ids or None if at least one
 
821
             versioned file is present.
 
822
        """
 
823
        orphans = []
 
824
        # Find the potential orphans, stop if one item should be kept
 
825
        for child_tid in self.by_parent()[dir_id]:
 
826
            if child_tid in self._removed_contents:
 
827
                # The child is removed as part of the transform. Since it was
 
828
                # versioned before, it's not an orphan
 
829
                continue
 
830
            elif self.final_file_id(child_tid) is None:
 
831
                # The child is not versioned
 
832
                orphans.append(child_tid)
 
833
            else:
 
834
                # We have a versioned file here, searching for orphans is
 
835
                # meaningless.
 
836
                orphans = None
 
837
                break
 
838
        return orphans
 
839
 
784
840
    def _affected_ids(self):
785
841
        """Return the set of transform ids affected by the transform"""
786
842
        trans_ids = set(self._removed_id)
845
901
        Return a (name, parent, kind, executable) tuple
846
902
        """
847
903
        to_name = self.final_name(to_trans_id)
848
 
        try:
849
 
            to_kind = self.final_kind(to_trans_id)
850
 
        except NoSuchFile:
851
 
            to_kind = None
 
904
        to_kind = self.final_kind(to_trans_id)
852
905
        to_parent = self.final_file_id(self.final_parent(to_trans_id))
853
906
        if to_trans_id in self._new_executability:
854
907
            to_executable = self._new_executability[to_trans_id]
1182
1235
            if trans_id not in self._new_contents:
1183
1236
                continue
1184
1237
            new_path = self._limbo_name(trans_id)
1185
 
            osutils.rename(old_path, new_path)
 
1238
            os.rename(old_path, new_path)
1186
1239
            for descendant in self._limbo_descendants(trans_id):
1187
1240
                desc_path = self._limbo_files[descendant]
1188
1241
                desc_path = new_path + desc_path[len(old_path):]
1195
1248
            descendants.update(self._limbo_descendants(descendant))
1196
1249
        return descendants
1197
1250
 
1198
 
    def create_file(self, contents, trans_id, mode_id=None):
 
1251
    def create_file(self, contents, trans_id, mode_id=None, sha1=None):
1199
1252
        """Schedule creation of a new file.
1200
1253
 
1201
 
        See also new_file.
1202
 
 
1203
 
        Contents is an iterator of strings, all of which will be written
1204
 
        to the target destination.
1205
 
 
1206
 
        New file takes the permissions of any existing file with that id,
1207
 
        unless mode_id is specified.
 
1254
        :seealso: new_file.
 
1255
 
 
1256
        :param contents: an iterator of strings, all of which will be written
 
1257
            to the target destination.
 
1258
        :param trans_id: TreeTransform handle
 
1259
        :param mode_id: If not None, force the mode of the target file to match
 
1260
            the mode of the object referenced by mode_id.
 
1261
            Otherwise, we will try to preserve mode bits of an existing file.
 
1262
        :param sha1: If the sha1 of this content is already known, pass it in.
 
1263
            We can use it to prevent future sha1 computations.
1208
1264
        """
1209
1265
        name = self._limbo_name(trans_id)
1210
1266
        f = open(name, 'wb')
1217
1273
                f.close()
1218
1274
                os.unlink(name)
1219
1275
                raise
1220
 
 
1221
1276
            f.writelines(contents)
1222
1277
        finally:
1223
1278
            f.close()
1224
1279
        self._set_mtime(name)
1225
1280
        self._set_mode(trans_id, mode_id, S_ISREG)
 
1281
        # It is unfortunate we have to use lstat instead of fstat, but we just
 
1282
        # used utime and chmod on the file, so we need the accurate final
 
1283
        # details.
 
1284
        if sha1 is not None:
 
1285
            self._observed_sha1s[trans_id] = (sha1, osutils.lstat(name))
1226
1286
 
1227
1287
    def _read_file_chunks(self, trans_id):
1228
1288
        cur_file = open(self._limbo_name(trans_id), 'rb')
1287
1347
    def cancel_creation(self, trans_id):
1288
1348
        """Cancel the creation of new file contents."""
1289
1349
        del self._new_contents[trans_id]
 
1350
        if trans_id in self._observed_sha1s:
 
1351
            del self._observed_sha1s[trans_id]
1290
1352
        children = self._limbo_children.get(trans_id)
1291
1353
        # if this is a limbo directory with children, move them before removing
1292
1354
        # the directory
1296
1358
            del self._limbo_children_names[trans_id]
1297
1359
        delete_any(self._limbo_name(trans_id))
1298
1360
 
 
1361
    def new_orphan(self, trans_id, parent_id):
 
1362
        # FIXME: There is no tree config, so we use the branch one (it's weird
 
1363
        # to define it this way as orphaning can only occur in a working tree,
 
1364
        # but that's all we have (for now). It will find the option in
 
1365
        # locations.conf or bazaar.conf though) -- vila 20100916
 
1366
        conf = self._tree.branch.get_config()
 
1367
        conf_var_name = 'bzr.transform.orphan_policy'
 
1368
        orphan_policy = conf.get_user_option(conf_var_name)
 
1369
        default_policy = orphaning_registry.default_key
 
1370
        if orphan_policy is None:
 
1371
            orphan_policy = default_policy
 
1372
        if orphan_policy not in orphaning_registry:
 
1373
            trace.warning('%s (from %s) is not a known policy, defaulting '
 
1374
                'to %s' % (orphan_policy, conf_var_name, default_policy))
 
1375
            orphan_policy = default_policy
 
1376
        handle_orphan = orphaning_registry.get(orphan_policy)
 
1377
        handle_orphan(self, trans_id, parent_id)
 
1378
 
 
1379
 
 
1380
class OrphaningError(errors.BzrError):
 
1381
 
 
1382
    # Only bugs could lead to such exception being seen by the user
 
1383
    internal_error = True
 
1384
    _fmt = "Error while orphaning %s in %s directory"
 
1385
 
 
1386
    def __init__(self, orphan, parent):
 
1387
        errors.BzrError.__init__(self)
 
1388
        self.orphan = orphan
 
1389
        self.parent = parent
 
1390
 
 
1391
 
 
1392
class OrphaningForbidden(OrphaningError):
 
1393
 
 
1394
    _fmt = "Policy: %s doesn't allow creating orphans."
 
1395
 
 
1396
    def __init__(self, policy):
 
1397
        errors.BzrError.__init__(self)
 
1398
        self.policy = policy
 
1399
 
 
1400
 
 
1401
def move_orphan(tt, orphan_id, parent_id):
 
1402
    """See TreeTransformBase.new_orphan.
 
1403
 
 
1404
    This creates a new orphan in the `bzr-orphans` dir at the root of the
 
1405
    `TreeTransform`.
 
1406
 
 
1407
    :param tt: The TreeTransform orphaning `orphan_id`.
 
1408
 
 
1409
    :param orphan_id: The trans id that should be orphaned.
 
1410
 
 
1411
    :param parent_id: The orphan parent trans id.
 
1412
    """
 
1413
    # Add the orphan dir if it doesn't exist
 
1414
    orphan_dir_basename = 'bzr-orphans'
 
1415
    od_id = tt.trans_id_tree_path(orphan_dir_basename)
 
1416
    if tt.final_kind(od_id) is None:
 
1417
        tt.create_directory(od_id)
 
1418
    parent_path = tt._tree_id_paths[parent_id]
 
1419
    # Find a name that doesn't exist yet in the orphan dir
 
1420
    actual_name = tt.final_name(orphan_id)
 
1421
    new_name = tt._available_backup_name(actual_name, od_id)
 
1422
    tt.adjust_path(new_name, od_id, orphan_id)
 
1423
    trace.warning('%s has been orphaned in %s'
 
1424
                  % (joinpath(parent_path, actual_name), orphan_dir_basename))
 
1425
 
 
1426
 
 
1427
def refuse_orphan(tt, orphan_id, parent_id):
 
1428
    """See TreeTransformBase.new_orphan.
 
1429
 
 
1430
    This refuses to create an orphan, letting the caller handle the conflict.
 
1431
    """
 
1432
    raise OrphaningForbidden('never')
 
1433
 
 
1434
 
 
1435
orphaning_registry = registry.Registry()
 
1436
orphaning_registry.register(
 
1437
    'conflict', refuse_orphan,
 
1438
    'Leave orphans in place and create a conflict on the directory.')
 
1439
orphaning_registry.register(
 
1440
    'move', move_orphan,
 
1441
    'Move orphans into the bzr-orphans directory.')
 
1442
orphaning_registry._set_default_key('conflict')
 
1443
 
1299
1444
 
1300
1445
class TreeTransform(DiskTreeTransform):
1301
1446
    """Represent a tree transformation.
1419
1564
    def tree_kind(self, trans_id):
1420
1565
        """Determine the file kind in the working tree.
1421
1566
 
1422
 
        Raises NoSuchFile if the file does not exist
 
1567
        :returns: The file kind or None if the file does not exist
1423
1568
        """
1424
1569
        path = self._tree_id_paths.get(trans_id)
1425
1570
        if path is None:
1426
 
            raise NoSuchFile(None)
 
1571
            return None
1427
1572
        try:
1428
1573
            return file_kind(self._tree.abspath(path))
1429
 
        except OSError, e:
1430
 
            if e.errno != errno.ENOENT:
1431
 
                raise
1432
 
            else:
1433
 
                raise NoSuchFile(path)
 
1574
        except errors.NoSuchFile:
 
1575
            return None
1434
1576
 
1435
1577
    def _set_mode(self, trans_id, mode_id, typefunc):
1436
1578
        """Set the mode of new file contents.
1542
1684
        """
1543
1685
        if not no_conflicts:
1544
1686
            self._check_malformed()
1545
 
        child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
1687
        child_pb = ui.ui_factory.nested_progress_bar()
1546
1688
        try:
1547
1689
            if precomputed_delta is None:
1548
1690
                child_pb.update('Apply phase', 0, 2)
1568
1710
        finally:
1569
1711
            child_pb.finished()
1570
1712
        self._tree.apply_inventory_delta(inventory_delta)
 
1713
        self._apply_observed_sha1s()
1571
1714
        self._done = True
1572
1715
        self.finalize()
1573
1716
        return _TransformResults(modified_paths, self.rename_count)
1575
1718
    def _generate_inventory_delta(self):
1576
1719
        """Generate an inventory delta for the current transform."""
1577
1720
        inventory_delta = []
1578
 
        child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
1721
        child_pb = ui.ui_factory.nested_progress_bar()
1579
1722
        new_paths = self._inventory_altered()
1580
1723
        total_entries = len(new_paths) + len(self._removed_id)
1581
1724
        try:
1605
1748
                if file_id is None:
1606
1749
                    continue
1607
1750
                needs_entry = False
1608
 
                try:
1609
 
                    kind = self.final_kind(trans_id)
1610
 
                except NoSuchFile:
 
1751
                kind = self.final_kind(trans_id)
 
1752
                if kind is None:
1611
1753
                    kind = self._tree.stored_kind(file_id)
1612
1754
                parent_trans_id = self.final_parent(trans_id)
1613
1755
                parent_file_id = new_path_file_ids.get(parent_trans_id)
1644
1786
        """
1645
1787
        tree_paths = list(self._tree_path_ids.iteritems())
1646
1788
        tree_paths.sort(reverse=True)
1647
 
        child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
1789
        child_pb = ui.ui_factory.nested_progress_bar()
1648
1790
        try:
1649
1791
            for num, data in enumerate(tree_paths):
1650
1792
                path, trans_id = data
1657
1799
                      or trans_id in self._new_parent):
1658
1800
                    try:
1659
1801
                        mover.rename(full_path, self._limbo_name(trans_id))
1660
 
                    except OSError, e:
 
1802
                    except errors.TransformRenameFailed, e:
1661
1803
                        if e.errno != errno.ENOENT:
1662
1804
                            raise
1663
1805
                    else:
1679
1821
        modified_paths = []
1680
1822
        new_path_file_ids = dict((t, self.final_file_id(t)) for p, t in
1681
1823
                                 new_paths)
1682
 
        child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
1824
        child_pb = ui.ui_factory.nested_progress_bar()
1683
1825
        try:
1684
1826
            for num, (path, trans_id) in enumerate(new_paths):
1685
1827
                if (num % 10) == 0:
1688
1830
                if trans_id in self._needs_rename:
1689
1831
                    try:
1690
1832
                        mover.rename(self._limbo_name(trans_id), full_path)
1691
 
                    except OSError, e:
 
1833
                    except errors.TransformRenameFailed, e:
1692
1834
                        # We may be renaming a dangling inventory id
1693
1835
                        if e.errno != errno.ENOENT:
1694
1836
                            raise
1695
1837
                    else:
1696
1838
                        self.rename_count += 1
 
1839
                    # TODO: if trans_id in self._observed_sha1s, we should
 
1840
                    #       re-stat the final target, since ctime will be
 
1841
                    #       updated by the change.
1697
1842
                if (trans_id in self._new_contents or
1698
1843
                    self.path_changed(trans_id)):
1699
1844
                    if trans_id in self._new_contents:
1700
1845
                        modified_paths.append(full_path)
1701
1846
                if trans_id in self._new_executability:
1702
1847
                    self._set_executability(path, trans_id)
 
1848
                if trans_id in self._observed_sha1s:
 
1849
                    o_sha1, o_st_val = self._observed_sha1s[trans_id]
 
1850
                    st = osutils.lstat(full_path)
 
1851
                    self._observed_sha1s[trans_id] = (o_sha1, st)
1703
1852
        finally:
1704
1853
            child_pb.finished()
1705
1854
        self._new_contents.clear()
1706
1855
        return modified_paths
1707
1856
 
 
1857
    def _apply_observed_sha1s(self):
 
1858
        """After we have finished renaming everything, update observed sha1s
 
1859
 
 
1860
        This has to be done after self._tree.apply_inventory_delta, otherwise
 
1861
        it doesn't know anything about the files we are updating. Also, we want
 
1862
        to do this as late as possible, so that most entries end up cached.
 
1863
        """
 
1864
        # TODO: this doesn't update the stat information for directories. So
 
1865
        #       the first 'bzr status' will still need to rewrite
 
1866
        #       .bzr/checkout/dirstate. However, we at least don't need to
 
1867
        #       re-read all of the files.
 
1868
        # TODO: If the operation took a while, we could do a time.sleep(3) here
 
1869
        #       to allow the clock to tick over and ensure we won't have any
 
1870
        #       problems. (we could observe start time, and finish time, and if
 
1871
        #       it is less than eg 10% overhead, add a sleep call.)
 
1872
        paths = FinalPaths(self)
 
1873
        for trans_id, observed in self._observed_sha1s.iteritems():
 
1874
            path = paths.get_path(trans_id)
 
1875
            # We could get the file_id, but dirstate prefers to use the path
 
1876
            # anyway, and it is 'cheaper' to determine.
 
1877
            # file_id = self._new_id[trans_id]
 
1878
            self._tree._observed_sha1(None, path, observed)
 
1879
 
1708
1880
 
1709
1881
class TransformPreview(DiskTreeTransform):
1710
1882
    """A TreeTransform for generating preview trees.
1725
1897
    def tree_kind(self, trans_id):
1726
1898
        path = self._tree_id_paths.get(trans_id)
1727
1899
        if path is None:
1728
 
            raise NoSuchFile(None)
 
1900
            return None
1729
1901
        file_id = self._tree.path2id(path)
1730
 
        return self._tree.kind(file_id)
 
1902
        try:
 
1903
            return self._tree.kind(file_id)
 
1904
        except errors.NoSuchFile:
 
1905
            return None
1731
1906
 
1732
1907
    def _set_mode(self, trans_id, mode_id, typefunc):
1733
1908
        """Set the mode of new file contents.
1753
1928
            childpath = joinpath(path, child)
1754
1929
            yield self.trans_id_tree_path(childpath)
1755
1930
 
 
1931
    def new_orphan(self, trans_id, parent_id):
 
1932
        raise NotImplementedError(self.new_orphan)
 
1933
 
1756
1934
 
1757
1935
class _PreviewTree(tree.Tree):
1758
1936
    """Partial implementation of Tree to support show_diff_trees"""
1792
1970
        parent_keys = [(file_id, self._file_revision(t, file_id)) for t in
1793
1971
                       self._iter_parent_trees()]
1794
1972
        vf.add_lines((file_id, tree_revision), parent_keys,
1795
 
                     self.get_file(file_id).readlines())
 
1973
                     self.get_file_lines(file_id))
1796
1974
        repo = self._get_repository()
1797
1975
        base_vf = repo.texts
1798
1976
        if base_vf not in vf.fallback_versionedfiles:
1929
2107
            if (specific_file_ids is not None
1930
2108
                and file_id not in specific_file_ids):
1931
2109
                continue
1932
 
            try:
1933
 
                kind = self._transform.final_kind(trans_id)
1934
 
            except NoSuchFile:
 
2110
            kind = self._transform.final_kind(trans_id)
 
2111
            if kind is None:
1935
2112
                kind = self._transform._tree.stored_kind(file_id)
1936
2113
            new_entry = inventory.make_entry(
1937
2114
                kind,
2169
2346
                path_from_root = self._final_paths.get_path(child_id)
2170
2347
                basename = self._transform.final_name(child_id)
2171
2348
                file_id = self._transform.final_file_id(child_id)
2172
 
                try:
2173
 
                    kind = self._transform.final_kind(child_id)
 
2349
                kind  = self._transform.final_kind(child_id)
 
2350
                if kind is not None:
2174
2351
                    versioned_kind = kind
2175
 
                except NoSuchFile:
 
2352
                else:
2176
2353
                    kind = 'unknown'
2177
2354
                    versioned_kind = self._transform._tree.stored_kind(file_id)
2178
2355
                if versioned_kind == 'directory':
2291
2468
    for num, _unused in enumerate(wt.all_file_ids()):
2292
2469
        if num > 0:  # more than just a root
2293
2470
            raise errors.WorkingTreeAlreadyPopulated(base=wt.basedir)
2294
 
    existing_files = set()
2295
 
    for dir, files in wt.walkdirs():
2296
 
        existing_files.update(f[0] for f in files)
2297
2471
    file_trans_id = {}
2298
 
    top_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
2472
    top_pb = ui.ui_factory.nested_progress_bar()
2299
2473
    pp = ProgressPhase("Build phase", 2, top_pb)
2300
2474
    if tree.inventory.root is not None:
2301
2475
        # This is kind of a hack: we should be altering the root
2314
2488
        pp.next_phase()
2315
2489
        file_trans_id[wt.get_root_id()] = \
2316
2490
            tt.trans_id_tree_file_id(wt.get_root_id())
2317
 
        pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
2491
        pb = ui.ui_factory.nested_progress_bar()
2318
2492
        try:
2319
2493
            deferred_contents = []
2320
2494
            num = 0
2323
2497
                precomputed_delta = []
2324
2498
            else:
2325
2499
                precomputed_delta = None
 
2500
            # Check if tree inventory has content. If so, we populate
 
2501
            # existing_files with the directory content. If there are no
 
2502
            # entries we skip populating existing_files as it's not used.
 
2503
            # This improves performance and avoids unnecessary work on large
 
2504
            # directory trees. (#501307)
 
2505
            if total > 0:
 
2506
                existing_files = set()
 
2507
                for dir, files in wt.walkdirs():
 
2508
                    existing_files.update(f[0] for f in files)
2326
2509
            for num, (tree_path, entry) in \
2327
2510
                enumerate(tree.inventory.iter_entries_by_dir()):
2328
2511
                pb.update("Building tree", num - len(deferred_contents), total)
2358
2541
                    executable = tree.is_executable(file_id, tree_path)
2359
2542
                    if executable:
2360
2543
                        tt.set_executability(executable, trans_id)
2361
 
                    trans_data = (trans_id, tree_path)
 
2544
                    trans_data = (trans_id, tree_path, entry.text_sha1)
2362
2545
                    deferred_contents.append((file_id, trans_data))
2363
2546
                else:
2364
2547
                    file_trans_id[file_id] = new_by_entry(tt, entry, parent_id,
2380
2563
            precomputed_delta = None
2381
2564
        conflicts = cook_conflicts(raw_conflicts, tt)
2382
2565
        for conflict in conflicts:
2383
 
            warning(conflict)
 
2566
            trace.warning(conflict)
2384
2567
        try:
2385
2568
            wt.add_conflicts(conflicts)
2386
2569
        except errors.UnsupportedOperation:
2409
2592
        unchanged = dict(unchanged)
2410
2593
        new_desired_files = []
2411
2594
        count = 0
2412
 
        for file_id, (trans_id, tree_path) in desired_files:
 
2595
        for file_id, (trans_id, tree_path, text_sha1) in desired_files:
2413
2596
            accelerator_path = unchanged.get(file_id)
2414
2597
            if accelerator_path is None:
2415
 
                new_desired_files.append((file_id, (trans_id, tree_path)))
 
2598
                new_desired_files.append((file_id,
 
2599
                    (trans_id, tree_path, text_sha1)))
2416
2600
                continue
2417
2601
            pb.update('Adding file contents', count + offset, total)
2418
2602
            if hardlink:
2425
2609
                    contents = filtered_output_bytes(contents, filters,
2426
2610
                        ContentFilterContext(tree_path, tree))
2427
2611
                try:
2428
 
                    tt.create_file(contents, trans_id)
 
2612
                    tt.create_file(contents, trans_id, sha1=text_sha1)
2429
2613
                finally:
2430
2614
                    try:
2431
2615
                        contents.close()
2434
2618
                        pass
2435
2619
            count += 1
2436
2620
        offset += count
2437
 
    for count, ((trans_id, tree_path), contents) in enumerate(
 
2621
    for count, ((trans_id, tree_path, text_sha1), contents) in enumerate(
2438
2622
            tree.iter_files_bytes(new_desired_files)):
2439
2623
        if wt.supports_content_filtering():
2440
2624
            filters = wt._content_filter_stack(tree_path)
2441
2625
            contents = filtered_output_bytes(contents, filters,
2442
2626
                ContentFilterContext(tree_path, tree))
2443
 
        tt.create_file(contents, trans_id)
 
2627
        tt.create_file(contents, trans_id, sha1=text_sha1)
2444
2628
        pb.update('Adding file contents', count + offset, total)
2445
2629
 
2446
2630
 
2448
2632
    for child in tt.iter_tree_children(old_parent):
2449
2633
        tt.adjust_path(tt.final_name(child), new_parent, child)
2450
2634
 
 
2635
 
2451
2636
def _reparent_transform_children(tt, old_parent, new_parent):
2452
2637
    by_parent = tt.by_parent()
2453
2638
    for child in by_parent[old_parent]:
2454
2639
        tt.adjust_path(tt.final_name(child), new_parent, child)
2455
2640
    return by_parent[old_parent]
2456
2641
 
 
2642
 
2457
2643
def _content_match(tree, entry, file_id, kind, target_path):
2458
2644
    if entry.kind != kind:
2459
2645
        return False
2460
2646
    if entry.kind == "directory":
2461
2647
        return True
2462
2648
    if entry.kind == "file":
2463
 
        if tree.get_file(file_id).read() == file(target_path, 'rb').read():
2464
 
            return True
 
2649
        f = file(target_path, 'rb')
 
2650
        try:
 
2651
            if tree.get_file_text(file_id) == f.read():
 
2652
                return True
 
2653
        finally:
 
2654
            f.close()
2465
2655
    elif entry.kind == "symlink":
2466
2656
        if tree.get_symlink_target(file_id) == os.readlink(target_path):
2467
2657
            return True
2519
2709
        raise errors.BadFileKindError(name, kind)
2520
2710
 
2521
2711
 
2522
 
@deprecated_function(deprecated_in((1, 9, 0)))
2523
 
def create_by_entry(tt, entry, tree, trans_id, lines=None, mode_id=None):
2524
 
    """Create new file contents according to an inventory entry.
2525
 
 
2526
 
    DEPRECATED.  Use create_from_tree instead.
2527
 
    """
2528
 
    if entry.kind == "file":
2529
 
        if lines is None:
2530
 
            lines = tree.get_file(entry.file_id).readlines()
2531
 
        tt.create_file(lines, trans_id, mode_id=mode_id)
2532
 
    elif entry.kind == "symlink":
2533
 
        tt.create_symlink(tree.get_symlink_target(entry.file_id), trans_id)
2534
 
    elif entry.kind == "directory":
2535
 
        tt.create_directory(trans_id)
2536
 
 
2537
 
 
2538
2712
def create_from_tree(tt, trans_id, tree, file_id, bytes=None,
2539
2713
    filter_tree_path=None):
2540
2714
    """Create new file contents according to tree contents.
2571
2745
        tt.set_executability(entry.executable, trans_id)
2572
2746
 
2573
2747
 
 
2748
@deprecated_function(deprecated_in((2, 3, 0)))
2574
2749
def get_backup_name(entry, by_parent, parent_trans_id, tt):
2575
2750
    return _get_backup_name(entry.name, by_parent, parent_trans_id, tt)
2576
2751
 
2577
2752
 
 
2753
@deprecated_function(deprecated_in((2, 3, 0)))
2578
2754
def _get_backup_name(name, by_parent, parent_trans_id, tt):
2579
2755
    """Produce a backup-style name that appears to be available"""
2580
2756
    def name_gen():
2629
2805
                unversioned_filter=working_tree.is_ignored)
2630
2806
            delta.report_changes(tt.iter_changes(), change_reporter)
2631
2807
        for conflict in conflicts:
2632
 
            warning(conflict)
 
2808
            trace.warning(conflict)
2633
2809
        pp.next_phase()
2634
2810
        tt.apply()
2635
2811
        working_tree.set_merge_modified(merge_modified)
2643
2819
def _prepare_revert_transform(working_tree, target_tree, tt, filenames,
2644
2820
                              backups, pp, basis_tree=None,
2645
2821
                              merge_modified=None):
2646
 
    child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
2822
    child_pb = ui.ui_factory.nested_progress_bar()
2647
2823
    try:
2648
2824
        if merge_modified is None:
2649
2825
            merge_modified = working_tree.merge_modified()
2652
2828
                                      merge_modified, basis_tree)
2653
2829
    finally:
2654
2830
        child_pb.finished()
2655
 
    child_pb = bzrlib.ui.ui_factory.nested_progress_bar()
 
2831
    child_pb = ui.ui_factory.nested_progress_bar()
2656
2832
    try:
2657
2833
        raw_conflicts = resolve_conflicts(tt, child_pb,
2658
2834
            lambda t, c: conflict_pass(t, c, target_tree))
2701
2877
                        tt.delete_contents(trans_id)
2702
2878
                    elif kind[1] is not None:
2703
2879
                        parent_trans_id = tt.trans_id_file_id(parent[0])
2704
 
                        by_parent = tt.by_parent()
2705
 
                        backup_name = _get_backup_name(name[0], by_parent,
2706
 
                                                       parent_trans_id, tt)
 
2880
                        backup_name = tt._available_backup_name(
 
2881
                            name[0], parent_trans_id)
2707
2882
                        tt.adjust_path(backup_name, parent_trans_id, trans_id)
2708
2883
                        new_trans_id = tt.create_path(name[0], parent_trans_id)
2709
2884
                        if versioned == (True, True):
2832
3007
 
2833
3008
        elif c_type == 'missing parent':
2834
3009
            trans_id = conflict[1]
2835
 
            try:
2836
 
                tt.cancel_deletion(trans_id)
2837
 
                new_conflicts.add(('deleting parent', 'Not deleting',
2838
 
                                   trans_id))
2839
 
            except KeyError:
 
3010
            if trans_id in tt._removed_contents:
 
3011
                cancel_deletion = True
 
3012
                orphans = tt._get_potential_orphans(trans_id)
 
3013
                if orphans:
 
3014
                    cancel_deletion = False
 
3015
                    # All children are orphans
 
3016
                    for o in orphans:
 
3017
                        try:
 
3018
                            tt.new_orphan(o, trans_id)
 
3019
                        except OrphaningError:
 
3020
                            # Something bad happened so we cancel the directory
 
3021
                            # deletion which will leave it in place with a
 
3022
                            # conflict. The user can deal with it from there.
 
3023
                            # Note that this also catches the case where we don't
 
3024
                            # want to create orphans and leave the directory in
 
3025
                            # place.
 
3026
                            cancel_deletion = True
 
3027
                            break
 
3028
                if cancel_deletion:
 
3029
                    # Cancel the directory deletion
 
3030
                    tt.cancel_deletion(trans_id)
 
3031
                    new_conflicts.add(('deleting parent', 'Not deleting',
 
3032
                                       trans_id))
 
3033
            else:
2840
3034
                create = True
2841
3035
                try:
2842
3036
                    tt.final_name(trans_id)
2867
3061
            file_id = tt.inactive_file_id(conflict[1])
2868
3062
            # special-case the other tree root (move its children instead)
2869
3063
            if path_tree and file_id in path_tree:
2870
 
                if path_tree.inventory[file_id].parent_id is None:
 
3064
                if path_tree.path2id('') == file_id:
 
3065
                    # This is the root entry, skip it
2871
3066
                    continue
2872
3067
            tt.version_file(file_id, conflict[1])
2873
3068
            new_conflicts.add((c_type, 'Versioned directory', conflict[1]))
2925
3120
    def rename(self, from_, to):
2926
3121
        """Rename a file from one path to another."""
2927
3122
        try:
2928
 
            osutils.rename(from_, to)
 
3123
            os.rename(from_, to)
2929
3124
        except OSError, e:
2930
3125
            if e.errno in (errno.EEXIST, errno.ENOTEMPTY):
2931
3126
                raise errors.FileExists(to, str(e))
2932
 
            raise
 
3127
            # normal OSError doesn't include filenames so it's hard to see where
 
3128
            # the problem is, see https://bugs.launchpad.net/bzr/+bug/491763
 
3129
            raise errors.TransformRenameFailed(from_, to, str(e), e.errno)
2933
3130
        self.past_renames.append((from_, to))
2934
3131
 
2935
3132
    def pre_delete(self, from_, to):
2945
3142
    def rollback(self):
2946
3143
        """Reverse all renames that have been performed"""
2947
3144
        for from_, to in reversed(self.past_renames):
2948
 
            osutils.rename(to, from_)
 
3145
            try:
 
3146
                os.rename(to, from_)
 
3147
            except OSError, e:
 
3148
                raise errors.TransformRenameFailed(to, from_, str(e), e.errno)
2949
3149
        # after rollback, don't reuse _FileMover
2950
3150
        past_renames = None
2951
3151
        pending_deletions = None