/brz/remove-bazaar

To get this branch, use:
bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
3350.6.10 by Martin Pool
VersionedFiles review cleanups
1
# Copyright (C) 2005, 2006, 2007, 2008 Canonical Ltd
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
17
"""WorkingTree4 format and implementation.
18
19
WorkingTree4 provides the dirstate based working tree logic.
20
21
To get a WorkingTree, call bzrdir.open_workingtree() or
22
WorkingTree.open(dir).
23
"""
24
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
25
from cStringIO import StringIO
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
26
import os
2255.2.138 by John Arbash Meinel
implement several new WorkingTree.move() tests
27
import sys
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
28
29
from bzrlib.lazy_import import lazy_import
30
lazy_import(globals(), """
31
from bisect import bisect_left
32
import collections
33
from copy import deepcopy
34
import errno
35
import itertools
36
import operator
37
import stat
38
from time import time
39
import warnings
40
41
import bzrlib
42
from bzrlib import (
43
    bzrdir,
2255.2.114 by John Arbash Meinel
_get_inventory: 2.09 => 1.93s by tweaking some of the inner _generate_inventory loops
44
    cache_utf8,
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
45
    conflicts as _mod_conflicts,
2745.1.1 by Robert Collins
Add a number of -Devil checkpoints.
46
    debug,
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
47
    delta,
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
48
    dirstate,
49
    errors,
50
    generate_ids,
51
    globbing,
52
    ignores,
53
    merge,
54
    osutils,
2598.5.2 by Aaron Bentley
Got all tests passing with Branch returning 'null:' for null revision
55
    revision as _mod_revision,
2255.2.117 by Robert Collins
Add an InterDirStateTree InterTree optimiser.
56
    revisiontree,
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
57
    textui,
2745.1.2 by Robert Collins
Ensure mutter_callsite is not directly called on a lazy_load object, to make the stacklevel parameter work correctly.
58
    trace,
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
59
    transform,
60
    urlutils,
61
    xml5,
62
    xml6,
63
    )
64
import bzrlib.branch
65
from bzrlib.transport import get_transport
66
import bzrlib.ui
67
""")
68
69
from bzrlib import symbol_versioning
70
from bzrlib.decorators import needs_read_lock, needs_write_lock
2255.2.74 by Robert Collins
Minor performance optimisation in _generate_inventory by avoiding normalisation checks and just using a factory to create the inventory entries.
71
from bzrlib.inventory import InventoryEntry, Inventory, ROOT_ID, entry_factory
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
72
from bzrlib.lockable_files import LockableFiles, TransportLock
73
from bzrlib.lockdir import LockDir
74
import bzrlib.mutabletree
75
from bzrlib.mutabletree import needs_tree_write_lock
76
from bzrlib.osutils import (
2255.2.202 by Martin Pool
WorkingTree_4.kind should report tree-references if they're
77
    file_kind,
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
78
    isdir,
79
    normpath,
80
    pathjoin,
81
    rand_chars,
82
    realpath,
83
    safe_unicode,
84
    splitpath,
85
    )
86
from bzrlib.trace import mutter, note
87
from bzrlib.transport.local import LocalTransport
2255.2.117 by Robert Collins
Add an InterDirStateTree InterTree optimiser.
88
from bzrlib.tree import InterTree
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
89
from bzrlib.progress import DummyProgress, ProgressPhase
90
from bzrlib.revision import NULL_REVISION, CURRENT_REVISION
91
from bzrlib.rio import RioReader, rio_file, Stanza
92
from bzrlib.symbol_versioning import (deprecated_passed,
93
        deprecated_method,
94
        deprecated_function,
95
        DEPRECATED_PARAMETER,
96
        )
97
from bzrlib.tree import Tree
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
98
from bzrlib.workingtree import WorkingTree, WorkingTree3, WorkingTreeFormat3
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
99
100
2363.1.1 by John Arbash Meinel
Catch Windows ERROR_DIRECTORY when doing os.listdir('file')
101
# Windows system error codes.  They are defined in pywin32.winerror, but we
# don't want a strong dependency on pywin32 for just a couple of integers, so
# the values are spelled out here.
ERROR_PATH_NOT_FOUND = 3
# This is the Windows equivalent of ENOTDIR.
ERROR_DIRECTORY = 267
106
107
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
108
class WorkingTree4(WorkingTree3):
109
    """This is the Format 4 working tree.
110
111
    This differs from WorkingTree3 by:
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
112
     - Having a consolidated internal dirstate, stored in a
113
       randomly-accessible sorted file on disk.
114
     - Not having a regular inventory attribute.  One can be synthesized 
115
       on demand but this is expensive and should be avoided.
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
116
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
117
    This is new in bzr 0.15.
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
118
    """
119
120
    def __init__(self, basedir,
                 branch,
                 _control_files=None,
                 _format=None,
                 _bzrdir=None):
        """Set up a dirstate-backed working tree rooted at basedir.

        :param basedir: Path of the tree root; it is converted with
            safe_unicode() and stored in realpath() form.
        :param branch: The branch for this basedir.  It is stored as given;
            nothing here opens or cross-checks it.
        :param _control_files: Control files object for the tree.  Its
            ``_transport`` attribute is read unconditionally, so despite the
            default it has to be supplied.
        :param _format: The working tree format object to record.
        :param _bzrdir: The bzrdir object to record.
        """
        self._format = _format
        self.bzrdir = _bzrdir
        unicode_basedir = safe_unicode(basedir)
        mutter("opening working tree %r", unicode_basedir)
        self._branch = branch
        self.basedir = realpath(unicode_basedir)
        self._control_files = _control_files
        self._transport = self._control_files._transport
        self._dirty = None
        # The dirstate and the synthesized inventory are only populated
        # while a read or write lock is held; otherwise they stay None.
        self._dirstate = None
        self._inventory = None
        self._setup_directory_is_tree_reference()
        self._detect_case_handling()
        self._rules_searcher = None
        self.views = self._make_views()
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
153
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
154
    @needs_tree_write_lock
    def _add(self, files, ids, kinds):
        """See MutableTree._add.

        Paths that already have a file id are skipped, except that a root
        still carrying ROOT_ID is given a freshly generated id.
        """
        state = self.current_dirstate()
        for path, file_id, kind in zip(files, ids, kinds):
            path = path.strip('/')
            if not self.path2id(path):
                if file_id is None:
                    file_id = generate_ids.gen_file_id(path)
                # Deliberately record no cached stat or sha1: adding must
                # not require the file to exist, and the values are gathered
                # on first access.
                state.add(path, file_id, kind, None, '')
            elif path == '' and self.path2id(path) == ROOT_ID:
                # special case: the tree root gets a real generated id.
                state.set_path_id('', generate_ids.gen_file_id(path))
        self._make_dirty(reset_inventory=True)
172
173
    def _make_dirty(self, reset_inventory):
174
        """Make the tree state dirty.
175
176
        :param reset_inventory: True if the cached inventory should be removed
177
            (presuming there is one).
178
        """
2255.2.16 by Robert Collins
Implement WorkingTreeFormat4._write_inventory for better compatability with existing code, letting more test_test_trees pass, now up to test_tree_with_subdirs_and_all_content_types.
179
        self._dirty = True
2255.7.67 by Robert Collins
Fix test_inv - make setting WorkingTree4._dirty use a helper to reduce code duplication, and reset the inventory when we dont manually update it, if it exists.
180
        if reset_inventory and self._inventory is not None:
181
            self._inventory = None
2255.2.12 by Robert Collins
Partial implementation of WorkingTree4._add.
182
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
183
    @needs_tree_write_lock
    def add_reference(self, sub_tree):
        """Add sub_tree as a tree reference using the standard implementation.

        The standard implementation calls back into self._add.  The
        reference_revision is not stored in the working dirstate; it is
        only recorded at the moment of commit.
        """
        self._add_reference(sub_tree)
190
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
191
    def break_lock(self):
        """Break a lock if one is present from another instance.

        Uses the ui factory to ask for confirmation if the lock may be from
        an active process.

        This will probe the repository for its lock as well.

        :raises errors.LockActive: if this instance holds the dirstate lock
            itself, or a write lock on the dirstate cannot be obtained.
        """
        # Remember whether the dirstate object was created only for this
        # probe, so that it can be dropped again afterwards.
        clear = self._dirstate is None
        try:
            state = self._current_dirstate()
            if state._lock_token is not None:
                # we already have it locked; we cannot break our own lock.
                raise errors.LockActive(self.basedir)
            try:
                # A write lock is required to break locks anyway, so taking
                # one doubles as the "is anybody still alive" check.
                state.lock_write()
            except errors.LockContention:
                # OS locks fail while the owning process is still live.
                # TODO: get the locked lockdir info and give to the user to
                # assist in debugging.
                raise errors.LockActive(self.basedir)
            state.unlock()
        finally:
            if clear:
                self._dirstate = None
        self._control_files.break_lock()
        self.branch.break_lock()
227
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
228
    def _comparison_data(self, entry, path):
        """Return (kind, executable, stat_value) as WorkingTree3 does.

        The only difference is that a 'directory' is reported as a
        'tree-reference' when the repository supports tree references and
        the directory is one -- see also kind().
        """
        base_data = WorkingTree3._comparison_data(self, entry, path)
        kind, executable, stat_value = base_data
        if self._repo_supports_tree_reference and kind == 'directory':
            # it looks like a plain directory, but may really be a reference
            if self._directory_is_tree_reference(path):
                kind = 'tree-reference'
        return kind, executable, stat_value
238
2255.7.74 by Robert Collins
Test adding of roots to trees, it was broken on WorkingTree4.
239
    @needs_write_lock
    def commit(self, message=None, revprops=None, *args, **kwargs):
        """Commit via WorkingTree3.commit, then mark the tree dirty.

        Committing can change the current versioned list by doing deletes,
        so the tree is flagged dirty and any cached inventory is dropped.

        :return: Whatever WorkingTree3.commit returns.
        """
        commit_result = WorkingTree3.commit(
            self, message, revprops, *args, **kwargs)
        self._make_dirty(reset_inventory=True)
        return commit_result
246
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
247
    def current_dirstate(self):
        """Return the current dirstate object, insisting on a held lock.

        This is not part of the tree interface and only exposed for ease of
        testing.

        The lock check is delegated to self._must_be_locked(), which is
        expected to raise (historically documented as
        errors.NotWriteLocked) when the tree is not in a lock.
        """
        self._must_be_locked()
        state = self._current_dirstate()
        return state
257
258
    def _current_dirstate(self):
259
        """Internal function that does not check lock status.
2255.10.2 by John Arbash Meinel
Update to dirstate locking.
260
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
261
        This is needed for break_lock which also needs the dirstate.
262
        """
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
263
        if self._dirstate is not None:
264
            return self._dirstate
265
        local_path = self.bzrdir.get_workingtree_transport(None
266
            ).local_abspath('dirstate')
267
        self._dirstate = dirstate.DirState.on_file(local_path)
268
        return self._dirstate
269
2255.2.81 by Robert Collins
WorkingTree4: Implement filter_unversioned_files to use dirstate bisection.
270
    def filter_unversioned_files(self, paths):
        """Return the subset of paths that are not versioned in this tree.

        :param paths: Iterable of unicode paths to check.
        :return: set of the paths that the dirstate does not report as
            versioned.
        """
        # TODO: make a generic multi-bisect routine roughly that should list
        # the paths, then process one half at a time recursively, and feed the
        # results of each bisect in further still
        ordered_paths = sorted(paths)
        unversioned = set()
        state = self.current_dirstate()
        # TODO we want a paths_to_dirblocks helper I think
        for candidate in ordered_paths:
            dirname, basename = os.path.split(candidate.encode('utf8'))
            lookup = state._get_block_entry_index(dirname, basename, 0)
            _block, _entry, _dir_present, is_versioned = lookup
            if is_versioned:
                continue
            unversioned.add(candidate)
        return unversioned
289
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
290
    def flush(self):
        """Write all cached data to disk.

        Saves the dirstate, drops the cached inventory and clears the dirty
        flag.

        :raises errors.NotWriteLocked: if the control files are not locked
            in 'w' mode.
        """
        lock_mode = self._control_files._lock_mode
        if lock_mode != 'w':
            raise errors.NotWriteLocked(self)
        state = self.current_dirstate()
        state.save()
        self._inventory = None
        self._dirty = False
297
2323.4.2 by Robert Collins
Fix the behaviour of dirstate optimised iter_changes recursing its disk iterator into subtrees inappropriately.
298
    @needs_tree_write_lock
    def _gather_kinds(self, files, kinds):
        """See MutableTree._gather_kinds.

        Every None slot in kinds is filled in place with self._kind() of
        the path at the same position in files.
        """
        for index, path in enumerate(files):
            if kinds[index] is not None:
                continue
            kinds[index] = self._kind(path)
304
2255.2.34 by Robert Collins
Fix WorkingTree4 parent_ids logic to use the dirstate to answer parent ids list queries.
305
    def _generate_inventory(self):
        """Build an Inventory from the dirstate and store it on self.

        This is relatively expensive: the entire dirstate has to be walked.
        Ideally callers would not need it, and it could be deprecated.

        :raises AssertionError: if the root entry is not a directory, an
            entry has an unknown kind, a tree-reference is found in a
            repository that does not support them, or a file id / name is
            seen twice.
        """
        state = self.current_dirstate()
        state._read_dirblocks_if_needed()
        root_key, root_entry = self._get_entry(path='')
        root_id = root_key[2]
        if root_entry[0][0] != 'd': # the root must be a directory
            raise AssertionError(root_entry)
        inv = Inventory(root_id=root_id)
        # Bind frequently used lookups to locals: this loop is hot.
        kind_for_minikind = dirstate.DirState._minikind_to_kind
        make_entry = entry_factory
        decode_utf8 = cache_utf8._utf8_decode
        entries_by_id = inv._byid
        # we could do this straight out of the dirstate; it might be fast
        # and should be profiled - RBC 20070216
        dir_entries = {'' : inv.root}
        for block in state._dirblocks[1:]: # skip the root
            dirname = block[0]
            if dirname not in dir_entries:
                # all the paths in this block are not versioned in this tree
                continue
            parent_ie = dir_entries[dirname]
            for key, entry in block[1]:
                minikind, link_or_sha1, _size, executable, _stat = entry[0]
                if minikind == 'a' or minikind == 'r':
                    # absent or relocated: a parent tree only entry
                    continue
                name = key[1]
                name_unicode = decode_utf8(name)[0]
                file_id = key[2]
                kind = kind_for_minikind[minikind]
                inv_entry = make_entry[kind](file_id, name_unicode,
                                             parent_ie.file_id)
                if kind == 'file':
                    # This is only needed on win32, where this is the only
                    # way we know the executable bit.  text_size and
                    # text_sha1 are not set: not strictly needed for a
                    # working tree.
                    inv_entry.executable = executable
                elif kind == 'directory':
                    # register this directory as a possible parent for the
                    # blocks that follow.
                    child_dir = (dirname + '/' + name).strip('/')
                    dir_entries[child_dir] = inv_entry
                elif kind == 'tree-reference':
                    if not self._repo_supports_tree_reference:
                        raise AssertionError(
                            "repository of %r "
                            "doesn't support tree references "
                            "required by entry %r"
                            % (self, name))
                    inv_entry.reference_revision = link_or_sha1 or None
                elif kind != 'symlink':
                    raise AssertionError("unknown kind %r" % kind)
                # These checks cost us around 40ms on a 55k entry tree
                if file_id in entries_by_id:
                    raise AssertionError('file_id %s already in'
                        ' inventory as %s'
                        % (file_id, entries_by_id[file_id]))
                if name_unicode in parent_ie.children:
                    raise AssertionError('name %r already in parent'
                        % (name_unicode,))
                # Update the inventory structures directly rather than going
                # through inv.add().
                entries_by_id[file_id] = inv_entry
                parent_ie.children[name_unicode] = inv_entry
        self._inventory = inv
376
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
377
    def _get_entry(self, file_id=None, path=None):
378
        """Get the dirstate row for file_id or path.
379
380
        If either file_id or path is supplied, it is used as the key to lookup.
381
        If both are supplied, the fastest lookup is used, and an error is
382
        raised if they do not both point at the same row.
383
        
384
        :param file_id: An optional unicode file_id to be looked up.
385
        :param path: An optional unicode path to be looked up.
386
        :return: The dirstate row tuple for path/file_id, or (None, None)
387
        """
388
        if file_id is None and path is None:
389
            raise errors.BzrError('must supply file_id or path')
390
        state = self.current_dirstate()
391
        if path is not None:
392
            path = path.encode('utf8')
393
        return state._get_entry(0, fileid_utf8=file_id, path_utf8=path)
394
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
395
    def get_file_sha1(self, file_id, path=None, stat_value=None):
2255.2.88 by Robert Collins
Significant steps back to operation.
396
        # check file id is valid unconditionally.
2255.10.1 by John Arbash Meinel
Update WorkingTree4 so that it doesn't use a HashCache,
397
        entry = self._get_entry(file_id=file_id, path=path)
1551.15.56 by Aaron Bentley
Raise NoSuchId when get_file_sha1 is invoked with a baed file id
398
        if entry[0] is None:
399
            raise errors.NoSuchId(self, file_id)
2255.2.73 by Robert Collins
50% speedup in the dirstate->inventory conversion logic by caching the parent ids as we walk the tree. Some further work would be to maintain a stack of parents as we know we visit depth first.
400
        if path is None:
2255.10.1 by John Arbash Meinel
Update WorkingTree4 so that it doesn't use a HashCache,
401
            path = pathjoin(entry[0][0], entry[0][1]).decode('utf8')
402
403
        file_abspath = self.abspath(path)
404
        state = self.current_dirstate()
2485.3.3 by John Arbash Meinel
Avoid extra work in inner 'DirState.update_entry' code.
405
        if stat_value is None:
2499.3.1 by Aaron Bentley
Fix Workingtree4.get_file_sha1 on missing files
406
            try:
407
                stat_value = os.lstat(file_abspath)
408
            except OSError, e:
409
                if e.errno == errno.ENOENT:
410
                    return None
411
                else:
412
                    raise
2255.10.3 by John Arbash Meinel
(broken) Change get_sha1_for_entry into update_entry
413
        link_or_sha1 = state.update_entry(entry, file_abspath,
414
                                          stat_value=stat_value)
415
        if entry[1][0][0] == 'f':
416
            return link_or_sha1
417
        return None
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
418
2255.2.17 by Robert Collins
tweaks - finishes off all the test_test_trees tests for dirstate.
419
    def _get_inventory(self):
        """Get the inventory for the tree. This is only valid within a lock.

        The inventory is generated on first access and the cached object is
        returned on later calls.
        """
        if 'evil' in debug.debug_flags:
            # Called directly from this frame so the stack level of 2 keeps
            # pointing at whoever asked for the inventory.
            trace.mutter_callsite(2,
                "accessing .inventory forces a size of tree translation.")
        if self._inventory is None:
            # Nothing cached yet: building it requires the tree to be locked.
            self._must_be_locked()
            self._generate_inventory()
        return self._inventory
429
430
    # Read-only attribute; every access goes through _get_inventory.
    inventory = property(_get_inventory, doc="Inventory of this Tree")
432
433
    @needs_read_lock
    def get_parent_ids(self):
        """See Tree.get_parent_ids.

        This implementation requests the ids list from the dirstate file.

        :return: Whatever the current dirstate's get_parent_ids() returns.
        """
        state = self.current_dirstate()
        return state.get_parent_ids()
440
2255.2.226 by Robert Collins
Get merge_nested finally working: change nested tree iterators to take file_ids, and ensure the right branch is connected to in the merge logic. May not be suitable for shared repositories yet.
441
    def get_reference_revision(self, file_id, path=None):
        """Return the revision a nested tree is currently at.

        The referenced tree's revision is whatever is currently there: the
        nested tree is opened and asked for its last revision.

        :param file_id: The file id of the tree reference.
        :param path: Optional path of the reference, passed through to
            get_nested_tree.
        :return: The nested tree's last_revision().
        """
        nested_tree = self.get_nested_tree(file_id, path)
        return nested_tree.last_revision()
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
444
2255.2.226 by Robert Collins
Get merge_nested finally working: change nested tree iterators to take file_ids, and ensure the right branch is connected to in the merge logic. May not be suitable for shared repositories yet.
445
    def get_nested_tree(self, file_id, path=None):
        """Open the working tree located at a nested tree's path.

        :param file_id: The file id of the nested tree; only consulted when
            no path is given.
        :param path: Optional tree-relative path of the nested tree.
        :return: The result of WorkingTree.open on the absolute path.
        """
        nested_path = path
        if nested_path is None:
            nested_path = self.id2path(file_id)
        # NOTE: a caller-supplied path is trusted as is; it is not checked
        # against file_id.
        return WorkingTree.open(self.abspath(nested_path))
450
2255.2.34 by Robert Collins
Fix WorkingTree4 parent_ids logic to use the dirstate to answer parent ids list queries.
451
    @needs_read_lock
    def get_root_id(self):
        """Return the id of this tree's root.

        The root is looked up in the dirstate under the empty path; the id
        is the third element of the entry's key.
        """
        root_entry = self._get_entry(path='')
        root_key = root_entry[0]
        return root_key[2]
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
455
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
456
    def has_id(self, file_id):
        """Return True if file_id is in the dirstate and exists on disk.

        :param file_id: The file id to look for.
        :return: False when the dirstate has no entry for file_id; otherwise
            whether the entry's path exists under the tree's basedir, as
            reported by osutils.lexists.
        """
        # _get_entry fetches the current dirstate itself, so no separate
        # (and previously unused) lookup of it is needed here.
        row, parents = self._get_entry(file_id=file_id)
        if row is None:
            return False
        # row[0] and row[1] are the utf8 dirname and basename of the entry.
        return osutils.lexists(pathjoin(
                    self.basedir, row[0].decode('utf8'), row[1].decode('utf8')))
463
2255.2.15 by Robert Collins
Dirstate - truncate state file fixing bug in saving a smaller file, get more tree_implementation tests passing.
464
    @needs_read_lock
    def id2path(self, file_id):
        """Convert a file-id to a path.

        :param file_id: The file id to look up in the dirstate.
        :return: The entry's dirname and basename joined together and
            decoded from utf8.
        :raises errors.NoSuchId: If the dirstate has no entry for file_id.
        """
        # _get_entry fetches the current dirstate itself, so no separate
        # (and previously unused) lookup of it is needed here.
        entry = self._get_entry(file_id=file_id)
        if entry == (None, None):
            raise errors.NoSuchId(tree=self, file_id=file_id)
        path_utf8 = osutils.pathjoin(entry[0][0], entry[0][1])
        return path_utf8.decode('utf8')
2255.2.15 by Robert Collins
Dirstate - truncate state file fixing bug in saving a smaller file, get more tree_implementation tests passing.
473
2911.5.4 by John Arbash Meinel
Switch around to properly look up the executable bit in the basis.
474
    def _is_executable_from_path_and_stat_from_basis(self, path, stat_result):
        """Report the executable flag stored in the dirstate for path.

        :param path: The path to look up in the dirstate.
        :param stat_result: Accepted but not used by this implementation.
        :return: False when the dirstate has no entry for path; otherwise
            the fourth field of the entry's first tree-details record.
        """
        entry = self._get_entry(path=path)
        if entry != (None, None):
            return entry[1][0][3] # Executable?
        # Missing entries are not executable
        return False
479
2325.3.2 by John Arbash Meinel
Implement is_executable for WorkingTree4 and win32
480
    # Two implementations of is_executable are provided; which one is defined
    # depends on whether osutils reports support for the executable bit.
    if osutils.supports_executable():
        def is_executable(self, file_id, path=None):
            """Test if a file is executable or not.

            The answer is taken from the mode of the file on disk: it must
            be a regular file with the S_IEXEC bit set.

            Note: The caller is expected to take a read-lock before calling
            this.
            """
            self._must_be_locked()
            if not path:
                path = self.id2path(file_id)
            st_mode = os.lstat(self.abspath(path)).st_mode
            if not stat.S_ISREG(st_mode):
                return False
            return bool(stat.S_IEXEC & st_mode)
    else:
        def is_executable(self, file_id, path=None):
            """Test if a file is executable or not.

            The answer is taken from the flag stored in the dirstate entry;
            a file with no entry is reported as not executable.

            Note: The caller is expected to take a read-lock before calling
            this.
            """
            entry = self._get_entry(file_id=file_id, path=path)
            if entry != (None, None):
                return entry[1][0][3]
            return False

        # Path-and-stat based queries are answered from the dirstate too.
        _is_executable_from_path_and_stat = \
            _is_executable_from_path_and_stat_from_basis
504
3146.8.16 by Aaron Bentley
Updates from review
505
    def all_file_ids(self):
        """See Tree.all_file_ids.

        The tree must be locked.  Unlike __iter__, no check is made that the
        files exist on disk.

        :return: A set of the file ids of every dirstate entry whose first
            tree-details record is neither absent ('a') nor relocated ('r').
        """
        self._must_be_locked()
        entries = self.current_dirstate()._iter_entries()
        return set(key[2] for key, tree_details in entries
                   if tree_details[0][0] not in ('a', 'r'))
3146.8.2 by Aaron Bentley
Introduce iter_all_file_ids, to avoid hitting Inventory for this case
514
2255.2.15 by Robert Collins
Dirstate - truncate state file fixing bug in saving a smaller file, get more tree_implementation tests passing.
515
    @needs_read_lock
    def __iter__(self):
        """Iterate through file_ids for this tree.

        file_ids are in a WorkingTree if they are in the working inventory
        and the working file exists.

        :return: An iterator over a list of file ids collected up front.
        """
        present_ids = []
        for key, tree_details in self.current_dirstate()._iter_entries():
            # absent and relocated entries are not relevant to the working
            # tree
            if tree_details[0][0] not in ('a', 'r'):
                disk_path = pathjoin(self.basedir, key[0].decode('utf8'), key[1].decode('utf8'))
                if osutils.lexists(disk_path):
                    present_ids.append(key[2])
        return iter(present_ids)
531
2255.2.226 by Robert Collins
Get merge_nested finally working: change nested tree iterators to take file_ids, and ensure the right branch is connected to in the merge logic. May not be suitable for shared repositories yet.
532
    def iter_references(self):
        """Yield (relpath, file_id) for each tree reference in the tree.

        Nothing is yielded when the repository does not support tree
        references.  Entries whose path is missing on disk are skipped.
        """
        if not self._repo_supports_tree_reference:
            # When the repo doesn't support references, we will have nothing to
            # return
            return
        for key, tree_details in self.current_dirstate()._iter_entries():
            # absent and relocated entries are not relevant to the working
            # tree, and the root (empty basename) is not a reference.
            if tree_details[0][0] in ('a', 'r') or not key[1]:
                continue
            relpath = pathjoin(key[0].decode('utf8'), key[1].decode('utf8'))
            try:
                if self._kind(relpath) == 'tree-reference':
                    yield relpath, key[2]
            except errors.NoSuchFile:
                # path is missing on disk.
                pass
2255.2.226 by Robert Collins
Get merge_nested finally working: change nested tree iterators to take file_ids, and ensure the right branch is connected to in the merge logic. May not be suitable for shared repositories yet.
551
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
552
    def kind(self, file_id):
        """Return the kind of a file.

        This is always the actual kind that's on disk, regardless of what it
        was added as.

        Note: The caller is expected to take a read-lock before calling this.

        :param file_id: The file id whose kind is wanted.
        :raises AssertionError: If id2path returns None for file_id.
        """
        relpath = self.id2path(file_id)
        if relpath is not None:
            return self._kind(relpath)
        raise AssertionError(
            "path for id {%s} is None!" % file_id)
565
566
    def _kind(self, relpath):
        """Return the on-disk kind of the file at relpath.

        A directory is reported as 'tree-reference' when the repository
        supports tree references and _directory_is_tree_reference says the
        directory is one.

        :param relpath: Path of the file relative to the tree root.
        """
        disk_kind = file_kind(self.abspath(relpath))
        # The repository capability is consulted before the kind, as before.
        if not self._repo_supports_tree_reference:
            return disk_kind
        if disk_kind != 'directory':
            return disk_kind
        if self._directory_is_tree_reference(relpath):
            return 'tree-reference'
        return disk_kind
574
2255.2.21 by Robert Collins
Add WorkingTree4._last_revision, making workingtree_implementations.test_changes_from pass.
575
    @needs_read_lock
    def _last_revision(self):
        """See Mutable.last_revision.

        :return: The first parent id recorded in the dirstate, or
            NULL_REVISION when the dirstate lists no parents.
        """
        parents = self.current_dirstate().get_parent_ids()
        if not parents:
            return _mod_revision.NULL_REVISION
        return parents[0]
2255.2.21 by Robert Collins
Add WorkingTree4._last_revision, making workingtree_implementations.test_changes_from pass.
583
2255.5.2 by John Arbash Meinel
(broken) lock and unlock the DirState object when locking and unlocking the Tree itself
584
    def lock_read(self):
        """See Branch.lock_read, and WorkingTree.unlock.

        Locks are taken in order: the branch, then the control files, then
        the dirstate (only when it holds no lock token yet).  If a step
        fails, the control files and branch locks already taken here are
        released again before the error propagates.
        """
        self.branch.lock_read()
        try:
            self._control_files.lock_read()
            try:
                dirstate_ = self.current_dirstate()
                if not dirstate_._lock_token:
                    dirstate_.lock_read()
                # set our support for tree references from the repository in
                # use.
                repo_format = self.branch.repository._format
                self._repo_supports_tree_reference = getattr(
                    repo_format, "supports_tree_reference", False)
            except:
                # Undo the control files lock, then let the outer handler
                # release the branch.
                self._control_files.unlock()
                raise
        except:
            self.branch.unlock()
            raise
604
605
    def _lock_self_write(self):
        """This should be called after the branch is locked.

        Write-locks the control files and then the dirstate (only when it
        holds no lock token yet).  If a step fails, the control files lock
        taken here (if any) and the branch lock taken by the caller are
        released before the error propagates.
        """
        try:
            self._control_files.lock_write()
            try:
                dirstate_ = self.current_dirstate()
                if not dirstate_._lock_token:
                    dirstate_.lock_write()
                # set our support for tree references from the repository in
                # use.
                repo_format = self.branch.repository._format
                self._repo_supports_tree_reference = getattr(
                    repo_format, "supports_tree_reference", False)
            except:
                # Undo the control files lock, then let the outer handler
                # release the branch.
                self._control_files.unlock()
                raise
        except:
            self.branch.unlock()
            raise
2255.5.2 by John Arbash Meinel
(broken) lock and unlock the DirState object when locking and unlocking the Tree itself
624
625
    def lock_tree_write(self):
        """See MutableTree.lock_tree_write, and WorkingTree.unlock.

        The branch is only read-locked; the tree itself is write-locked via
        _lock_self_write.
        """
        branch = self.branch
        branch.lock_read()
        self._lock_self_write()
2255.5.2 by John Arbash Meinel
(broken) lock and unlock the DirState object when locking and unlocking the Tree itself
629
630
    def lock_write(self):
        """See MutableTree.lock_write, and WorkingTree.unlock.

        The branch is write-locked first, then the tree itself via
        _lock_self_write.
        """
        branch = self.branch
        branch.lock_write()
        self._lock_self_write()
2255.5.2 by John Arbash Meinel
(broken) lock and unlock the DirState object when locking and unlocking the Tree itself
634
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
635
    @needs_tree_write_lock
2255.2.137 by John Arbash Meinel
Move the WorkingTree.move() tests into their own module
636
    def move(self, from_paths, to_dir, after=False):
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
637
        """See WorkingTree.move()."""
2255.7.46 by Robert Collins
Fix WorkingTree4.move to return the moved paths, and update the tree implementation tests for move to check them.
638
        result = []
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
639
        if not from_paths:
2255.7.46 by Robert Collins
Fix WorkingTree4.move to return the moved paths, and update the tree implementation tests for move to check them.
640
            return result
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
641
        state = self.current_dirstate()
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
642
        if isinstance(from_paths, basestring):
643
            raise ValueError()
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
644
        to_dir_utf8 = to_dir.encode('utf8')
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
645
        to_entry_dirname, to_basename = os.path.split(to_dir_utf8)
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
646
        id_index = state._get_id_index()
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
647
        # check destination directory
648
        # get the details for it
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
649
        to_entry_block_index, to_entry_entry_index, dir_present, entry_present = \
650
            state._get_block_entry_index(to_entry_dirname, to_basename, 0)
651
        if not entry_present:
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
652
            raise errors.BzrMoveFailedError('', to_dir,
2255.7.71 by Robert Collins
Fix blackbox test_mv usage of inventory, and the errors raised by workingtree4.move - though that should be made into a workingtree conformance test.
653
                errors.NotVersionedError(to_dir))
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
654
        to_entry = state._dirblocks[to_entry_block_index][1][to_entry_entry_index]
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
655
        # get a handle on the block itself.
656
        to_block_index = state._ensure_block(
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
657
            to_entry_block_index, to_entry_entry_index, to_dir_utf8)
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
658
        to_block = state._dirblocks[to_block_index]
659
        to_abs = self.abspath(to_dir)
660
        if not isdir(to_abs):
661
            raise errors.BzrMoveFailedError('',to_dir,
662
                errors.NotADirectory(to_abs))
663
2255.2.113 by John Arbash Meinel
545ms, 600ms: Switch memory model from storing kind to using minikind
664
        if to_entry[1][0][0] != 'd':
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
665
            raise errors.BzrMoveFailedError('',to_dir,
666
                errors.NotADirectory(to_abs))
667
668
        if self._inventory is not None:
669
            update_inventory = True
670
            inv = self.inventory
3201.2.1 by Lukáš Lalinský
Make 'mv a b' work for already renamed directories, like it does for files
671
            to_dir_id = to_entry[0][2]
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
672
            to_dir_ie = inv[to_dir_id]
673
        else:
674
            update_inventory = False
675
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
676
        rollbacks = []
677
        def move_one(old_entry, from_path_utf8, minikind, executable,
678
                     fingerprint, packed_stat, size,
679
                     to_block, to_key, to_path_utf8):
680
            state._make_absent(old_entry)
681
            from_key = old_entry[0]
682
            rollbacks.append(
683
                lambda:state.update_minimal(from_key,
684
                    minikind,
685
                    executable=executable,
686
                    fingerprint=fingerprint,
687
                    packed_stat=packed_stat,
688
                    size=size,
689
                    path_utf8=from_path_utf8))
690
            state.update_minimal(to_key,
691
                    minikind,
692
                    executable=executable,
693
                    fingerprint=fingerprint,
694
                    packed_stat=packed_stat,
695
                    size=size,
696
                    path_utf8=to_path_utf8)
697
            added_entry_index, _ = state._find_entry_index(to_key, to_block[1])
698
            new_entry = to_block[1][added_entry_index]
699
            rollbacks.append(lambda:state._make_absent(new_entry))
700
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
701
        for from_rel in from_paths:
702
            # from_rel is 'pathinroot/foo/bar'
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
703
            from_rel_utf8 = from_rel.encode('utf8')
704
            from_dirname, from_tail = osutils.split(from_rel)
705
            from_dirname, from_tail_utf8 = osutils.split(from_rel_utf8)
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
706
            from_entry = self._get_entry(path=from_rel)
707
            if from_entry == (None, None):
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
708
                raise errors.BzrMoveFailedError(from_rel,to_dir,
709
                    errors.NotVersionedError(path=str(from_rel)))
710
2255.2.107 by John Arbash Meinel
(working), fix dirstate to use utf8 file ids.
711
            from_id = from_entry[0][2]
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
712
            to_rel = pathjoin(to_dir, from_tail)
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
713
            to_rel_utf8 = pathjoin(to_dir_utf8, from_tail_utf8)
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
714
            item_to_entry = self._get_entry(path=to_rel)
715
            if item_to_entry != (None, None):
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
716
                raise errors.BzrMoveFailedError(from_rel, to_rel,
717
                    "Target is already versioned.")
718
719
            if from_rel == to_rel:
720
                raise errors.BzrMoveFailedError(from_rel, to_rel,
721
                    "Source and target are identical.")
722
723
            from_missing = not self.has_filename(from_rel)
724
            to_missing = not self.has_filename(to_rel)
725
            if after:
726
                move_file = False
727
            else:
728
                move_file = True
729
            if to_missing:
730
                if not move_file:
731
                    raise errors.BzrMoveFailedError(from_rel, to_rel,
732
                        errors.NoSuchFile(path=to_rel,
733
                        extra="New file has not been created yet"))
734
                elif from_missing:
735
                    # neither path exists
736
                    raise errors.BzrRenameFailedError(from_rel, to_rel,
737
                        errors.PathsDoNotExist(paths=(from_rel, to_rel)))
738
            else:
739
                if from_missing: # implicitly just update our path mapping
740
                    move_file = False
2255.2.139 by John Arbash Meinel
test cases for moving after a file has already been moved.
741
                elif not after:
2967.3.6 by Daniel Watkins
Extracted the string from every use of RenameFailedFilesExist to RenameFailedFilesExist itself.
742
                    raise errors.RenameFailedFilesExist(from_rel, to_rel)
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
743
744
            rollbacks = []
745
            def rollback_rename():
746
                """A single rename has failed, roll it back."""
2255.2.236 by Martin Pool
Review cleanups: mostly updating or removing todo comments.
747
                # roll back everything, even if we encounter trouble doing one
748
                # of them.
749
                #
750
                # TODO: at least log the other exceptions rather than just
751
                # losing them mbp 20070307
2255.2.138 by John Arbash Meinel
implement several new WorkingTree.move() tests
752
                exc_info = None
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
753
                for rollback in reversed(rollbacks):
754
                    try:
755
                        rollback()
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
756
                    except Exception, e:
2255.2.138 by John Arbash Meinel
implement several new WorkingTree.move() tests
757
                        exc_info = sys.exc_info()
758
                if exc_info:
759
                    raise exc_info[0], exc_info[1], exc_info[2]
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
760
761
            # perform the disk move first - its the most likely failure point.
2255.2.139 by John Arbash Meinel
test cases for moving after a file has already been moved.
762
            if move_file:
763
                from_rel_abs = self.abspath(from_rel)
764
                to_rel_abs = self.abspath(to_rel)
765
                try:
766
                    osutils.rename(from_rel_abs, to_rel_abs)
767
                except OSError, e:
768
                    raise errors.BzrMoveFailedError(from_rel, to_rel, e[1])
2255.2.140 by John Arbash Meinel
Update tests to ensure basis tree is not modified
769
                rollbacks.append(lambda: osutils.rename(to_rel_abs, from_rel_abs))
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
770
            try:
771
                # perform the rename in the inventory next if needed: its easy
772
                # to rollback
773
                if update_inventory:
774
                    # rename the entry
775
                    from_entry = inv[from_id]
776
                    current_parent = from_entry.parent_id
777
                    inv.rename(from_id, to_dir_id, from_tail)
778
                    rollbacks.append(
779
                        lambda: inv.rename(from_id, current_parent, from_tail))
780
                # finally do the rename in the dirstate, which is a little
781
                # tricky to rollback, but least likely to need it.
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
782
                old_block_index, old_entry_index, dir_present, file_present = \
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
783
                    state._get_block_entry_index(from_dirname, from_tail_utf8, 0)
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
784
                old_block = state._dirblocks[old_block_index][1]
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
785
                old_entry = old_block[old_entry_index]
786
                from_key, old_entry_details = old_entry
787
                cur_details = old_entry_details[0]
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
788
                # remove the old row
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
789
                to_key = ((to_block[0],) + from_key[1:3])
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
790
                minikind = cur_details[0]
791
                move_one(old_entry, from_path_utf8=from_rel_utf8,
792
                         minikind=minikind,
793
                         executable=cur_details[3],
794
                         fingerprint=cur_details[1],
795
                         packed_stat=cur_details[4],
796
                         size=cur_details[2],
797
                         to_block=to_block,
798
                         to_key=to_key,
799
                         to_path_utf8=to_rel_utf8)
800
801
                if minikind == 'd':
802
                    def update_dirblock(from_dir, to_key, to_dir_utf8):
2438.1.5 by John Arbash Meinel
Fix the bug by not iterating over the same list we are modifying.
803
                        """Recursively update all entries in this dirblock."""
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
804
                        if from_dir == '':
805
                            raise AssertionError("renaming root not supported")
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
806
                        from_key = (from_dir, '')
807
                        from_block_idx, present = \
808
                            state._find_block_index_from_key(from_key)
809
                        if not present:
810
                            # This is the old record, if it isn't present, then
811
                            # there is theoretically nothing to update.
812
                            # (Unless it isn't present because of lazy loading,
813
                            # but we don't do that yet)
814
                            return
815
                        from_block = state._dirblocks[from_block_idx]
816
                        to_block_index, to_entry_index, _, _ = \
817
                            state._get_block_entry_index(to_key[0], to_key[1], 0)
818
                        to_block_index = state._ensure_block(
819
                            to_block_index, to_entry_index, to_dir_utf8)
820
                        to_block = state._dirblocks[to_block_index]
2438.1.5 by John Arbash Meinel
Fix the bug by not iterating over the same list we are modifying.
821
822
                        # Grab a copy since move_one may update the list.
823
                        for entry in from_block[1][:]:
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
824
                            if not (entry[0][0] == from_dir):
825
                                raise AssertionError()
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
826
                            cur_details = entry[1][0]
827
                            to_key = (to_dir_utf8, entry[0][1], entry[0][2])
828
                            from_path_utf8 = osutils.pathjoin(entry[0][0], entry[0][1])
829
                            to_path_utf8 = osutils.pathjoin(to_dir_utf8, entry[0][1])
830
                            minikind = cur_details[0]
2438.1.10 by John Arbash Meinel
Make WT4.move() properly handle moving a directory with a renamed child.
831
                            if minikind in 'ar':
2438.1.8 by John Arbash Meinel
Fix the case when renaming a directory with deleted children.
832
                                # Deleted children of a renamed directory
833
                                # Do not need to be updated.
2438.1.10 by John Arbash Meinel
Make WT4.move() properly handle moving a directory with a renamed child.
834
                                # Children that have been renamed out of this
835
                                # directory should also not be updated
2438.1.8 by John Arbash Meinel
Fix the case when renaming a directory with deleted children.
836
                                continue
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
837
                            move_one(entry, from_path_utf8=from_path_utf8,
838
                                     minikind=minikind,
839
                                     executable=cur_details[3],
840
                                     fingerprint=cur_details[1],
841
                                     packed_stat=cur_details[4],
842
                                     size=cur_details[2],
843
                                     to_block=to_block,
844
                                     to_key=to_key,
2371.2.1 by John Arbash Meinel
Update DirState._validate() to detect rename errors.
845
                                     to_path_utf8=to_path_utf8)
2255.2.146 by John Arbash Meinel
Implement move_directory by factoring out move_one
846
                            if minikind == 'd':
847
                                # We need to move all the children of this
848
                                # entry
849
                                update_dirblock(from_path_utf8, to_key,
850
                                                to_path_utf8)
851
                    update_dirblock(from_rel_utf8, to_key, to_rel_utf8)
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
852
            except:
853
                rollback_rename()
854
                raise
2255.7.46 by Robert Collins
Fix WorkingTree4.move to return the moved paths, and update the tree implementation tests for move to check them.
855
            result.append((from_rel, to_rel))
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
856
            state._dirblock_state = dirstate.DirState.IN_MEMORY_MODIFIED
2255.7.67 by Robert Collins
Fix test_inv - make setting WorkingTree4._dirty use a helper to reduce code duplication, and reset the inventory when we dont manually update it, if it exists.
857
            self._make_dirty(reset_inventory=False)
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
858
2255.7.46 by Robert Collins
Fix WorkingTree4.move to return the moved paths, and update the tree implementation tests for move to check them.
859
        return result
2255.2.59 by Robert Collins
All WorkingTree4 and dirstate tests passing.
860
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
861
    def _must_be_locked(self):
862
        if not self._control_files._lock_count:
863
            raise errors.ObjectNotLocked(self)
864
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
865
    def _new_tree(self):
866
        """Initialize the state in this tree to be a new tree."""
867
        self._dirty = True
868
869
    @needs_read_lock
    def path2id(self, path):
        """Return the file id recorded for path in this tree.

        Leading and trailing '/' characters are stripped from path before the
        lookup, so "dir/" and "dir" resolve to the same entry.

        :param path: The path to look up.
        :return: The third element of the matching entry's key (its file
            id), or None when _get_entry reports no entry for the path.
        """
        stripped = path.strip('/')
        found = self._get_entry(path=stripped)
        if found != (None, None):
            return found[0][2]
        return None
2255.2.17 by Robert Collins
tweaks - finishes off all the test_test_trees tests for dirstate.
877
2255.2.104 by Robert Collins
Add WorkingTree4.paths2ids which is inventory-usage free if the trees being examined are in the dirstate.
878
    def paths2ids(self, paths, trees=[], require_versioned=True):
        """See Tree.paths2ids().

        This override handles the lookup itself when every tree in trees is a
        DirStateRevisionTree for one of this tree's parents; otherwise it
        defers to the base class implementation.

        :param paths: Paths to look up, or None. None is returned unchanged.
        :param trees: Additional trees to search.
        :param require_versioned: Passed through to the lookup helper.
        :return: None if paths is None, else whatever the selected lookup
            implementation returns.
        """
        if paths is None:
            return None
        parents = self.get_parent_ids()
        for tree in trees:
            in_dirstate = (isinstance(tree, DirStateRevisionTree)
                           and tree._revision_id in parents)
            if not in_dirstate:
                # At least one tree is not held in the dirstate: use the
                # generic implementation instead.
                return super(WorkingTree4, self).paths2ids(paths, trees, require_versioned)
        # Index 0 is always searched; each tree adds the slot that follows
        # its position in the parent list.
        search_indexes = [0]
        for tree in trees:
            search_indexes.append(1 + parents.index(tree._revision_id))
        # From here on paths is a set of utf8 encoded paths.
        paths = set(path.encode('utf8') for path in paths)
        # Fetch the state object before picking a lookup strategy.
        state = self.current_dirstate()
        # The bisect based lookup is deliberately switched off by the
        # leading "False and"; the in-memory lookup is always selected.
        if False and (state._dirblock_state == dirstate.DirState.NOT_IN_MEMORY
            and '' not in paths):
            lookup = self._paths2ids_using_bisect
        else:
            lookup = self._paths2ids_in_memory
        return lookup(paths, search_indexes,
                      require_versioned=require_versioned)
907
908
    def _paths2ids_in_memory(self, paths, search_indexes,
                             require_versioned=True):
        """Find the file ids at or under paths using the in-memory dirblocks.

        :param paths: The paths to search (paths2ids passes a set of utf8
            encoded paths).
        :param search_indexes: Positions within each entry's details list
            that should be examined.
        :param require_versioned: If True, raise PathsNotVersionedError
            unless every path has at least one non-absent detail among
            search_indexes.
        :return: A set of file ids.
        """
        state = self.current_dirstate()
        state._read_dirblocks_if_needed()

        def _entries_for_path(path):
            """Return every entry stored at path, whatever its file id."""
            dirname, basename = os.path.split(path)
            key = (dirname, basename, '')
            block_index, present = state._find_block_index_from_key(key)
            if not present:
                # the block which should contain path is absent.
                return []
            block = state._dirblocks[block_index][1]
            position, _ = state._find_entry_index(key, block)
            wanted = key[0:2]
            matches = []
            # Several entries may share this dirname/basename: collect them
            # for as long as the path part of the key keeps matching.
            while (position < len(block) and
                   block[position][0][0:2] == wanted):
                matches.append(block[position])
                position += 1
            return matches

        def _has_versioned_cell(path):
            """Report whether any searched detail at path is not absent."""
            versioned = False
            # for each id at this path
            for entry in _entries_for_path(path):
                # for each tree.
                for tree_index in search_indexes:
                    if entry[1][tree_index][0] != 'a': # absent
                        versioned = True
                        break
            return versioned

        if require_versioned:
            # -- check all supplied paths are versioned in a search tree. --
            for path in paths:
                if not _has_versioned_cell(path):
                    # Either nothing is stored at this path, or every
                    # searched detail for it is absent.
                    raise errors.PathsNotVersionedError(paths)
        # -- remove redundancy in supplied paths to prevent over-scanning --
        search_paths = osutils.minimum_path_selection(paths)
        # sketch:
        # for all search_indexs in each path at or under each element of
        # search_paths, if the detail is relocated: add the id, and add the
        # relocated path as one to search if its not searched already. If the
        # detail is not relocated, add the id.
        searched_paths = set()
        found_ids = set()

        def _process_entry(entry):
            """Examine the searched details of one entry.

            A relocated detail queues its relocation target in search_paths
            unless that target is already covered by searched_paths. An
            absent detail is ignored. Anything else records the entry's
            file id in found_ids.
            """
            for tree_index in search_indexes:
                details = entry[1][tree_index]
                minikind = details[0]
                if minikind == 'r': # relocated
                    target = details[1]
                    if not osutils.is_inside_any(searched_paths, target):
                        search_paths.add(target)
                elif minikind != 'a': # absent
                    found_ids.add(entry[0][2])

        # search_paths can grow while it is drained: _process_entry adds
        # relocation targets to it.
        while search_paths:
            current_root = search_paths.pop()
            searched_paths.add(current_root)
            # process the entries for this containing directory: the rest
            # will be found by their parents recursively.
            root_entries = _entries_for_path(current_root)
            if not root_entries:
                # this specified path is not present at all, skip it.
                continue
            for entry in root_entries:
                _process_entry(entry)
            initial_key = (current_root, '', '')
            block_index, _ = state._find_block_index_from_key(initial_key)
            # Walk forward over every dirblock that lies inside current_root.
            while (block_index < len(state._dirblocks) and
                   osutils.is_inside(current_root,
                                     state._dirblocks[block_index][0])):
                for entry in state._dirblocks[block_index][1]:
                    _process_entry(entry)
                block_index += 1
        return found_ids
996
2255.2.133 by John Arbash Meinel
Implement _paths2ids using bisect recursive rather than loading
997
    def _paths2ids_using_bisect(self, paths, search_indexes,
                                require_versioned=True):
        """Find file ids for paths via the dirstate's recursive bisect.

        :param paths: The paths to search for.
        :param search_indexes: Positions within each result's per-tree
            details that should be examined.
        :param require_versioned: If True, raise PathsNotVersionedError when
            any requested (dirname, basename) pair is missing from the
            bisect results.
        :return: A set of file ids whose examined details are neither
            relocated ('r') nor absent ('a').
        """
        state = self.current_dirstate()

        wanted = [osutils.split(path) for path in paths]
        wanted.sort()
        located = state._bisect_recursive(wanted)

        if require_versioned:
            located_names = set()
            for key in located:
                located_names.add(key[:2])
            for dir_and_name in wanted:
                if dir_and_name not in located_names:
                    raise errors.PathsNotVersionedError(paths)

        ids = set()
        for key, tree_details in located.iteritems():
            for tree_index in search_indexes:
                minikind = tree_details[tree_index][0]
                if minikind != 'r' and minikind != 'a':
                    ids.add(key[2])
        return ids
1016
2255.2.45 by Robert Collins
Dirstate - fix revision_tree() behaviour to match the interface contract.
1017
    def read_working_inventory(self):
        """Return the working inventory.

        Kept for API compatibility: for a dirstate tree this simply hands
        back the tree's inventory attribute.
        """
        inventory = self.inventory
        return inventory
1023
2255.2.17 by Robert Collins
tweaks - finishes off all the test_test_trees tests for dirstate.
1024
    @needs_read_lock
    def revision_tree(self, revision_id):
        """See Tree.revision_tree.

        A tree is only supplied for revisions that the dirstate lists as a
        parent and does not list as a ghost.

        :param revision_id: The revision to obtain a tree for.
        :return: A DirStateRevisionTree for revision_id.
        :raises: errors.NoSuchRevisionInTree if revision_id is not one of
            the dirstate's parents, or is one of its ghosts.
        """
        state = self.current_dirstate()
        if (revision_id not in state.get_parent_ids()
            or revision_id in state.get_ghosts()):
            raise errors.NoSuchRevisionInTree(self, revision_id)
        repository = self.branch.repository
        return DirStateRevisionTree(state, revision_id, repository)
1038
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1039
    @needs_tree_write_lock
    def set_last_revision(self, new_revision):
        """Change the last revision in the working tree.

        :param new_revision: The revision id to use as the first parent.
            NULL_REVISION or None clears the parent list instead.
        :raises: AssertionError if asked to clear the parents while two or
            more parents are recorded.
        """
        parents = self.get_parent_ids()
        if new_revision not in (NULL_REVISION, None):
            # Replace only the first parent; any further parents are kept.
            self.set_parent_ids([new_revision] + parents[1:],
                allow_leftmost_as_ghost=True)
            return
        if len(parents) > 1:
            raise AssertionError(
                "setting the last parent to none with a pending merge is "
                "unsupported.")
        self.set_parent_ids([])
2255.2.37 by Robert Collins
Get TestExecutable.test_06_pull working on DirState: fix cloning and the set_last_revision api on WorkingTree4.
1052
1053
    @needs_tree_write_lock
    def set_parent_ids(self, revision_ids, allow_leftmost_as_ghost=False):
        """Set the parent ids to revision_ids.

        See also set_parent_trees. This api will try to retrieve the tree data
        for each element of revision_ids from the trees repository. If you have
        tree data already available, it is more efficient to use
        set_parent_trees rather than set_parent_ids. set_parent_ids is however
        an easier API to use.

        :param revision_ids: The revision_ids to set as the parent ids of this
            working tree. Any of these may be ghosts.
        :param allow_leftmost_as_ghost: Passed through unchanged to
            set_parent_trees.
        """
        parent_trees = []
        for revision_id in revision_ids:
            try:
                tree = self.branch.repository.revision_tree(revision_id)
                # TODO: jam 20070213 KnitVersionedFile raises
                #       RevisionNotPresent rather than NoSuchRevision if a
                #       given revision_id is not present. Should Repository be
                #       catching it and re-raising NoSuchRevision?
            except (errors.NoSuchRevision, errors.RevisionNotPresent):
                # No tree could be obtained: record the parent with a None
                # tree, which set_parent_trees treats as a ghost.
                tree = None
            parent_trees.append((revision_id, tree))
        self.set_parent_trees(parent_trees,
            allow_leftmost_as_ghost=allow_leftmost_as_ghost)
1079
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1080
    @needs_tree_write_lock
    def set_parent_trees(self, parents_list, allow_leftmost_as_ghost=False):
        """Set the parents of the working tree.

        The first parent is always kept. A later parent is dropped when it
        has already been accepted or when the repository graph does not
        report it as a head of the supplied parent ids.

        :param parents_list: A list of (revision_id, tree) tuples.
            If tree is None, then that element is treated as an unreachable
            parent tree - i.e. a ghost.
        :param allow_leftmost_as_ghost: If False, a first parent whose tree
            is None raises errors.GhostRevisionUnusableHere.
        """
        state = self.current_dirstate()
        if (len(parents_list) > 0 and not allow_leftmost_as_ghost
            and parents_list[0][1] is None):
            raise errors.GhostRevisionUnusableHere(parents_list[0][0])

        parent_ids = [rev_id for rev_id, tree in parents_list]
        graph = self.branch.repository.get_graph()
        heads = graph.heads(parent_ids)

        real_trees = []
        ghosts = []
        accepted_revisions = set()
        # convert absent trees to the null tree, which we convert back to
        # missing on access.
        for rev_id, tree in parents_list:
            # we always accept the first tree
            if accepted_revisions and (rev_id in accepted_revisions
                                       or rev_id not in heads):
                # We have already included either this tree, or its
                # descendent, so we skip it.
                continue
            _mod_revision.check_not_reserved_id(rev_id)
            if tree is None:
                null_tree = self.branch.repository.revision_tree(None)
                real_trees.append((rev_id, null_tree))
                ghosts.append(rev_id)
            else:
                real_trees.append((rev_id, tree))
            accepted_revisions.add(rev_id)
        state.set_parent_trees(real_trees, ghosts=ghosts)
        self._make_dirty(reset_inventory=False)
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1119
2255.2.15 by Robert Collins
Dirstate - truncate state file fixing bug in saving a smaller file, get more tree_implementation tests passing.
1120
    def _set_root_id(self, file_id):
        """See WorkingTree.set_root_id.

        :param file_id: The file id to record for the '' path.
        """
        state = self.current_dirstate()
        state.set_path_id('', file_id)
        modified = (state._dirblock_state ==
                    dirstate.DirState.IN_MEMORY_MODIFIED)
        if not modified:
            return
        # The dirblocks now have in-memory modifications: mark the tree
        # dirty and ask for the inventory to be reset.
        self._make_dirty(reset_inventory=True)
2255.2.15 by Robert Collins
Dirstate - truncate state file fixing bug in saving a smaller file, get more tree_implementation tests passing.
1126
2776.1.8 by Robert Collins
Retrieve the sha from the dirstate for path_content_summary on hash cache hits; slight performance hit but a big win for incremental commits.
1127
    def _sha_from_stat(self, path, stat_result):
1128
        """Get a sha digest from the tree's stat cache.
1129
1130
        The default implementation assumes no stat cache is present.
1131
1132
        :param path: The path.
1133
        :param stat_result: The stat result being looked up.
1134
        """
2929.1.1 by Robert Collins
Use a dict to access stat cache information from dirstate.
1135
        return self.current_dirstate().sha1_from_stat(path, stat_result)
2776.1.8 by Robert Collins
Retrieve the sha from the dirstate for path_content_summary on hash cache hits; slight performance hit but a big win for incremental commits.
1136
2255.2.232 by Robert Collins
Make WorkingTree4 report support for references based on the repositories capabilities.
1137
    @needs_read_lock
    def supports_tree_reference(self):
        """Return the value of this tree's _repo_supports_tree_reference."""
        supported = self._repo_supports_tree_reference
        return supported
1140
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1141
    def unlock(self):
        """Unlock in format 4 trees needs to write the entire dirstate.

        When the control files' lock count is 1, a dirty write-locked tree
        is flushed, any held dirstate is saved and unlocked, and the
        dirstate and inventory attributes are reset to None. The control
        files and then the branch are unlocked afterwards in every case.

        :return: The result of unlocking the control files.
        """
        # do non-implementation specific cleanup
        self._cleanup()

        if self._control_files._lock_count == 1:
            # eventually we should do signature checking during read locks for
            # dirstate updates.
            if self._control_files._lock_mode == 'w' and self._dirty:
                self.flush()
            if self._dirstate is not None:
                # This is a no-op if there are no modifications.
                self._dirstate.save()
                self._dirstate.unlock()
            # TODO: jam 20070301 We shouldn't have to wipe the dirstate at this
            #       point. Instead, it could check if the header has been
            #       modified when it is locked, and if not, it can hang on to
            #       the data it has in memory.
            self._dirstate = None
            self._inventory = None
        # reverse order of locking.
        try:
            return self._control_files.unlock()
        finally:
            # The branch is unlocked even if unlocking the control files
            # raises.
            self.branch.unlock()
1167
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1168
    @needs_tree_write_lock
1169
    def unversion(self, file_ids):
1170
        """Remove the file ids in file_ids from the current versioned set.
1171
1172
        When a file_id is unversioned, all of its children are automatically
1173
        unversioned.
1174
1175
        :param file_ids: The file ids to stop versioning.
1176
        :raises: NoSuchId if any fileid is not currently versioned.
1177
        """
1178
        if not file_ids:
1179
            return
1180
        state = self.current_dirstate()
1181
        state._read_dirblocks_if_needed()
2858.2.1 by Martin Pool
Remove most calls to safe_file_id and safe_revision_id.
1182
        ids_to_unversion = set(file_ids)
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1183
        paths_to_unversion = set()
1184
        # sketch:
1185
        # check if the root is to be unversioned, if so, assert for now.
2255.2.93 by Robert Collins
Dirstate - update WorkingTree4.unversion to the new layout, other tests still borked.
1186
        # walk the state marking unversioned things as absent.
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1187
        # if there are any un-unversioned ids at the end, raise
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
1188
        for key, details in state._dirblocks[0][1]:
2255.2.113 by John Arbash Meinel
545ms, 600ms: Switch memory model from storing kind to using minikind
1189
            if (details[0][0] not in ('a', 'r') and # absent or relocated
2255.2.93 by Robert Collins
Dirstate - update WorkingTree4.unversion to the new layout, other tests still borked.
1190
                key[2] in ids_to_unversion):
1191
                # I haven't written the code to unversion / yet - it should be
1192
                # supported.
1193
                raise errors.BzrError('Unversioning the / is not currently supported')
1194
        block_index = 0
1195
        while block_index < len(state._dirblocks):
1196
            # process one directory at a time.
1197
            block = state._dirblocks[block_index]
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1198
            # first check: is the path one to remove - it or its children
1199
            delete_block = False
1200
            for path in paths_to_unversion:
1201
                if (block[0].startswith(path) and
1202
                    (len(block[0]) == len(path) or
1203
                     block[0][len(path)] == '/')):
2255.2.93 by Robert Collins
Dirstate - update WorkingTree4.unversion to the new layout, other tests still borked.
1204
                    # this entire block should be deleted - its the block for a
1205
                    # path to unversion; or the child of one
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1206
                    delete_block = True
1207
                    break
1208
            # TODO: trim paths_to_unversion as we pass by paths
1209
            if delete_block:
2255.2.93 by Robert Collins
Dirstate - update WorkingTree4.unversion to the new layout, other tests still borked.
1210
                # this block is to be deleted: process it.
1211
                # TODO: we can special case the no-parents case and
1212
                # just forget the whole block.
1213
                entry_index = 0
1214
                while entry_index < len(block[1]):
2255.7.41 by John Arbash Meinel
WorkingTree.unversion() should not raise if unversioning a child and a parent.
1215
                    # Mark this file id as having been removed
2363.2.3 by John Arbash Meinel
Just check if the entry is absent before calling _make_absent.
1216
                    entry = block[1][entry_index]
1217
                    ids_to_unversion.discard(entry[0][2])
2922.2.4 by John Arbash Meinel
Fix bug #114615 by teaching unversion() to not touch renamed entries.
1218
                    if (entry[1][0][0] in 'ar' # don't remove absent or renamed
1219
                                               # entries
2363.2.3 by John Arbash Meinel
Just check if the entry is absent before calling _make_absent.
1220
                        or not state._make_absent(entry)):
2255.2.93 by Robert Collins
Dirstate - update WorkingTree4.unversion to the new layout, other tests still borked.
1221
                        entry_index += 1
1222
                # go to the next block. (At the moment we dont delete empty
1223
                # dirblocks)
1224
                block_index += 1
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1225
                continue
2255.2.93 by Robert Collins
Dirstate - update WorkingTree4.unversion to the new layout, other tests still borked.
1226
            entry_index = 0
1227
            while entry_index < len(block[1]):
1228
                entry = block[1][entry_index]
2255.2.113 by John Arbash Meinel
545ms, 600ms: Switch memory model from storing kind to using minikind
1229
                if (entry[1][0][0] in ('a', 'r') or # absent, relocated
2255.2.93 by Robert Collins
Dirstate - update WorkingTree4.unversion to the new layout, other tests still borked.
1230
                    # ^ some parent row.
1231
                    entry[0][2] not in ids_to_unversion):
1232
                    # ^ not an id to unversion
1233
                    entry_index += 1
1234
                    continue
2255.2.113 by John Arbash Meinel
545ms, 600ms: Switch memory model from storing kind to using minikind
1235
                if entry[1][0][0] == 'd':
2255.7.41 by John Arbash Meinel
WorkingTree.unversion() should not raise if unversioning a child and a parent.
1236
                    paths_to_unversion.add(pathjoin(entry[0][0], entry[0][1]))
2255.2.93 by Robert Collins
Dirstate - update WorkingTree4.unversion to the new layout, other tests still borked.
1237
                if not state._make_absent(entry):
1238
                    entry_index += 1
1239
                # we have unversioned this id
1240
                ids_to_unversion.remove(entry[0][2])
1241
            block_index += 1
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1242
        if ids_to_unversion:
1243
            raise errors.NoSuchId(self, iter(ids_to_unversion).next())
2255.7.67 by Robert Collins
Fix test_inv - make setting WorkingTree4._dirty use a helper to reduce code duplication, and reset the inventory when we dont manually update it, if it exists.
1244
        self._make_dirty(reset_inventory=False)
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1245
        # have to change the legacy inventory too.
1246
        if self._inventory is not None:
1247
            for file_id in file_ids:
2255.2.33 by Robert Collins
Correct thunko in refactoring a few commits back.
1248
                self._inventory.remove_recursive_id(file_id)
2255.2.22 by Robert Collins
Dirstate: implement WorkingTree4.unversion, letting some test_commit tests pass.
1249
3146.8.5 by Aaron Bentley
Get apply_inventory_delta kinda working, but not children
1250
    @needs_tree_write_lock
    def rename_one(self, from_rel, to_rel, after=False):
        """See WorkingTree.rename_one.

        Flushes this tree first, then hands the rename over to the
        WorkingTree implementation with the arguments unchanged.  Nothing is
        returned.
        """
        self.flush()
        base_rename = WorkingTree.rename_one
        base_rename(self, from_rel, to_rel, after)
1255
1256
    @needs_tree_write_lock
    def apply_inventory_delta(self, changes):
        """See MutableTree.apply_inventory_delta.

        The delta is applied straight to the current dirstate; afterwards the
        tree is marked dirty with reset_inventory=True.

        :param changes: the inventory delta, passed unchanged to the
            dirstate's update_by_delta().
        """
        self.current_dirstate().update_by_delta(changes)
        self._make_dirty(reset_inventory=True)
3146.8.5 by Aaron Bentley
Get apply_inventory_delta kinda working, but not children
1262
2929.2.1 by Robert Collins
* Commit updates the state of the working tree via a delta rather than
1263
    def update_basis_by_delta(self, new_revid, delta):
        """See MutableTree.update_basis_by_delta.

        :param new_revid: the revision id the basis is being moved to.
        :param delta: the delta to apply; it is handed unchanged to the
            dirstate's update_basis_by_delta().
        :raises AssertionError: if new_revid is already what
            self.last_revision() reports.
        """
        if self.last_revision() == new_revid:
            # Say which revision tripped the check; a bare AssertionError
            # gives no hint about what went wrong.
            raise AssertionError(
                "update_basis_by_delta called with new_revid %r, which is "
                "already the last revision of this tree" % (new_revid,))
        # Note the argument order is swapped relative to this method.
        self.current_dirstate().update_basis_by_delta(delta, new_revid)
1268
2371.2.1 by John Arbash Meinel
Update DirState._validate() to detect rename errors.
1269
    @needs_read_lock
    def _validate(self):
        """Run the dirstate's own _validate() check.

        Note this reads self._dirstate directly rather than going through
        current_dirstate().
        """
        state = self._dirstate
        state._validate()
1272
2255.2.16 by Robert Collins
Implement WorkingTreeFormat4._write_inventory for better compatability with existing code, letting more test_test_trees pass, now up to test_tree_with_subdirs_and_all_content_types.
1273
    @needs_tree_write_lock
    def _write_inventory(self, inv):
        """Write inventory as the current inventory.

        :param inv: the inventory to load into the dirstate.
        :raises AssertionError: if the tree is already dirty, since pending
            changes would be overwritten.
        """
        if self._dirty:
            message = ("attempting to write an inventory when the "
                       "dirstate is dirty will lose pending changes")
            raise AssertionError(message)
        state = self.current_dirstate()
        state.set_state_from_inventory(inv)
        self._make_dirty(reset_inventory=False)
        # Only replace a cached inventory; if none has been built yet there
        # is nothing to keep in sync.
        if self._inventory is not None:
            self._inventory = inv
        self.flush()
1284
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1285
1286
class WorkingTreeFormat4(WorkingTreeFormat3):
    """The first consolidated dirstate working tree format.

    This format:
        - exists within a metadir controlling .bzr
        - includes an explicit version marker for the workingtree control
          files, separate from the BzrDir format
        - modifies the hash cache format
        - is new in bzr 0.15
        - uses a LockDir to guard access to it.
    """

    upgrade_recommended = False

    # The tree class instantiated by initialize() and _open(); subclasses
    # may point this at their own WorkingTree implementation.
    _tree_class = WorkingTree4

    def get_format_string(self):
        """See WorkingTreeFormat.get_format_string()."""
        return "Bazaar Working Tree Format 4 (bzr 0.15)\n"

    def get_format_description(self):
        """See WorkingTreeFormat.get_format_description()."""
        return "Working tree format 4"

    def initialize(self, a_bzrdir, revision_id=None, from_branch=None,
                   accelerator_tree=None, hardlink=False):
        """See WorkingTreeFormat.initialize().

        :param a_bzrdir: the control directory to create the tree in.  Its
            transport must be a LocalTransport.
        :param revision_id: allows creating a working tree at a different
            revision than the branch is at.  When None, the branch's last
            revision is used.
        :param from_branch: the branch to use for the new tree.  When None,
            the branch is opened from a_bzrdir.
        :param accelerator_tree: A tree which can be used for retrieving file
            contents more quickly than the revision tree, i.e. a workingtree.
            The revision tree will be used for cases where accelerator_tree's
            content is different.
        :param hardlink: If true, hard-link files from accelerator_tree,
            where possible.
        :return: the new tree object, after the locks taken here have been
            released.
        :raises errors.NotLocalUrl: if a_bzrdir's transport is not local.

        When the target revision is None or NULL_REVISION the tree first
        gets a random root id if the repository supports rich root data,
        ROOT_ID otherwise.  If the basis tree has a root id, that one is
        used instead.
        """
        if not isinstance(a_bzrdir.transport, LocalTransport):
            raise errors.NotLocalUrl(a_bzrdir.transport.base)
        transport = a_bzrdir.get_workingtree_transport(self)
        control_files = self._open_control_files(a_bzrdir)
        control_files.create_lock()
        control_files.lock_write()
        # Everything up to taking the tree lock can fail (writing the format
        # file, opening the branch, creating the dirstate, ...).  Make sure
        # the write lock taken just above is not leaked in that case.
        tree_locked = False
        try:
            transport.put_bytes('format', self.get_format_string(),
                mode=a_bzrdir._get_file_mode())
            if from_branch is not None:
                branch = from_branch
            else:
                branch = a_bzrdir.open_branch()
            if revision_id is None:
                revision_id = branch.last_revision()
            local_path = transport.local_abspath('dirstate')
            # write out new dirstate (must exist when we create the tree)
            state = dirstate.DirState.initialize(local_path)
            state.unlock()
            del state
            wt = self._tree_class(a_bzrdir.root_transport.local_abspath('.'),
                             branch,
                             _format=self,
                             _bzrdir=a_bzrdir,
                             _control_files=control_files)
            wt._new_tree()
            wt.lock_tree_write()
            tree_locked = True
        finally:
            if not tree_locked:
                control_files.unlock()
        try:
            self._init_custom_control_files(wt)
            if revision_id in (None, NULL_REVISION):
                if branch.repository.supports_rich_root():
                    wt._set_root_id(generate_ids.gen_root_id())
                else:
                    wt._set_root_id(ROOT_ID)
                wt.flush()
            basis = None
            # frequently, we will get here due to branching.  The accelerator
            # tree will be the tree from the branch, so the desired basis
            # tree will often be a parent of the accelerator tree.
            if accelerator_tree is not None:
                try:
                    basis = accelerator_tree.revision_tree(revision_id)
                except errors.NoSuchRevision:
                    # Fall through to asking the repository below.
                    pass
            if basis is None:
                basis = branch.repository.revision_tree(revision_id)
            if revision_id == NULL_REVISION:
                parents_list = []
            else:
                parents_list = [(revision_id, basis)]
            basis.lock_read()
            try:
                wt.set_parent_trees(parents_list, allow_leftmost_as_ghost=True)
                wt.flush()
                # if the basis has a root id we have to use that; otherwise we
                # use a new random one
                basis_root_id = basis.get_root_id()
                if basis_root_id is not None:
                    wt._set_root_id(basis_root_id)
                    wt.flush()
                # delta_from_tree is safe even for DirStateRevisionTrees,
                # because wt4.apply_inventory_delta does not mutate the input
                # inventory entries.
                transform.build_tree(basis, wt, accelerator_tree,
                                     hardlink=hardlink, delta_from_tree=True)
            finally:
                basis.unlock()
        finally:
            # NOTE(review): release order is kept exactly as before
            # (control_files first, then the tree) - presumably the tree's
            # unlock depends on it; confirm before reordering.
            control_files.unlock()
            wt.unlock()
        return wt

    def _init_custom_control_files(self, wt):
        """Subclasses with custom control files should override this method.

        The working tree and control files are locked for writing when this
        method is called.

        :param wt: the WorkingTree object
        """

    def _open(self, a_bzrdir, control_files):
        """Open the tree itself.

        :param a_bzrdir: the dir for the tree.
        :param control_files: the control files for the tree.
        :return: an instance of self._tree_class rooted at a_bzrdir's root
            transport, using the branch opened from a_bzrdir.
        """
        return self._tree_class(a_bzrdir.root_transport.local_abspath('.'),
                           branch=a_bzrdir.open_branch(),
                           _format=self,
                           _bzrdir=a_bzrdir,
                           _control_files=control_files)

    def __get_matchingbzrdir(self):
        # please test against something that will let us do tree references
        return bzrdir.format_registry.make_bzrdir(
            'dirstate-with-subtree')

    # Looked up through the registry on every access rather than cached.
    _matchingbzrdir = property(__get_matchingbzrdir)
1424
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1425
1426
class DirStateRevisionTree(Tree):
1427
    """A revision tree pulling the inventory from a dirstate."""
1428
1429
    def __init__(self, dirstate, revision_id, repository):
1430
        self._dirstate = dirstate
2858.2.1 by Martin Pool
Remove most calls to safe_file_id and safe_revision_id.
1431
        self._revision_id = revision_id
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1432
        self._repository = repository
1433
        self._inventory = None
2255.2.38 by Robert Collins
Fix WorkingTree4.pull to work.
1434
        self._locked = 0
2255.5.2 by John Arbash Meinel
(broken) lock and unlock the DirState object when locking and unlocking the Tree itself
1435
        self._dirstate_locked = False
3504.2.1 by John Arbash Meinel
Shortcut iter_references when we know references aren't supported.
1436
        self._repo_supports_tree_reference = getattr(
1437
            repository._format, "supports_tree_reference",
1438
            False)
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1439
2255.2.184 by Martin Pool
Fixes for some comparison tests; repr of DirStateRevisionTree
1440
    def __repr__(self):
1441
        return "<%s of %s in %s>" % \
1442
            (self.__class__.__name__, self._revision_id, self._dirstate)
1443
1551.15.46 by Aaron Bentley
Move plan merge to tree
1444
    def annotate_iter(self, file_id,
                      default_revision=_mod_revision.CURRENT_REVISION):
        """See Tree.annotate_iter

        The text is looked up in the repository under the key
        (file_id, revision recorded for file_id in this tree's inventory).
        default_revision is accepted but not used here.

        :return: a list of (last element of the annotation key, line) pairs.
        """
        revision = self.inventory[file_id].revision
        annotated = self._repository.texts.annotate((file_id, revision))
        result = []
        for key, line in annotated:
            # Only the final element of each key is reported.
            result.append((key[-1], line))
        return result
2255.2.69 by John Arbash Meinel
Implement annotate_iter, get_revision_id, and walkdirs so that all tree_implementations now pass
1450
1551.15.46 by Aaron Bentley
Move plan merge to tree
1451
    def _get_ancestors(self, default_revision):
1452
        return set(self._repository.get_ancestry(self._revision_id,
1453
                                                 topo_sorted=False))
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1454
    def _comparison_data(self, entry, path):
2255.2.182 by Martin Pool
merge dirstate and trunk
1455
        """See Tree._comparison_data."""
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1456
        if entry is None:
1457
            return None, False, None
1458
        # trust the entry as RevisionTree does, but this may not be
1459
        # sensible: the entry might not have come from us?
1460
        return entry.kind, entry.executable, None
1461
2255.2.10 by Robert Collins
Now all tests matching dirstate pass - added generation of inventories for parent trees.
1462
    def _file_size(self, entry, stat_value):
1463
        return entry.text_size
1464
2255.2.78 by Robert Collins
Really finish the prior commit.
1465
    def filter_unversioned_files(self, paths):
        """Return the subset of paths that are not versioned in this tree.

        Versioned paths are the ones dropped: a path is kept in the result
        exactly when self.has_filename(path) is false.

        :param paths: an iterable of paths to check.
        :return: set of the paths that are not versioned.
        """
        is_versioned = self.has_filename
        return set(p for p in paths if not is_versioned(p))
1472
2255.2.166 by Martin Pool
(broken) Add Tree.get_root_id() & test
1473
    def get_root_id(self):
        """Return whatever path2id() reports for the empty (root) path."""
        root_path = ''
        return self.path2id(root_path)
1475
3016.1.1 by Aaron Bentley
Update DirStateRevisionTree to avoid using inventory
1476
    def id2path(self, file_id):
        """Convert a file-id to a path.

        :param file_id: the file id to look up through _get_entry().
        :return: the entry's directory and name joined and decoded from utf8.
        :raises errors.NoSuchId: if _get_entry() returns (None, None).
        """
        entry = self._get_entry(file_id=file_id)
        if entry != (None, None):
            # entry[0] is the key; its first two fields are dirname and name.
            dirname, basename = entry[0][0], entry[0][1]
            return osutils.pathjoin(dirname, basename).decode('utf8')
        raise errors.NoSuchId(tree=self, file_id=file_id)
1483
3504.2.1 by John Arbash Meinel
Shortcut iter_references when we know references aren't supported.
1484
    def iter_references(self):
        """Iterate over tree references, short-circuiting when unsupported.

        When the repository doesn't support references there is nothing to
        return, so an empty iterator is handed back without doing any work.
        Otherwise the default (superclass) implementation is used.
        """
        if self._repo_supports_tree_reference:
            return super(DirStateRevisionTree, self).iter_references()
        return iter([])
1491
2255.2.134 by John Arbash Meinel
Add a tree-test for get_symlink_target
1492
    def _get_parent_index(self):
1493
        """Return the index in the dirstate referenced by this tree."""
1494
        return self._dirstate.get_parent_ids().index(self._revision_id) + 1
1495
2255.2.98 by Robert Collins
Perform path2id lookups in dirstate revision trees from the dirstate index without requiring an inventory.
1496
    def _get_entry(self, file_id=None, path=None):
1497
        """Get the dirstate row for file_id or path.
1498
1499
        If either file_id or path is supplied, it is used as the key to lookup.
1500
        If both are supplied, the fastest lookup is used, and an error is
1501
        raised if they do not both point at the same row.
1502
        
1503
        :param file_id: An optional unicode file_id to be looked up.
1504
        :param path: An optional unicode path to be looked up.
1505
        :return: The dirstate row tuple for path/file_id, or (None, None)
1506
        """
1507
        if file_id is None and path is None:
1508
            raise errors.BzrError('must supply file_id or path')
1509
        if path is not None:
1510
            path = path.encode('utf8')
2255.2.134 by John Arbash Meinel
Add a tree-test for get_symlink_target
1511
        parent_index = self._get_parent_index()
2255.2.98 by Robert Collins
Perform path2id lookups in dirstate revision trees from the dirstate index without requiring an inventory.
1512
        return self._dirstate._get_entry(parent_index, fileid_utf8=file_id, path_utf8=path)
1513
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1514
    def _generate_inventory(self):
1515
        """Create and set self.inventory from the dirstate object.
2255.2.84 by John Arbash Meinel
Remove now-unecessary encode/decode calls for revision ids.
1516
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
1517
        (So this is only called the first time the inventory is requested for
2255.2.182 by Martin Pool
merge dirstate and trunk
1518
        this tree; it then remains in memory until it's out of date.)
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
1519
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1520
        This is relatively expensive: we have to walk the entire dirstate.
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
1521
        """
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
1522
        if not self._locked:
1523
            raise AssertionError(
1524
                'cannot generate inventory of an unlocked '
1525
                'dirstate revision tree')
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
1526
        # separate call for profiling - makes it clear where the costs are.
1527
        self._dirstate._read_dirblocks_if_needed()
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
1528
        if self._revision_id not in self._dirstate.get_parent_ids():
1529
            raise AssertionError(
1530
                'parent %s has disappeared from %s' % (
1531
                self._revision_id, self._dirstate.get_parent_ids()))
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
1532
        parent_index = self._dirstate.get_parent_ids().index(self._revision_id) + 1
1533
        # This is identical now to the WorkingTree _generate_inventory except
1534
        # for the tree index use.
1535
        root_key, current_entry = self._dirstate._get_entry(parent_index, path_utf8='')
2255.2.107 by John Arbash Meinel
(working), fix dirstate to use utf8 file ids.
1536
        current_id = root_key[2]
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
1537
        if current_entry[parent_index][0] != 'd':
1538
            raise AssertionError()
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
1539
        inv = Inventory(root_id=current_id, revision_id=self._revision_id)
1540
        inv.root.revision = current_entry[parent_index][4]
2255.2.114 by John Arbash Meinel
_get_inventory: 2.09 => 1.93s by tweaking some of the inner _generate_inventory loops
1541
        # Turn some things into local variables
1542
        minikind_to_kind = dirstate.DirState._minikind_to_kind
1543
        factory = entry_factory
1544
        utf8_decode = cache_utf8._utf8_decode
2255.2.115 by John Arbash Meinel
_get_inventory 1.75s: Directly update the inventory state rather than using inv.add()
1545
        inv_byid = inv._byid
2255.2.73 by Robert Collins
50% speedup in the dirstate->inventory conversion logic by caching the parent ids as we walk the tree. Some further work would be to maintain a stack of parents as we know we visit depth first.
1546
        # we could do this straight out of the dirstate; it might be fast
1547
        # and should be profiled - RBC 20070216
2255.2.115 by John Arbash Meinel
_get_inventory 1.75s: Directly update the inventory state rather than using inv.add()
1548
        parent_ies = {'' : inv.root}
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
1549
        for block in self._dirstate._dirblocks[1:]: #skip root
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
1550
            dirname = block[0]
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
1551
            try:
2255.2.115 by John Arbash Meinel
_get_inventory 1.75s: Directly update the inventory state rather than using inv.add()
1552
                parent_ie = parent_ies[dirname]
2255.2.96 by Robert Collins
Restore dirstate to all tests passing condition.
1553
            except KeyError:
1554
                # all the paths in this block are not versioned in this tree
1555
                continue
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
1556
            for key, entry in block[1]:
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
1557
                minikind, fingerprint, size, executable, revid = entry[parent_index]
2255.2.114 by John Arbash Meinel
_get_inventory: 2.09 => 1.93s by tweaking some of the inner _generate_inventory loops
1558
                if minikind in ('a', 'r'): # absent, relocated
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
1559
                    # not this tree
1560
                    continue
2255.2.107 by John Arbash Meinel
(working), fix dirstate to use utf8 file ids.
1561
                name = key[1]
2255.2.114 by John Arbash Meinel
_get_inventory: 2.09 => 1.93s by tweaking some of the inner _generate_inventory loops
1562
                name_unicode = utf8_decode(name)[0]
2255.2.107 by John Arbash Meinel
(working), fix dirstate to use utf8 file ids.
1563
                file_id = key[2]
2255.2.114 by John Arbash Meinel
_get_inventory: 2.09 => 1.93s by tweaking some of the inner _generate_inventory loops
1564
                kind = minikind_to_kind[minikind]
2255.2.115 by John Arbash Meinel
_get_inventory 1.75s: Directly update the inventory state rather than using inv.add()
1565
                inv_entry = factory[kind](file_id, name_unicode,
1566
                                          parent_ie.file_id)
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
1567
                inv_entry.revision = revid
1568
                if kind == 'file':
1569
                    inv_entry.executable = executable
1570
                    inv_entry.text_size = size
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
1571
                    inv_entry.text_sha1 = fingerprint
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
1572
                elif kind == 'directory':
2255.2.115 by John Arbash Meinel
_get_inventory 1.75s: Directly update the inventory state rather than using inv.add()
1573
                    parent_ies[(dirname + '/' + name).strip('/')] = inv_entry
2255.2.93 by Robert Collins
Dirstate - update WorkingTree4.unversion to the new layout, other tests still borked.
1574
                elif kind == 'symlink':
1575
                    inv_entry.executable = False
2338.4.1 by Marien Zwart
Fix committing merges in a dirstate tree with a symlink.
1576
                    inv_entry.text_size = None
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
1577
                    inv_entry.symlink_target = utf8_decode(fingerprint)[0]
1578
                elif kind == 'tree-reference':
2255.2.218 by Robert Collins
Make the nested tree commit smoke test be more rigourous.
1579
                    inv_entry.reference_revision = fingerprint or None
2255.2.87 by Robert Collins
core dirstate tests passing with new structure.
1580
                else:
2255.2.158 by Martin Pool
Most of the integration of dirstate and subtree
1581
                    raise AssertionError("cannot convert entry %r into an InventoryEntry"
1582
                            % entry)
2255.2.115 by John Arbash Meinel
_get_inventory 1.75s: Directly update the inventory state rather than using inv.add()
1583
                # These checks cost us around 40ms on a 55k entry tree
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
1584
                if file_id in inv_byid:
1585
                    raise AssertionError('file_id %s already in'
1586
                        ' inventory as %s' % (file_id, inv_byid[file_id]))
1587
                if name_unicode in parent_ie.children:
1588
                    raise AssertionError('name %r already in parent'
1589
                        % (name_unicode,))
2255.2.115 by John Arbash Meinel
_get_inventory 1.75s: Directly update the inventory state rather than using inv.add()
1590
                inv_byid[file_id] = inv_entry
1591
                parent_ie.children[name_unicode] = inv_entry
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1592
        self._inventory = inv
1593
2255.7.36 by John Arbash Meinel
All trees should implement get_file_mtime()
1594
    def get_file_mtime(self, file_id, path=None):
        """Return the modification time for this record.

        The value reported is the timestamp of the revision in which the
        entry was last changed, as recorded for this tree in the dirstate.

        :param file_id: The file id to look up.
        :param path: Optional path handed to the dirstate entry lookup.
        :return: The timestamp of the last-changed revision, or None when
            no entry is found.
        """
        found = self._get_entry(file_id, path=path)
        if found == (None, None): # do we raise?
            return None
        # Element 4 of the per-tree details is the last-changed revision id.
        tree_details = found[1][self._get_parent_index()]
        revision = self._repository.get_revision(tree_details[4])
        return revision.timestamp
1606
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
1607
    def get_file_sha1(self, file_id, path=None, stat_value=None):
        """Return the sha1 recorded in the dirstate for a file in this tree.

        :param file_id: The file id to look up.
        :param path: Optional path handed to the dirstate entry lookup.
        :param stat_value: Accepted but not used by this implementation.
        :return: The recorded fingerprint when the entry's minikind is 'f'
            (a file); None for any other kind.
        """
        all_details = self._get_entry(file_id=file_id, path=path)[1]
        tree_details = all_details[self._get_parent_index()]
        if tree_details[0] != 'f':
            return None
        return tree_details[1]
1614
2743.3.3 by Ian Clatworthy
Skip path lookup for tree.get_file() when we already know the path
1615
    def get_file(self, file_id, path=None):
        """Return a file-like object wrapping the text of file_id.

        :param path: Accepted but not used; the text is fetched by file_id.
        """
        text = self.get_file_text(file_id)
        return StringIO(text)
1617
1618
    def get_file_lines(self, file_id):
        """Return the text of file_id split up by osutils.split_lines."""
        text = self.get_file_text(file_id)
        return osutils.split_lines(text)
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
1620
1621
    def get_file_size(self, file_id):
        """See Tree.get_file_size"""
        # The size comes from the inventory entry built for this tree.
        inv_entry = self.inventory[file_id]
        return inv_entry.text_size
1624
1625
    def get_file_text(self, file_id):
        """Return the content of file_id as reported by iter_files_bytes.

        A single request with a None identifier is issued and the second
        element of the first result is returned.
        """
        results = list(self.iter_files_bytes([(file_id, None)]))
        first_result = results[0]
        return first_result[1]
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
1627
2255.2.226 by Robert Collins
Get merge_nested finally working: change nested tree iterators to take file_ids, and ensure the right branch is connected to in the merge logic. May not be suitable for shared repositories yet.
1628
    def get_reference_revision(self, file_id, path=None):
        """Return the reference_revision of the inventory entry for file_id.

        :param path: Accepted but not used; the lookup is by file_id.
        """
        inv_entry = self.inventory[file_id]
        return inv_entry.reference_revision
2255.2.218 by Robert Collins
Make the nested tree commit smoke test be more rigourous.
1630
2708.1.7 by Aaron Bentley
Rename extract_files_bytes to iter_files_bytes
1631
    def iter_files_bytes(self, desired_files):
        """See Tree.iter_files_bytes.

        This version is implemented on top of Repository.iter_files_bytes.

        :param desired_files: An iterable of (file_id, identifier) pairs.
        :return: Whatever the repository's iter_files_bytes returns for the
            (file_id, last-changed revision, identifier) requests built here.
        :raises NoSuchId: if a file_id has no entry in the dirstate.
        """
        tree_index = self._get_parent_index()
        requests = []
        for file_id, identifier in desired_files:
            found = self._get_entry(file_id)
            if found == (None, None):
                raise errors.NoSuchId(self, file_id)
            # Element 4 of the per-tree details is the last-changed revision.
            last_changed = found[1][tree_index][4]
            requests.append((file_id, last_changed, identifier))
        return self._repository.iter_files_bytes(requests)
2708.1.4 by Aaron Bentley
RevisionTree and DirStateRevisionTree use Repository.extract_files_bytes
1644
2255.2.134 by John Arbash Meinel
Add a tree-test for get_symlink_target
1645
    def get_symlink_target(self, file_id):
        """Return the symlink target recorded in the dirstate for file_id.

        :return: The stored target when the entry's minikind is 'l',
            otherwise None.
        """
        all_details = self._get_entry(file_id=file_id)[1]
        tree_details = all_details[self._get_parent_index()]
        if tree_details[0] == 'l':
            # At present, none of the tree implementations supports non-ascii
            # symlink targets. So we will just assume that the dirstate path
            # is correct.
            return tree_details[1]
        return None
1655
2255.2.69 by John Arbash Meinel
Implement annotate_iter, get_revision_id, and walkdirs so that all tree_implementations now pass
1656
    def get_revision_id(self):
        """Return the id of the revision this tree represents."""
        revision_id = self._revision_id
        return revision_id
1659
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
1660
    def _get_inventory(self):
1661
        if self._inventory is not None:
1662
            return self._inventory
2255.2.182 by Martin Pool
merge dirstate and trunk
1663
        self._must_be_locked()
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
1664
        self._generate_inventory()
1665
        return self._inventory
1666
1667
    # Read-only attribute; the getter builds the inventory on first access.
    inventory = property(fget=_get_inventory, doc="Inventory of this Tree")
1669
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1670
    def get_parent_ids(self):
        """Return the parent ids of this tree's revision.

        The parents are not cached: every call asks the repository for the
        revision object and returns its parent_ids.
        """
        revision = self._repository.get_revision(self._revision_id)
        return revision.parent_ids
1673
2255.2.30 by Robert Collins
Some workingtree_implementations/test_workingtree.py test work - add DirStateRevisionTree.has_filename, locks around appropriate calls in tests.
1674
    def has_filename(self, filename):
        """Return True if path2id finds a (non-empty) id for filename."""
        file_id = self.path2id(filename)
        if file_id:
            return True
        return False
2255.2.30 by Robert Collins
Some workingtree_implementations/test_workingtree.py test work - add DirStateRevisionTree.has_filename, locks around appropriate calls in tests.
1676
2255.2.182 by Martin Pool
merge dirstate and trunk
1677
    def kind(self, file_id):
        """Return the kind of file_id as recorded for this tree.

        The dirstate entry holds one details tuple per tree; the tuple for
        this revision tree is selected with _get_parent_index(), the same
        way the other accessors of this class do, rather than assuming the
        tree is always stored at index 1.

        :param file_id: The file id to look up.
        :return: The kind name mapped from the entry's minikind.
        :raises NoSuchId: if file_id has no entry in the dirstate.
        """
        entry = self._get_entry(file_id=file_id)[1]
        if entry is None:
            raise errors.NoSuchId(tree=self, file_id=file_id)
        parent_index = self._get_parent_index()
        return dirstate.DirState._minikind_to_kind[entry[parent_index][0]]
2255.2.182 by Martin Pool
merge dirstate and trunk
1682
3146.8.4 by Aaron Bentley
Eliminate direct use of inventory from transform application
1683
    def stored_kind(self, file_id):
        """See Tree.stored_kind"""
        # For this tree the stored kind is simply what kind() reports.
        recorded_kind = self.kind(file_id)
        return recorded_kind
1686
2776.1.7 by Robert Collins
* New method on ``bzrlib.tree.Tree`` ``path_content_summary`` provides a
1687
    def path_content_summary(self, path):
        """See Tree.path_content_summary.

        :return: A 4-tuple. ('missing', None, None, None) when the path has
            no id in the inventory; (kind, text_size, executable, text_sha1)
            for files; (kind, None, None, symlink_target) for symlinks;
            (kind, None, None, None) for anything else.
        """
        file_id = self.inventory.path2id(path)
        if file_id is None:
            return ('missing', None, None, None)
        ie = self._inventory[file_id]
        kind = ie.kind
        if kind == 'file':
            return (kind, ie.text_size, ie.executable, ie.text_sha1)
        if kind == 'symlink':
            return (kind, None, None, ie.symlink_target)
        return (kind, None, None, None)
1700
2255.2.31 by Robert Collins
Work in progress to make merge_inner work with dirstate trees.
1701
    def is_executable(self, file_id, path=None):
        """Return the executable flag of file_id's inventory entry.

        :param path: Accepted but not used; the lookup is by file_id.
        :return: The entry's executable attribute for files, None for any
            other kind.
        """
        inv_entry = self.inventory[file_id]
        if inv_entry.kind == "file":
            return inv_entry.executable
        return None
1706
2255.2.71 by John Arbash Meinel
Add a test for list_files, and implement it for DirStateRevisionTree
1707
    def list_files(self, include_root=False):
        """Yield (path, 'V', kind, file_id, entry) for each inventory entry.

        A standard inventory-based implementation is used because this tree
        is one of the parents of the current state.

        :param include_root: When False and the inventory has a root, the
            first item produced by iter_entries() is skipped.
        """
        entry_iter = self._get_inventory().iter_entries()
        has_root = self.inventory.root is not None
        if has_root and not include_root:
            # Discard the first item of the iteration (the root).
            entry_iter.next()
        for path, inv_entry in entry_iter:
            yield path, 'V', inv_entry.kind, inv_entry.file_id, inv_entry
2255.2.84 by John Arbash Meinel
Remove now-unecessary encode/decode calls for revision ids.
1716
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1717
    def lock_read(self):
        """Lock the tree for a set of operations.

        The first lock taken read-locks the repository and, when the
        dirstate is not already locked (its _lock_token is None), the
        dirstate as well. Nested calls only increment the lock count.

        If locking the dirstate fails, the repository lock taken here is
        released again before the error propagates, so a failed lock_read
        does not leave the repository locked.
        """
        if not self._locked:
            self._repository.lock_read()
            if self._dirstate._lock_token is None:
                dirstate_locked = False
                try:
                    self._dirstate.lock_read()
                    dirstate_locked = True
                finally:
                    if not dirstate_locked:
                        # Undo the repository lock; the lock count was
                        # never incremented so unlock() would not do it.
                        self._repository.unlock()
                # Remember that this tree owns the dirstate lock so that
                # unlock() releases it.
                self._dirstate_locked = True
        self._locked += 1
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1725
2255.2.183 by Martin Pool
add missing _must_be_locked and a better message
1726
    def _must_be_locked(self):
1727
        if not self._locked:
1728
            raise errors.ObjectNotLocked(self)
1729
2255.2.98 by Robert Collins
Perform path2id lookups in dirstate revision trees from the dirstate index without requiring an inventory.
1730
    @needs_read_lock
    def path2id(self, path):
        """Return the id for path in this tree, or None if it has no entry."""
        # Look the path up directly in the dirstate: faster than splitting
        # it and walking the inventory.
        found = self._get_entry(path=path)
        if found != (None, None):
            # The entry key's third element is the file id.
            return found[0][2]
        return None
2255.2.65 by John Arbash Meinel
override path2id because it should be optimized anyway
1738
2255.2.3 by Robert Collins
Split out working tree format 4 to its own file, create stub dirstate revision object, start working on dirstate.set_parent_trees - a key failure point.
1739
    def unlock(self):
        """Unlock, freeing any cache memory used during the lock."""
        self._locked -= 1
        if self._locked:
            # The lock count has not reached zero: nothing to release yet.
            return
        # outside of a lock, the inventory is suspect: release it.
        self._inventory = None
        self._locked = 0
        if self._dirstate_locked:
            # Only release the dirstate when lock_read() took its lock.
            self._dirstate.unlock()
            self._dirstate_locked = False
        self._repository.unlock()
2255.2.69 by John Arbash Meinel
Implement annotate_iter, get_revision_id, and walkdirs so that all tree_implementations now pass
1750
3504.2.1 by John Arbash Meinel
Shortcut iter_references when we know references aren't supported.
1751
    @needs_read_lock
    def supports_tree_reference(self):
        """Return the stored _repo_supports_tree_reference flag."""
        supported = self._repo_supports_tree_reference
        return supported
1754
2255.2.69 by John Arbash Meinel
Implement annotate_iter, get_revision_id, and walkdirs so that all tree_implementations now pass
1755
    def walkdirs(self, prefix=""):
        """Walk the directories of this tree, starting at prefix.

        Yields ((relpath, file_id), dirblock) for each directory visited,
        where dirblock is a list of
        (path, name, kind, None, file_id, kind) tuples for its children as
        returned by sorted_children(). Nothing is yielded when prefix has
        no id in the inventory.
        """
        # TODO: jam 20070215 This is the lazy way by using the RevisionTree
        # implementation based on an inventory.
        # This should be cleaned up to use the much faster Dirstate code
        # So for now, we just build up the parent inventory, and extract
        # it the same way RevisionTree does.
        inv = self._get_inventory()
        top_id = inv.path2id(prefix)
        # Stack of (relpath, file_id) for directories still to be visited.
        pending = []
        if top_id is not None:
            pending.append((prefix, top_id))
        while pending:
            relpath, file_id = pending.pop()
            if relpath:
                relroot = relpath + '/'
            else:
                relroot = ""
            # FIXME: stash the node in pending
            dir_entry = inv[file_id]
            dirblock = [
                (relroot + name, name, child.kind, None,
                 child.file_id, child.kind)
                for name, child in dir_entry.sorted_children()]
            yield (relpath, dir_entry.file_id), dirblock
            # Push the directories left in dirblock after the yield; walking
            # it in reverse makes pop() visit them in forward order.
            for info in reversed(dirblock):
                if info[2] == 'directory':
                    pending.append((info[0], info[4]))
2255.2.117 by Robert Collins
Add an InterDirStateTree InterTree optimiser.
1788
1789
1790
class InterDirStateTree(InterTree):
2255.13.3 by Martin Pool
Comments and better assertions in InterDirStateTree
1791
    """Fast path optimiser for changes_from with dirstate trees.
1792
    
1793
    This is used only when both trees are in the dirstate working file, and 
1794
    the source is any parent within the dirstate, and the destination is 
1795
    the current working tree of the same dirstate.
1796
    """
1797
    # this could be generalized to allow comparisons between any trees in the
1798
    # dirstate, and possibly between trees stored in different dirstates.
2255.2.117 by Robert Collins
Add an InterDirStateTree InterTree optimiser.
1799
2255.2.122 by Robert Collins
Alter intertree implementation tests to let dirstate inter-trees be correctly parameterised.
1800
    def __init__(self, source, target):
        """Create an optimiser for comparing source against target.

        :raises Exception: if is_compatible() rejects the pair of trees.
        """
        super(InterDirStateTree, self).__init__(source, target)
        if not InterDirStateTree.is_compatible(source, target):
            # Call form of raise: same exception and message as the old
            # "raise Exception, msg" statement, valid on every Python.
            raise Exception(
                "invalid source %r and target %r" % (source, target))
1804
2255.2.117 by Robert Collins
Add an InterDirStateTree InterTree optimiser.
1805
    @staticmethod
    def make_source_parent_tree(source, target):
        """Change the source tree into a parent of the target.

        Commits source, fetches the new revision into target's repository
        and makes it target's only parent.

        :return: (target.basis_tree(), target)
        """
        new_revid = source.commit('record tree')
        target_repo = target.branch.repository
        target_repo.fetch(source.branch.repository, new_revid)
        target.set_parent_ids([new_revid])
        basis = target.basis_tree()
        return basis, target
2255.7.25 by John Arbash Meinel
Shave off 200+ ms of 'time bzr status' in lp tree
1812
2255.2.117 by Robert Collins
Add an InterDirStateTree InterTree optimiser.
1813
    _matching_from_tree_format = WorkingTreeFormat4()
1814
    _matching_to_tree_format = WorkingTreeFormat4()
2255.2.122 by Robert Collins
Alter intertree implementation tests to let dirstate inter-trees be correctly parameterised.
1815
    _test_mutable_trees_to_test_trees = make_source_parent_tree
1816
3254.1.1 by Aaron Bentley
Make Tree.iter_changes a public method
1817
    def iter_changes(self, include_unchanged=False,
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1818
                      specific_files=None, pb=None, extra_trees=[],
2255.7.85 by Robert Collins
Teach _iter_changes to gather unversioned path details upon request.
1819
                      require_versioned=True, want_unversioned=False):
2255.2.122 by Robert Collins
Alter intertree implementation tests to let dirstate inter-trees be correctly parameterised.
1820
        """Return the changes from source to target.
1821
3254.1.1 by Aaron Bentley
Make Tree.iter_changes a public method
1822
        :return: An iterator that yields tuples. See InterTree.iter_changes
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1823
            for details.
2255.2.122 by Robert Collins
Alter intertree implementation tests to let dirstate inter-trees be correctly parameterised.
1824
        :param specific_files: An optional list of file paths to restrict the
1825
            comparison to. When mapping filenames to ids, all matches in all
1826
            trees (including optional extra_trees) are used, and all children of
1827
            matched directories are included.
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1828
        :param include_unchanged: An optional boolean requesting the inclusion of
2255.2.122 by Robert Collins
Alter intertree implementation tests to let dirstate inter-trees be correctly parameterised.
1829
            unchanged entries in the result.
1830
        :param extra_trees: An optional list of additional trees to use when
1831
            mapping the contents of specific_files (paths) to file_ids.
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1832
        :param require_versioned: If True, all files in specific_files must be
1833
            versioned in one of source, target, extra_trees or
1834
            PathsNotVersionedError is raised.
2255.7.85 by Robert Collins
Teach _iter_changes to gather unversioned path details upon request.
1835
        :param want_unversioned: Should unversioned files be returned in the
1836
            output. An unversioned file is defined as one with (False, False)
1837
            for the versioned pair.
2255.2.122 by Robert Collins
Alter intertree implementation tests to let dirstate inter-trees be correctly parameterised.
1838
        """
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
1839
        utf8_decode = cache_utf8._utf8_decode
2255.7.31 by John Arbash Meinel
Minor cleanup.
1840
        _minikind_to_kind = dirstate.DirState._minikind_to_kind
2474.1.44 by John Arbash Meinel
Use cmp_by_dirs in _iter_changes, it saves a bit of time.
1841
        cmp_by_dirs = dirstate.cmp_by_dirs
2255.2.122 by Robert Collins
Alter intertree implementation tests to let dirstate inter-trees be correctly parameterised.
1842
        # NB: show_status depends on being able to pass in non-versioned files
1843
        # and report them as unknown
2255.2.155 by Martin Pool
Better assertion message from InterDirStateTree._iter_changes
1844
        # TODO: handle extra trees in the dirstate.
2974.2.1 by John Arbash Meinel
Re-enable the fast path for the no-parent commit case.
1845
        if (extra_trees or specific_files == []):
2255.2.155 by Martin Pool
Better assertion message from InterDirStateTree._iter_changes
1846
            # we can't fast-path these cases (yet)
3254.1.1 by Aaron Bentley
Make Tree.iter_changes a public method
1847
            for f in super(InterDirStateTree, self).iter_changes(
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1848
                include_unchanged, specific_files, pb, extra_trees,
2255.2.204 by Robert Collins
Fix info and status again.
1849
                require_versioned, want_unversioned=want_unversioned):
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1850
                yield f
1851
            return
2255.7.1 by John Arbash Meinel
_iter_changes should return Unicode paths.
1852
        parent_ids = self.target.get_parent_ids()
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
1853
        if not (self.source._revision_id in parent_ids
1854
                or self.source._revision_id == NULL_REVISION):
1855
            raise AssertionError(
1856
                "revision {%s} is not stored in {%s}, but %s "
1857
                "can only be used for trees stored in the dirstate"
1858
                % (self.source._revision_id, self.target, self.iter_changes))
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1859
        target_index = 0
2255.7.1 by John Arbash Meinel
_iter_changes should return Unicode paths.
1860
        if self.source._revision_id == NULL_REVISION:
1861
            source_index = None
1862
            indices = (target_index,)
1863
        else:
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
1864
            if not (self.source._revision_id in parent_ids):
1865
                raise AssertionError(
1866
                    "Failure: source._revision_id: %s not in target.parent_ids(%s)" % (
1867
                    self.source._revision_id, parent_ids))
2255.7.1 by John Arbash Meinel
_iter_changes should return Unicode paths.
1868
            source_index = 1 + parent_ids.index(self.source._revision_id)
2974.2.1 by John Arbash Meinel
Re-enable the fast path for the no-parent commit case.
1869
            indices = (source_index, target_index)
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1870
        # -- make all specific_files utf8 --
1871
        if specific_files:
1872
            specific_files_utf8 = set()
1873
            for path in specific_files:
1874
                specific_files_utf8.add(path.encode('utf8'))
1875
            specific_files = specific_files_utf8
1876
        else:
1877
            specific_files = set([''])
1878
        # -- specific_files is now a utf8 path set --
1879
        # -- get the state object and prepare it.
1880
        state = self.target.current_dirstate()
1881
        state._read_dirblocks_if_needed()
1882
        def _entries_for_path(path):
1883
            """Return a list with all the entries that match path for all ids.
1884
            """
1885
            dirname, basename = os.path.split(path)
1886
            key = (dirname, basename, '')
1887
            block_index, present = state._find_block_index_from_key(key)
1888
            if not present:
1889
                # the block which should contain path is absent.
1890
                return []
1891
            result = []
1892
            block = state._dirblocks[block_index][1]
1893
            entry_index, _ = state._find_entry_index(key, block)
1894
            # we may need to look at multiple entries at this path: walk while the specific_files match.
1895
            while (entry_index < len(block) and
1896
                block[entry_index][0][0:2] == key[0:2]):
1897
                result.append(block[entry_index])
1898
                entry_index += 1
1899
            return result
1900
        if require_versioned:
1901
            # -- check all supplied paths are versioned in a search tree. --
1902
            all_versioned = True
1903
            for path in specific_files:
1904
                path_entries = _entries_for_path(path)
1905
                if not path_entries:
1906
                    # this specified path is not present at all: error
1907
                    all_versioned = False
1908
                    break
1909
                found_versioned = False
1910
                # for each id at this path
1911
                for entry in path_entries:
1912
                    # for each tree.
2255.7.1 by John Arbash Meinel
_iter_changes should return Unicode paths.
1913
                    for index in indices:
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1914
                        if entry[1][index][0] != 'a': # absent
1915
                            found_versioned = True
1916
                            # all good: found a versioned cell
1917
                            break
1918
                if not found_versioned:
1919
                    # none of the indexes was not 'absent' at all ids for this
1920
                    # path.
1921
                    all_versioned = False
1922
                    break
1923
            if not all_versioned:
2255.7.62 by Robert Collins
Update the Tree.filter_unversioned_files docstring to reflect what the existing implementations actually do, and change the WorkingTree4 implementation to match a newly created test for it.
1924
                raise errors.PathsNotVersionedError(specific_files)
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1925
        # -- remove redundancy in supplied specific_files to prevent over-scanning --
1926
        search_specific_files = set()
1927
        for path in specific_files:
1928
            other_specific_files = specific_files.difference(set([path]))
1929
            if not osutils.is_inside_any(other_specific_files, path):
1930
                # this is a top level path, we must check it.
1931
                search_specific_files.add(path)
1932
        # sketch: 
1933
        # compare source_index and target_index at or under each element of search_specific_files.
1934
        # follow the following comparison table. Note that we only want to do diff operations when
1935
        # the target is fdl because thats when the walkdirs logic will have exposed the pathinfo 
1936
        # for the target.
1937
        # cases:
1938
        # 
1939
        # Source | Target | disk | action
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
1940
        #   r    | fdlt   |      | add source to search, add id path move and perform
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1941
        #        |        |      | diff check on source-target
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
1942
        #   r    | fdlt   |  a   | dangling file that was present in the basis. 
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1943
        #        |        |      | ???
1944
        #   r    |  a     |      | add source to search
1945
        #   r    |  a     |  a   | 
1946
        #   r    |  r     |      | this path is present in a non-examined tree, skip.
1947
        #   r    |  r     |  a   | this path is present in a non-examined tree, skip.
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
1948
        #   a    | fdlt   |      | add new id
1949
        #   a    | fdlt   |  a   | dangling locally added file, skip
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1950
        #   a    |  a     |      | not present in either tree, skip
1951
        #   a    |  a     |  a   | not present in any tree, skip
1952
        #   a    |  r     |      | not present in either tree at this path, skip as it
1953
        #        |        |      | may not be selected by the users list of paths.
1954
        #   a    |  r     |  a   | not present in either tree at this path, skip as it
1955
        #        |        |      | may not be selected by the users list of paths.
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
1956
        #  fdlt  | fdlt   |      | content in both: diff them
1957
        #  fdlt  | fdlt   |  a   | deleted locally, but not unversioned - show as deleted ?
1958
        #  fdlt  |  a     |      | unversioned: output deleted id for now
1959
        #  fdlt  |  a     |  a   | unversioned and deleted: output deleted id
1960
        #  fdlt  |  r     |      | relocated in this tree, so add target to search.
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1961
        #        |        |      | Don't diff, we will see an r,fd; pair when we reach
1962
        #        |        |      | this id at the other path.
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
1963
        #  fdlt  |  r     |  a   | relocated in this tree, so add target to search.
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1964
        #        |        |      | Don't diff, we will see an r,fd; pair when we reach
1965
        #        |        |      | this id at the other path.
1966
1967
        # for all search_indexs in each path at or under each element of
1968
        # search_specific_files, if the detail is relocated: add the id, and add the
1969
        # relocated path as one to search if it's not searched already. If the
1970
        # detail is not relocated, add the id.
1971
        searched_specific_files = set()
2255.7.1 by John Arbash Meinel
_iter_changes should return Unicode paths.
1972
        NULL_PARENT_DETAILS = dirstate.DirState.NULL_PARENT_DETAILS
2255.7.29 by John Arbash Meinel
approx 300ms of 'time bzr status' in lp tree by caching last parent info
1973
        # Using a list so that we can access the values and change them in
1974
        # nested scope. Each one is [dirname, parent_file_id]
2485.3.8 by John Arbash Meinel
Keep track of directories that you have seen.
1975
        last_source_parent = [None, None]
1976
        last_target_parent = [None, None]
2255.7.29 by John Arbash Meinel
approx 300ms of 'time bzr status' in lp tree by caching last parent info
1977
2255.2.192 by John Arbash Meinel
Add support for executable bit under win32
1978
        use_filesystem_for_exec = (sys.platform != 'win32')
1979
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
1980
        # Just a sentinel, so that _process_entry can say that this
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
1981
        # record is handled, but isn't interesting to process (unchanged)
1982
        uninteresting = object()
1983
2485.3.8 by John Arbash Meinel
Keep track of directories that you have seen.
1984
1985
        old_dirname_to_file_id = {}
1986
        new_dirname_to_file_id = {}
1987
        # TODO: jam 20070516 - Avoid the _get_entry lookup overhead by
1988
        #       keeping a cache of directories that we have seen.
1989
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
1990
        def _process_entry(entry, path_info):
1991
            """Compare an entry and real disk to generate delta information.
1992
1993
            :param path_info: top_relpath, basename, kind, lstat, abspath for
1994
                the path of entry. If None, then the path is considered absent.
1995
                (Perhaps we should pass in a concrete entry for this ?)
2255.7.80 by John Arbash Meinel
Don't decode the path entry until we've actually decided to return the tuple.
1996
                Basename is returned as a utf8 string because we expect this
1997
                tuple will be ignored, and don't want to take the time to
1998
                decode.
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
1999
            :return: None if these don't match
2000
                     A tuple of information about the change, or
2001
                     the object 'uninteresting' if these match, but are
2002
                     basically identical.
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2003
            """
2255.7.1 by John Arbash Meinel
_iter_changes should return Unicode paths.
2004
            if source_index is None:
2005
                source_details = NULL_PARENT_DETAILS
2006
            else:
2007
                source_details = entry[1][source_index]
2255.10.4 by John Arbash Meinel
do not update_entry from disk if it is supposed to be absent or renamed
2008
            target_details = entry[1][target_index]
2009
            target_minikind = target_details[0]
2255.13.3 by Martin Pool
Comments and better assertions in InterDirStateTree
2010
            if path_info is not None and target_minikind in 'fdlt':
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
2011
                if not (target_index == 0):
2012
                    raise AssertionError()
2255.10.3 by John Arbash Meinel
(broken) Change get_sha1_for_entry into update_entry
2013
                link_or_sha1 = state.update_entry(entry, abspath=path_info[4],
2014
                                                  stat_value=path_info[3])
2255.10.4 by John Arbash Meinel
do not update_entry from disk if it is supposed to be absent or renamed
2015
                # The entry may have been modified by update_entry
2016
                target_details = entry[1][target_index]
2017
                target_minikind = target_details[0]
2255.10.3 by John Arbash Meinel
(broken) Change get_sha1_for_entry into update_entry
2018
            else:
2019
                link_or_sha1 = None
2485.3.8 by John Arbash Meinel
Keep track of directories that you have seen.
2020
            file_id = entry[0][2]
2255.7.31 by John Arbash Meinel
Minor cleanup.
2021
            source_minikind = source_details[0]
2255.2.191 by Martin Pool
additional fix for subtree comparison
2022
            if source_minikind in 'fdltr' and target_minikind in 'fdlt':
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2023
                # claimed content in both: diff
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
2024
                #   r    | fdlt   |      | add source to search, add id path move and perform
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2025
                #        |        |      | diff check on source-target
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
2026
                #   r    | fdlt   |  a   | dangling file that was present in the basis.
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2027
                #        |        |      | ???
2255.7.31 by John Arbash Meinel
Minor cleanup.
2028
                if source_minikind in 'r':
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2029
                    # add the source to the search path to find any children it
2030
                    # has.  TODO ? : only add if it is a container ?
2255.7.31 by John Arbash Meinel
Minor cleanup.
2031
                    if not osutils.is_inside_any(searched_specific_files,
2032
                                                 source_details[1]):
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2033
                        search_specific_files.add(source_details[1])
2034
                    # generate the old path; this is needed for stating later
2035
                    # as well.
2036
                    old_path = source_details[1]
2037
                    old_dirname, old_basename = os.path.split(old_path)
2255.7.41 by John Arbash Meinel
WorkingTree.unversion() should not raise if unversioning a child and a parent.
2038
                    path = pathjoin(entry[0][0], entry[0][1])
2255.7.31 by John Arbash Meinel
Minor cleanup.
2039
                    old_entry = state._get_entry(source_index,
2040
                                                 path_utf8=old_path)
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2041
                    # update the source details variable to be the real
2042
                    # location.
3207.2.1 by jameinel
Add a test that _iter_changes raises a clearer error when we encounter an invalid rename.
2043
                    if old_entry == (None, None):
3221.1.3 by Martin Pool
Review cleanups for CorruptDirstate: use the path everywhere rather than the object, and use more standard phrasing.
2044
                        raise errors.CorruptDirstate(state._filename,
3207.2.1 by jameinel
Add a test that _iter_changes raises a clearer error when we encounter an invalid rename.
2045
                            "entry '%s/%s' is considered renamed from %r"
2046
                            " but source does not exist\n"
2047
                            "entry: %s" % (entry[0][0], entry[0][1], old_path, entry))
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2048
                    source_details = old_entry[1][source_index]
2255.7.31 by John Arbash Meinel
Minor cleanup.
2049
                    source_minikind = source_details[0]
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2050
                else:
2255.7.21 by John Arbash Meinel
Get iter_changes working again, by fixing set_parent_trees to
2051
                    old_dirname = entry[0][0]
2052
                    old_basename = entry[0][1]
2485.3.12 by John Arbash Meinel
Delay joining the path until we are actually going to be using it.
2053
                    old_path = path = None
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2054
                if path_info is None:
2055
                    # the file is missing on disk, show as removed.
2255.7.4 by Robert Collins
Test InterTree._iter_changes with missing (absent but versioned) files.
2056
                    content_change = True
2057
                    target_kind = None
2058
                    target_exec = False
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2059
                else:
2255.7.3 by Robert Collins
Add tests for _iter_changes with symlinks, disabled until unversioned file support is added, as that affects the test expected value.
2060
                    # source and target are both versioned and disk file is present.
2255.7.4 by Robert Collins
Test InterTree._iter_changes with missing (absent but versioned) files.
2061
                    target_kind = path_info[2]
2255.7.21 by John Arbash Meinel
Get iter_changes working again, by fixing set_parent_trees to
2062
                    if target_kind == 'directory':
2485.3.12 by John Arbash Meinel
Delay joining the path until we are actually going to be using it.
2063
                        if path is None:
2064
                            old_path = path = pathjoin(old_dirname, old_basename)
2485.3.8 by John Arbash Meinel
Keep track of directories that you have seen.
2065
                        new_dirname_to_file_id[path] = file_id
2255.7.31 by John Arbash Meinel
Minor cleanup.
2066
                        if source_minikind != 'd':
2255.7.3 by Robert Collins
Add tests for _iter_changes with symlinks, disabled until unversioned file support is added, as that affects the test expected value.
2067
                            content_change = True
2068
                        else:
2069
                            # directories have no fingerprint
2070
                            content_change = False
2255.7.4 by Robert Collins
Test InterTree._iter_changes with missing (absent but versioned) files.
2071
                        target_exec = False
2255.7.21 by John Arbash Meinel
Get iter_changes working again, by fixing set_parent_trees to
2072
                    elif target_kind == 'file':
2255.7.31 by John Arbash Meinel
Minor cleanup.
2073
                        if source_minikind != 'f':
2255.7.3 by Robert Collins
Add tests for _iter_changes with symlinks, disabled until unversioned file support is added, as that affects the test expected value.
2074
                            content_change = True
2075
                        else:
2255.10.3 by John Arbash Meinel
(broken) Change get_sha1_for_entry into update_entry
2076
                            # We could check the size, but we already have the
2077
                            # sha1 hash.
2078
                            content_change = (link_or_sha1 != source_details[1])
2255.10.5 by John Arbash Meinel
Fix a small bug when we have a symlink that does not need to be re-read.
2079
                        # Target details is updated at update_entry time
2255.2.192 by John Arbash Meinel
Add support for executable bit under win32
2080
                        if use_filesystem_for_exec:
2081
                            # We don't need S_ISREG here, because we are sure
2082
                            # we are dealing with a file.
2083
                            target_exec = bool(stat.S_IEXEC & path_info[3].st_mode)
2084
                        else:
2085
                            target_exec = target_details[3]
2255.7.21 by John Arbash Meinel
Get iter_changes working again, by fixing set_parent_trees to
2086
                    elif target_kind == 'symlink':
2255.7.31 by John Arbash Meinel
Minor cleanup.
2087
                        if source_minikind != 'l':
2255.7.3 by Robert Collins
Add tests for _iter_changes with symlinks, disabled until unversioned file support is added, as that affects the test expected value.
2088
                            content_change = True
2089
                        else:
2255.10.3 by John Arbash Meinel
(broken) Change get_sha1_for_entry into update_entry
2090
                            content_change = (link_or_sha1 != source_details[1])
2255.7.3 by Robert Collins
Add tests for _iter_changes with symlinks, disabled until unversioned file support is added, as that affects the test expected value.
2091
                        target_exec = False
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
2092
                    elif target_kind == 'tree-reference':
2093
                        if source_minikind != 't':
2094
                            content_change = True
2095
                        else:
2096
                            content_change = False
2255.2.214 by Robert Collins
Get _iter_changes on dirstate passing the subtree tests.
2097
                        target_exec = False
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2098
                    else:
2255.7.3 by Robert Collins
Add tests for _iter_changes with symlinks, disabled until unversioned file support is added, as that affects the test expected value.
2099
                        raise Exception, "unknown kind %s" % path_info[2]
2485.3.8 by John Arbash Meinel
Keep track of directories that you have seen.
2100
                if source_minikind == 'd':
2485.3.12 by John Arbash Meinel
Delay joining the path until we are actually going to be using it.
2101
                    if path is None:
2102
                        old_path = path = pathjoin(old_dirname, old_basename)
2103
                    old_dirname_to_file_id[old_path] = file_id
2255.7.4 by Robert Collins
Test InterTree._iter_changes with missing (absent but versioned) files.
2104
                # find the parent id in the source tree, then in the target tree
2255.7.29 by John Arbash Meinel
approx 300ms of 'time bzr status' in lp tree by caching last parent info
2105
                if old_dirname == last_source_parent[0]:
2106
                    source_parent_id = last_source_parent[1]
2107
                else:
2485.3.8 by John Arbash Meinel
Keep track of directories that you have seen.
2108
                    try:
2109
                        source_parent_id = old_dirname_to_file_id[old_dirname]
2110
                    except KeyError:
2111
                        source_parent_entry = state._get_entry(source_index,
2112
                                                               path_utf8=old_dirname)
2113
                        source_parent_id = source_parent_entry[0][2]
2255.7.29 by John Arbash Meinel
approx 300ms of 'time bzr status' in lp tree by caching last parent info
2114
                    if source_parent_id == entry[0][2]:
2115
                        # This is the root, so the parent is None
2116
                        source_parent_id = None
2255.7.30 by John Arbash Meinel
Don't cache the parent entry for root, since it is different than all other entries.
2117
                    else:
2118
                        last_source_parent[0] = old_dirname
2119
                        last_source_parent[1] = source_parent_id
2255.7.29 by John Arbash Meinel
approx 300ms of 'time bzr status' in lp tree by caching last parent info
2120
                new_dirname = entry[0][0]
2121
                if new_dirname == last_target_parent[0]:
2122
                    target_parent_id = last_target_parent[1]
2123
                else:
2485.3.8 by John Arbash Meinel
Keep track of directories that you have seen.
2124
                    try:
2125
                        target_parent_id = new_dirname_to_file_id[new_dirname]
2126
                    except KeyError:
2127
                        # TODO: We don't always need to do the lookup, because the
2128
                        #       parent entry will be the same as the source entry.
2129
                        target_parent_entry = state._get_entry(target_index,
2130
                                                               path_utf8=new_dirname)
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
2131
                        if target_parent_entry == (None, None):
2132
                            raise AssertionError(
2133
                                "Could not find target parent in wt: %s\nparent of: %s"
2134
                                % (new_dirname, entry))
2485.3.8 by John Arbash Meinel
Keep track of directories that you have seen.
2135
                        target_parent_id = target_parent_entry[0][2]
2255.7.25 by John Arbash Meinel
Shave off 200+ ms of 'time bzr status' in lp tree
2136
                    if target_parent_id == entry[0][2]:
2137
                        # This is the root, so the parent is None
2138
                        target_parent_id = None
2255.7.30 by John Arbash Meinel
Don't cache the parent entry for root, since it is different than all other entries.
2139
                    else:
2140
                        last_target_parent[0] = new_dirname
2141
                        last_target_parent[1] = target_parent_id
2255.7.29 by John Arbash Meinel
approx 300ms of 'time bzr status' in lp tree by caching last parent info
2142
2255.7.4 by Robert Collins
Test InterTree._iter_changes with missing (absent but versioned) files.
2143
                source_exec = source_details[3]
2485.3.4 by John Arbash Meinel
Change _process_entry to detect when we don't care about something.
2144
                if (include_unchanged
2145
                    or content_change
2146
                    or source_parent_id != target_parent_id
2147
                    or old_basename != entry[0][1]
2148
                    or source_exec != target_exec
2149
                    ):
2485.3.12 by John Arbash Meinel
Delay joining the path until we are actually going to be using it.
2150
                    if old_path is None:
2151
                        old_path = path = pathjoin(old_dirname, old_basename)
2152
                        old_path_u = utf8_decode(old_path)[0]
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2153
                        path_u = old_path_u
2154
                    else:
2485.3.12 by John Arbash Meinel
Delay joining the path until we are actually going to be using it.
2155
                        old_path_u = utf8_decode(old_path)[0]
2156
                        if old_path == path:
2157
                            path_u = old_path_u
2158
                        else:
2159
                            path_u = utf8_decode(path)[0]
2485.3.6 by John Arbash Meinel
Delay calling pathjoin() until we've figured out we're going to use it
2160
                    source_kind = _minikind_to_kind[source_minikind]
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2161
                    return (entry[0][2],
2162
                           (old_path_u, path_u),
2163
                           content_change,
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2164
                           (True, True),
2165
                           (source_parent_id, target_parent_id),
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2166
                           (utf8_decode(old_basename)[0], utf8_decode(entry[0][1])[0]),
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2167
                           (source_kind, target_kind),
2168
                           (source_exec, target_exec))
2485.3.4 by John Arbash Meinel
Change _process_entry to detect when we don't care about something.
2169
                else:
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2170
                    return uninteresting
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
2171
            elif source_minikind in 'a' and target_minikind in 'fdlt':
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2172
                # looks like a new file
2173
                if path_info is not None:
2255.7.41 by John Arbash Meinel
WorkingTree.unversion() should not raise if unversioning a child and a parent.
2174
                    path = pathjoin(entry[0][0], entry[0][1])
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2175
                    # parent id is the entry for the path in the target tree
2176
                    # TODO: these are the same for an entire directory: cache em.
2255.10.5 by John Arbash Meinel
Fix a small bug when we have a symlink that does not need to be re-read.
2177
                    parent_id = state._get_entry(target_index,
2178
                                                 path_utf8=entry[0][0])[0][2]
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2179
                    if parent_id == entry[0][2]:
2180
                        parent_id = None
2255.2.192 by John Arbash Meinel
Add support for executable bit under win32
2181
                    if use_filesystem_for_exec:
2182
                        # We need S_ISREG here, because we aren't sure if this
2183
                        # is a file or not.
2184
                        target_exec = bool(
2185
                            stat.S_ISREG(path_info[3].st_mode)
2186
                            and stat.S_IEXEC & path_info[3].st_mode)
2187
                    else:
2188
                        target_exec = target_details[3]
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2189
                    return (entry[0][2],
2190
                           (None, utf8_decode(path)[0]),
2191
                           True,
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2192
                           (False, True),
2193
                           (None, parent_id),
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2194
                           (None, utf8_decode(entry[0][1])[0]),
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2195
                           (None, path_info[2]),
2196
                           (None, target_exec))
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2197
                else:
2198
                    # but it's not on disk: we deliberately treat this as just
2199
                    # never-present. (Why ?! - RBC 20070224)
2200
                    pass
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
2201
            elif source_minikind in 'fdlt' and target_minikind in 'a':
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2202
                # unversioned, possibly, or possibly not deleted: we don't care.
2203
                # if it's still on disk, *and* there's no other entry at this
2204
                # path [we don't know this in this routine at the moment -
2205
                # perhaps we should change this - then it would be an unknown.
2255.7.41 by John Arbash Meinel
WorkingTree.unversion() should not raise if unversioning a child and a parent.
2206
                old_path = pathjoin(entry[0][0], entry[0][1])
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2207
                # parent id is the file id of the parent directory's entry in the source tree
2208
                parent_id = state._get_entry(source_index, path_utf8=entry[0][0])[0][2]
2209
                if parent_id == entry[0][2]:
2210
                    parent_id = None
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2211
                return (entry[0][2],
2212
                       (utf8_decode(old_path)[0], None),
2213
                       True,
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2214
                       (True, False),
2215
                       (parent_id, None),
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2216
                       (utf8_decode(entry[0][1])[0], None),
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2217
                       (_minikind_to_kind[source_minikind], None),
2218
                       (source_details[3], None))
2255.2.189 by Martin Pool
Add and fix up basic comparison of subtrees.
2219
            elif source_minikind in 'fdlt' and target_minikind in 'r':
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2220
                # a rename; could be a true rename, or a rename inherited from
2221
                # a renamed parent. TODO: handle this efficiently. It's not a
2222
                # common case to rename dirs though, so a correct but slow
2223
                # implementation will do.
2224
                if not osutils.is_inside_any(searched_specific_files, target_details[1]):
2225
                    search_specific_files.add(target_details[1])
1551.10.31 by Aaron Bentley
Fix WorkingTree4._iter_changes with pending merges and deleted files
2226
            elif source_minikind in 'ra' and target_minikind in 'ra':
2255.7.45 by Robert Collins
Handle the source and target paths both being relocated from another path in the tree - this is possible with a pending merge.
2227
                # neither of the selected trees contain this file,
2228
                # so skip over it. This is not currently directly tested, but
2229
                # is indirectly via test_too_much.TestCommands.test_conflicts.
2230
                pass
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2231
            else:
2255.13.3 by Martin Pool
Comments and better assertions in InterDirStateTree
2232
                raise AssertionError("don't know how to compare "
2233
                    "source_minikind=%r, target_minikind=%r"
2234
                    % (source_minikind, target_minikind))
2235
                ## import pdb;pdb.set_trace()
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2236
            return None
2323.4.2 by Robert Collins
Fix the behaviour of dirstate optimised iter_changes recursing its disk iterator into subtrees inappropriately.
2237
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2238
        while search_specific_files:
2255.2.236 by Martin Pool
Review cleanups: mostly updating or removing todo comments.
2239
            # TODO: the pending list should be lexically sorted?  the
2240
            # interface doesn't require it.
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2241
            current_root = search_specific_files.pop()
2360.1.2 by John Arbash Meinel
Add an overzealous test, for Unicode support of _iter_changes.
2242
            current_root_unicode = current_root.decode('utf8')
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2243
            searched_specific_files.add(current_root)
2244
            # process the entries for this containing directory: the rest will be
2245
            # found by their parents recursively.
2246
            root_entries = _entries_for_path(current_root)
2360.1.2 by John Arbash Meinel
Add an overzealous test, for Unicode support of _iter_changes.
2247
            root_abspath = self.target.abspath(current_root_unicode)
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2248
            try:
2249
                root_stat = os.lstat(root_abspath)
2250
            except OSError, e:
2251
                if e.errno == errno.ENOENT:
2255.2.151 by Robert Collins
Handle specific_files natively for WorkingTreeFormat4._iter_changes.
2252
                    # the path does not exist: let _process_entry know that.
2253
                    root_dir_info = None
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2254
                else:
2255
                    # some other random error: hand it up.
2256
                    raise
2255.2.151 by Robert Collins
Handle specific_files natively for WorkingTreeFormat4._iter_changes.
2257
            else:
2258
                root_dir_info = ('', current_root,
2259
                    osutils.file_kind_from_stat_mode(root_stat.st_mode), root_stat,
2260
                    root_abspath)
2255.2.214 by Robert Collins
Get _iter_changes on dirstate passing the subtree tests.
2261
                if root_dir_info[2] == 'directory':
2255.2.215 by Robert Collins
Hook directory-tree-reference detection into dirstate _iter_changes.
2262
                    if self.target._directory_is_tree_reference(
2263
                        current_root.decode('utf8')):
2255.2.214 by Robert Collins
Get _iter_changes on dirstate passing the subtree tests.
2264
                        root_dir_info = root_dir_info[:2] + \
2265
                            ('tree-reference',) + root_dir_info[3:]
2266
2255.2.151 by Robert Collins
Handle specific_files natively for WorkingTreeFormat4._iter_changes.
2267
            if not root_entries and not root_dir_info:
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2268
                # this specified path is not present at all, skip it.
2269
                continue
2255.7.85 by Robert Collins
Teach _iter_changes to gather unversioned path details upon request.
2270
            path_handled = False
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2271
            for entry in root_entries:
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2272
                result = _process_entry(entry, root_dir_info)
2273
                if result is not None:
2255.7.85 by Robert Collins
Teach _iter_changes to gather unversioned path details upon request.
2274
                    path_handled = True
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2275
                    if result is not uninteresting:
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2276
                        yield result
2360.1.2 by John Arbash Meinel
Add an overzealous test, for Unicode support of _iter_changes.
2277
            if want_unversioned and not path_handled and root_dir_info:
2255.7.85 by Robert Collins
Teach _iter_changes to gather unversioned path details upon request.
2278
                new_executable = bool(
2279
                    stat.S_ISREG(root_dir_info[3].st_mode)
2280
                    and stat.S_IEXEC & root_dir_info[3].st_mode)
2360.1.6 by John Arbash Meinel
Change utf8_decode_with_None to return what we care about.
2281
                yield (None,
2282
                       (None, current_root_unicode),
2283
                       True,
2284
                       (False, False),
2285
                       (None, None),
2286
                       (None, splitpath(current_root_unicode)[-1]),
2287
                       (None, root_dir_info[2]),
2288
                       (None, new_executable)
2289
                      )
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2290
            initial_key = (current_root, '', '')
2291
            block_index, _ = state._find_block_index_from_key(initial_key)
2292
            if block_index == 0:
2293
                # we have processed the total root already, but because the
2255.7.21 by John Arbash Meinel
Get iter_changes working again, by fixing set_parent_trees to
2294
                # initial key matched it we should skip it here.
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2295
                block_index +=1
2323.4.2 by Robert Collins
Fix the behaviour of dirstate optimised iter_changes recursing its disk iterator into subtrees inappropriately.
2296
            if root_dir_info and root_dir_info[2] == 'tree-reference':
2297
                current_dir_info = None
2298
            else:
2299
                dir_iterator = osutils._walkdirs_utf8(root_abspath, prefix=current_root)
2300
                try:
2301
                    current_dir_info = dir_iterator.next()
2363.1.2 by John Arbash Meinel
Clean up the error.
2302
                except OSError, e:
2363.1.4 by John Arbash Meinel
Handle ERROR_DIRECTORY for python 2.5
2303
                    # on win32, python2.4 has e.errno == ERROR_DIRECTORY, but
2304
                    # python 2.5 has e.errno == EINVAL,
2305
                    #            and e.winerror == ERROR_DIRECTORY
2306
                    e_winerror = getattr(e, 'winerror', None)
2408.1.5 by Alexander Belchenko
John's patch for WT4 on Windows+Python2.4
2307
                    win_errors = (ERROR_DIRECTORY, ERROR_PATH_NOT_FOUND)
2363.1.4 by John Arbash Meinel
Handle ERROR_DIRECTORY for python 2.5
2308
                    # there may be directories in the inventory even though
2309
                    # this path is not a file on disk: so mark it as end of
2310
                    # iterator
2311
                    if e.errno in (errno.ENOENT, errno.ENOTDIR, errno.EINVAL):
2312
                        current_dir_info = None
2313
                    elif (sys.platform == 'win32'
2408.1.5 by Alexander Belchenko
John's patch for WT4 on Windows+Python2.4
2314
                          and (e.errno in win_errors
2315
                               or e_winerror in win_errors)):
2323.4.2 by Robert Collins
Fix the behaviour of dirstate optimised iter_changes recursing its disk iterator into subtrees inappropriately.
2316
                        current_dir_info = None
2317
                    else:
2318
                        raise
2255.2.151 by Robert Collins
Handle specific_files natively for WorkingTreeFormat4._iter_changes.
2319
                else:
2323.4.2 by Robert Collins
Fix the behaviour of dirstate optimised iter_changes recursing its disk iterator into subtrees inappropriately.
2320
                    if current_dir_info[0][0] == '':
2321
                        # remove .bzr from iteration
2322
                        bzr_index = bisect_left(current_dir_info[1], ('.bzr',))
3376.2.4 by Martin Pool
Remove every assert statement from bzrlib!
2323
                        if current_dir_info[1][bzr_index][0] != '.bzr':
2324
                            raise AssertionError()
2323.4.2 by Robert Collins
Fix the behaviour of dirstate optimised iter_changes recursing its disk iterator into subtrees inappropriately.
2325
                        del current_dir_info[1][bzr_index]
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2326
            # walk until both the directory listing and the versioned metadata
2255.2.236 by Martin Pool
Review cleanups: mostly updating or removing todo comments.
2327
            # are exhausted. 
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2328
            if (block_index < len(state._dirblocks) and
2329
                osutils.is_inside(current_root, state._dirblocks[block_index][0])):
2330
                current_block = state._dirblocks[block_index]
2331
            else:
2332
                current_block = None
2333
            while (current_dir_info is not None or
2255.7.35 by John Arbash Meinel
Handle the case when a directory has been removed, and isn't the last entry.
2334
                   current_block is not None):
2335
                if (current_dir_info and current_block
2336
                    and current_dir_info[0][0] != current_block[0]):
2474.1.44 by John Arbash Meinel
Use cmp_by_dirs in _iter_changes, it saves a bit of time.
2337
                    if cmp_by_dirs(current_dir_info[0][0], current_block[0]) < 0:
2255.7.35 by John Arbash Meinel
Handle the case when a directory has been removed, and isn't the last entry.
2338
                        # filesystem data refers to paths not covered by the dirblock.
2255.7.6 by Robert Collins
Test for iterating changes past empty directories.
2339
                        # this has two possibilities:
2340
                        # A) it is versioned but empty, so there is no block for it
2341
                        # B) it is not versioned.
2402.2.2 by John Arbash Meinel
Fix _iter_changes to properly handle versioned (but empty) directories
2342
2343
                        # if (A) then we need to recurse into it to check for
2344
                        # new unknown files or directories.
2345
                        # if (B) then we should ignore it, because we don't
2346
                        # recurse into unknown directories.
2466.4.3 by John Arbash Meinel
Fix bug #110399 by changing _iter_changes to never descend into unknown directories.
2347
                        path_index = 0
2348
                        while path_index < len(current_dir_info[1]):
2349
                                current_path_info = current_dir_info[1][path_index]
2350
                                if want_unversioned:
2402.2.2 by John Arbash Meinel
Fix _iter_changes to properly handle versioned (but empty) directories
2351
                                    if current_path_info[2] == 'directory':
2352
                                        if self.target._directory_is_tree_reference(
2353
                                            current_path_info[0].decode('utf8')):
2354
                                            current_path_info = current_path_info[:2] + \
2355
                                                ('tree-reference',) + current_path_info[3:]
2356
                                    new_executable = bool(
2357
                                        stat.S_ISREG(current_path_info[3].st_mode)
2358
                                        and stat.S_IEXEC & current_path_info[3].st_mode)
2359
                                    yield (None,
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2360
                                        (None, utf8_decode(current_path_info[0])[0]),
2402.2.2 by John Arbash Meinel
Fix _iter_changes to properly handle versioned (but empty) directories
2361
                                        True,
2362
                                        (False, False),
2363
                                        (None, None),
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2364
                                        (None, utf8_decode(current_path_info[1])[0]),
2402.2.2 by John Arbash Meinel
Fix _iter_changes to properly handle versioned (but empty) directories
2365
                                        (None, current_path_info[2]),
2366
                                        (None, new_executable))
2466.4.3 by John Arbash Meinel
Fix bug #110399 by changing _iter_changes to never descend into unknown directories.
2367
                                # dont descend into this unversioned path if it is
2368
                                # a dir
2369
                                if current_path_info[2] in ('directory',
2370
                                                            'tree-reference'):
2371
                                    del current_dir_info[1][path_index]
2372
                                    path_index -= 1
2373
                                path_index += 1
2402.2.2 by John Arbash Meinel
Fix _iter_changes to properly handle versioned (but empty) directories
2374
2375
                        # This dir info has been handled, go to the next
2255.7.6 by Robert Collins
Test for iterating changes past empty directories.
2376
                        try:
2377
                            current_dir_info = dir_iterator.next()
2378
                        except StopIteration:
2379
                            current_dir_info = None
2255.7.35 by John Arbash Meinel
Handle the case when a directory has been removed, and isn't the last entry.
2380
                    else:
2381
                        # We have a dirblock entry for this location, but there
2382
                        # is no filesystem path for this. This is most likely
2383
                        # because a directory was removed from the disk.
2384
                        # We don't have to report the missing directory,
2385
                        # because that should have already been handled, but we
2386
                        # need to handle all of the files that are contained
2387
                        # within.
2388
                        for current_entry in current_block[1]:
2389
                            # entry referring to file not present on disk.
2390
                            # advance the entry only, after processing.
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2391
                            result = _process_entry(current_entry, None)
2392
                            if result is not None:
2393
                                if result is not uninteresting:
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2394
                                    yield result
2255.7.35 by John Arbash Meinel
Handle the case when a directory has been removed, and isn't the last entry.
2395
                        block_index +=1
2396
                        if (block_index < len(state._dirblocks) and
2397
                            osutils.is_inside(current_root,
2398
                                              state._dirblocks[block_index][0])):
2399
                            current_block = state._dirblocks[block_index]
2400
                        else:
2401
                            current_block = None
2255.7.7 by Robert Collins
continue iteration at the right point for InterDirStateTree._iter_changes.
2402
                    continue
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2403
                entry_index = 0
2404
                if current_block and entry_index < len(current_block[1]):
2405
                    current_entry = current_block[1][entry_index]
2406
                else:
2407
                    current_entry = None
2408
                advance_entry = True
2409
                path_index = 0
2410
                if current_dir_info and path_index < len(current_dir_info[1]):
2411
                    current_path_info = current_dir_info[1][path_index]
2255.2.214 by Robert Collins
Get _iter_changes on dirstate passing the subtree tests.
2412
                    if current_path_info[2] == 'directory':
2413
                        if self.target._directory_is_tree_reference(
2255.2.215 by Robert Collins
Hook directory-tree-reference detection into dirstate _iter_changes.
2414
                            current_path_info[0].decode('utf8')):
2255.2.214 by Robert Collins
Get _iter_changes on dirstate passing the subtree tests.
2415
                            current_path_info = current_path_info[:2] + \
2416
                                ('tree-reference',) + current_path_info[3:]
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2417
                else:
2418
                    current_path_info = None
2419
                advance_path = True
2255.7.85 by Robert Collins
Teach _iter_changes to gather unversioned path details upon request.
2420
                path_handled = False
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2421
                while (current_entry is not None or
2422
                    current_path_info is not None):
2423
                    if current_entry is None:
2255.7.85 by Robert Collins
Teach _iter_changes to gather unversioned path details upon request.
2424
                        # the check for path_handled when the path is advanced
2425
                        # will yield this path if needed.
2426
                        pass
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2427
                    elif current_path_info is None:
2428
                        # no path is fine: the per entry code will handle it.
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2429
                        result = _process_entry(current_entry, current_path_info)
2430
                        if result is not None:
2431
                            if result is not uninteresting:
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2432
                                yield result
2472.3.2 by John Arbash Meinel
Now that finding a file on disk which doesn't match
2433
                    elif (current_entry[0][1] != current_path_info[1]
2434
                          or current_entry[1][target_index][0] in 'ar'):
2435
                        # The current path on disk doesn't match the dirblock
2436
                        # record. Either the dirblock is marked as absent, or
2437
                        # the file on disk is not present at all in the
2438
                        # dirblock. Either way, report about the dirblock
2439
                        # entry, and let other code handle the filesystem one.
2598.2.1 by John Arbash Meinel
Update WT4._iter_changes to not split the basename, since it will
2440
2441
                        # Compare the basename for these files to determine
2442
                        # which comes first
2443
                        if current_path_info[1] < current_entry[0][1]:
2255.7.34 by John Arbash Meinel
Clean up test_bad_files, and fix a bug in _iter_changes when
2444
                            # extra file on disk: pass for now, but only
2445
                            # increment the path, not the entry
2446
                            advance_entry = False
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2447
                        else:
2448
                            # entry referring to file not present on disk.
2449
                            # advance the entry only, after processing.
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2450
                            result = _process_entry(current_entry, None)
2451
                            if result is not None:
2452
                                if result is not uninteresting:
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2453
                                    yield result
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2454
                            advance_path = False
2455
                    else:
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2456
                        result = _process_entry(current_entry, current_path_info)
2457
                        if result is not None:
2465.1.2 by John Arbash Meinel
Alternate fix for 'absent' entries.
2458
                            path_handled = True
2485.3.5 by John Arbash Meinel
switching to a single returned object from _process_entry is not faster
2459
                            if result is not uninteresting:
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2460
                                yield result
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2461
                    if advance_entry and current_entry is not None:
2462
                        entry_index += 1
2463
                        if entry_index < len(current_block[1]):
2464
                            current_entry = current_block[1][entry_index]
2465
                        else:
2466
                            current_entry = None
2467
                    else:
2468
                        advance_entry = True # reset the advance flaga
2469
                    if advance_path and current_path_info is not None:
2255.7.87 by Robert Collins
Dont walk unversioned directories in _iter_changes.
2470
                        if not path_handled:
2471
                            # unversioned in all regards
2255.7.85 by Robert Collins
Teach _iter_changes to gather unversioned path details upon request.
2472
                            if want_unversioned:
2255.7.87 by Robert Collins
Dont walk unversioned directories in _iter_changes.
2473
                                new_executable = bool(
2474
                                    stat.S_ISREG(current_path_info[3].st_mode)
2475
                                    and stat.S_IEXEC & current_path_info[3].st_mode)
3287.20.2 by John Arbash Meinel
Raise a clear error about the offending filename when there is a filename with bad characters.
2476
                                try:
2477
                                    relpath_unicode = utf8_decode(current_path_info[0])[0]
2478
                                except UnicodeDecodeError:
2479
                                    raise errors.BadFilenameEncoding(
2480
                                        current_path_info[0], osutils._fs_enc)
2402.2.2 by John Arbash Meinel
Fix _iter_changes to properly handle versioned (but empty) directories
2481
                                yield (None,
3287.20.2 by John Arbash Meinel
Raise a clear error about the offending filename when there is a filename with bad characters.
2482
                                    (None, relpath_unicode),
2402.2.2 by John Arbash Meinel
Fix _iter_changes to properly handle versioned (but empty) directories
2483
                                    True,
2484
                                    (False, False),
2485
                                    (None, None),
2485.3.9 by John Arbash Meinel
Now that we know when tuples will be yielded
2486
                                    (None, utf8_decode(current_path_info[1])[0]),
2402.2.2 by John Arbash Meinel
Fix _iter_changes to properly handle versioned (but empty) directories
2487
                                    (None, current_path_info[2]),
2488
                                    (None, new_executable))
2255.7.87 by Robert Collins
Dont walk unversioned directories in _iter_changes.
2489
                            # dont descend into this unversioned path if it is
2490
                            # a dir
2323.4.2 by Robert Collins
Fix the behaviour of dirstate optimised iter_changes recursing its disk iterator into subtrees inappropriately.
2491
                            if current_path_info[2] in ('directory'):
2255.7.87 by Robert Collins
Dont walk unversioned directories in _iter_changes.
2492
                                del current_dir_info[1][path_index]
2493
                                path_index -= 1
2323.4.2 by Robert Collins
Fix the behaviour of dirstate optimised iter_changes recursing its disk iterator into subtrees inappropriately.
2494
                        # dont descend the disk iterator into any tree 
2495
                        # paths.
2496
                        if current_path_info[2] == 'tree-reference':
2497
                            del current_dir_info[1][path_index]
2498
                            path_index -= 1
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2499
                        path_index += 1
2500
                        if path_index < len(current_dir_info[1]):
2501
                            current_path_info = current_dir_info[1][path_index]
2255.2.214 by Robert Collins
Get _iter_changes on dirstate passing the subtree tests.
2502
                            if current_path_info[2] == 'directory':
2503
                                if self.target._directory_is_tree_reference(
2255.2.215 by Robert Collins
Hook directory-tree-reference detection into dirstate _iter_changes.
2504
                                    current_path_info[0].decode('utf8')):
2255.2.214 by Robert Collins
Get _iter_changes on dirstate passing the subtree tests.
2505
                                    current_path_info = current_path_info[:2] + \
2506
                                        ('tree-reference',) + current_path_info[3:]
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2507
                        else:
2508
                            current_path_info = None
2255.7.85 by Robert Collins
Teach _iter_changes to gather unversioned path details upon request.
2509
                        path_handled = False
2255.2.149 by Robert Collins
Crufty but existing _iter_changes implementation for WorkingTreeFormat4.
2510
                    else:
2511
                        advance_path = True # reset the advance flagg.
2512
                if current_block is not None:
2513
                    block_index += 1
2514
                    if (block_index < len(state._dirblocks) and
2515
                        osutils.is_inside(current_root, state._dirblocks[block_index][0])):
2516
                        current_block = state._dirblocks[block_index]
2517
                    else:
2518
                        current_block = None
2519
                if current_dir_info is not None:
2520
                    try:
2521
                        current_dir_info = dir_iterator.next()
2522
                    except StopIteration:
2523
                        current_dir_info = None
2524
2255.2.117 by Robert Collins
Add an InterDirStateTree InterTree optimiser.
2525
2526
    @staticmethod
    def is_compatible(source, target):
        """Report whether this optimiser can handle the (source, target) pair.

        :param source: The candidate source tree.
        :param target: The candidate target tree.
        :return: True only when target is a WorkingTree4, source is a
            RevisionTree or DirStateRevisionTree, and the source revision is
            either NULL_REVISION or one of the ids returned by
            target.get_parent_ids(); False otherwise.
        """
        # The target has to be a dirstate based working tree.
        if not isinstance(target, WorkingTree4):
            return False
        # The source has to be a revision tree or a dirstate revision tree.
        acceptable_sources = (revisiontree.RevisionTree, DirStateRevisionTree)
        if not isinstance(source, acceptable_sources):
            return False
        # The source revision must be known to the target dirstate.
        source_revid = source._revision_id
        if source_revid == NULL_REVISION:
            return True
        # TODO: what about ghosts? it may well need to
        # check for them explicitly.
        return source_revid in target.get_parent_ids()
2542
2543
# Hand InterDirStateTree to InterTree.register_optimiser at import time.
# NOTE(review): presumably this lets InterTree pick InterDirStateTree for
# tree pairs accepted by InterDirStateTree.is_compatible -- confirm against
# the InterTree implementation.
InterTree.register_optimiser(InterDirStateTree)
2255.12.1 by Robert Collins
Implement upgrade for working trees.
2544
2545
2546
class Converter3to4(object):
    """Perform an in-place upgrade of format 3 to format 4 trees."""

    def __init__(self):
        # The format whose format string update_format() writes out.
        self.target_format = WorkingTreeFormat4()

    def convert(self, tree):
        """Upgrade tree in place to the target format.

        The steps run in order: re-read the working inventory, write the
        dirstate file, rewrite the format marker, then delete the old
        format 3 files.

        :param tree: The working tree to upgrade.
        """
        # lock the control files not the tree, so that we dont get tree
        # on-unlock behaviours, and so that no one else diddles with the
        # tree during upgrade.
        tree._control_files.lock_write()
        try:
            tree.read_working_inventory()
            self.create_dirstate_data(tree)
            self.update_format(tree)
            self.remove_xml_files(tree)
        finally:
            tree._control_files.unlock()

    def create_dirstate_data(self, tree):
        """Create the dirstate based data for tree.

        :param tree: The working tree whose contents are turned into a
            'dirstate' file inside its working tree control directory.
        """
        local_path = tree.bzrdir.get_workingtree_transport(None
            ).local_abspath('dirstate')
        state = dirstate.DirState.from_tree(tree, local_path)
        try:
            state.save()
        finally:
            # Always release the state, even when save() raises, so a failed
            # upgrade does not leave the dirstate file locked.
            state.unlock()

    def remove_xml_files(self, tree):
        """Remove the old format 3 data.

        :param tree: The working tree whose control transport holds the
            files to delete.
        """
        transport = tree.bzrdir.get_workingtree_transport(None)
        for path in ['basis-inventory-cache', 'inventory', 'last-revision',
            'pending-merges', 'stat-cache']:
            try:
                transport.delete(path)
            except errors.NoSuchFile:
                # some files are optional - just deal.
                pass

    def update_format(self, tree):
        """Change the format marker.

        Writes the target format's format string to the 'format' file on
        the tree's transport, using the file mode reported by the bzrdir.

        :param tree: The working tree whose format marker is rewritten.
        """
        tree._transport.put_bytes('format',
            self.target_format.get_format_string(),
            mode=tree.bzrdir._get_file_mode())