262
264
# return '%X.%X' % (int(st.st_mtime), st.st_mode)
267
class SHA1Provider(object):
    """An interface for getting sha1s of a file."""

    def sha1(self, abspath):
        """Return the sha1 of a file given its absolute path.

        :param abspath: May be a filesystem encoded absolute path
        :raises NotImplementedError: always; this base class only defines
            the interface and subclasses supply the implementation.
        """
        # The bound method is passed as the exception argument so the
        # failure names the exact method that was left unimplemented.
        raise NotImplementedError(self.sha1)

    def stat_and_sha1(self, abspath):
        """Return the stat and sha1 of a file given its absolute path.

        :param abspath: May be a filesystem encoded absolute path

        Note: the stat should be the stat of the physical file
        while the sha may be the sha of its canonical content.

        :raises NotImplementedError: always; this base class only defines
            the interface and subclasses supply the implementation.
        """
        raise NotImplementedError(self.stat_and_sha1)
290
class DefaultSHA1Provider(SHA1Provider):
    """A SHA1Provider that reads directly from the filesystem."""

    def sha1(self, abspath):
        """Return the sha1 of a file given its absolute path.

        :param abspath: Absolute path of the file; handed unchanged to
            osutils.sha_file_by_name.
        """
        return osutils.sha_file_by_name(abspath)

    def stat_and_sha1(self, abspath):
        """Return the stat and sha1 of a file given its absolute path.

        The stat is taken with os.fstat on the descriptor of the very file
        object that is then hashed, so both values come from one open
        handle.

        :param abspath: Absolute path of the file; opened in binary mode.
        :return: A (statvalue, sha1) tuple.
        """
        file_obj = open(abspath, 'rb')
        try:
            statvalue = os.fstat(file_obj.fileno())
            sha1 = osutils.sha_file(file_obj)
        finally:
            # Always release the descriptor, including when the stat or the
            # hashing raises.
            file_obj.close()
        return statvalue, sha1
265
308
class DirState(object):
266
309
"""Record directory and metadata state for fast access.
415
461
raise AssertionError(
416
462
"must be a utf8 file_id not %s" % (type(file_id), ))
417
463
# Make sure the file_id does not exist in this tree
418
file_id_entry = self._get_entry(0, fileid_utf8=file_id)
465
file_id_entry = self._get_entry(0, fileid_utf8=file_id, include_deleted=True)
419
466
if file_id_entry != (None, None):
420
path = osutils.pathjoin(file_id_entry[0][0], file_id_entry[0][1])
421
kind = DirState._minikind_to_kind[file_id_entry[1][0][0]]
422
info = '%s:%s' % (kind, path)
423
raise errors.DuplicateFileId(file_id, info)
467
if file_id_entry[1][0][0] == 'a':
468
if file_id_entry[0] != (dirname, basename, file_id):
469
# set the old name's current operation to rename
470
self.update_minimal(file_id_entry[0],
476
rename_from = file_id_entry[0][0:2]
478
path = osutils.pathjoin(file_id_entry[0][0], file_id_entry[0][1])
479
kind = DirState._minikind_to_kind[file_id_entry[1][0][0]]
480
info = '%s:%s' % (kind, path)
481
raise errors.DuplicateFileId(file_id, info)
424
482
first_key = (dirname, basename, '')
425
483
block_index, present = self._find_block_index_from_key(first_key)
427
485
# check the path is not in the tree
428
486
block = self._dirblocks[block_index][1]
429
487
entry_index, _ = self._find_entry_index(first_key, block)
430
while (entry_index < len(block) and
488
while (entry_index < len(block) and
431
489
block[entry_index][0][0:2] == first_key[0:2]):
432
490
if block[entry_index][1][0][0] not in 'ar':
433
491
# this path is in the dirstate in the current tree.
1211
1278
def update_by_delta(self, delta):
1212
1279
"""Apply an inventory delta to the dirstate for tree 0
1281
This is the workhorse for apply_inventory_delta in dirstate based
1214
1284
:param delta: An inventory delta. See Inventory.apply_delta for
1217
1287
self._read_dirblocks_if_needed()
1288
encode = cache_utf8.encode
1218
1289
insertions = {}
1220
for old_path, new_path, file_id, inv_entry in sorted(delta, reverse=True):
1291
# Accumulate parent references (path_utf8, id), to check for parentless
1292
# items or items placed under files/links/tree-references. We get
1293
# references from every item in the delta that is not a deletion and
1294
# is not itself the root.
1296
# Added ids must not be in the dirstate already. This set holds those
1299
# This loop transforms the delta to single atomic operations that can
1300
# be executed and validated.
1301
for old_path, new_path, file_id, inv_entry in sorted(
1302
inventory._check_delta_unique_old_paths(
1303
inventory._check_delta_unique_new_paths(
1304
inventory._check_delta_ids_match_entry(
1305
inventory._check_delta_ids_are_valid(
1306
inventory._check_delta_new_path_entry_both_or_None(delta))))),
1221
1308
if (file_id in insertions) or (file_id in removals):
1222
raise AssertionError("repeated file id in delta %r" % (file_id,))
1309
raise errors.InconsistentDelta(old_path or new_path, file_id,
1223
1311
if old_path is not None:
1224
1312
old_path = old_path.encode('utf-8')
1225
1313
removals[file_id] = old_path
1315
new_ids.add(file_id)
1226
1316
if new_path is not None:
1317
if inv_entry is None:
1318
raise errors.InconsistentDelta(new_path, file_id,
1319
"new_path with no entry")
1227
1320
new_path = new_path.encode('utf-8')
1228
dirname, basename = osutils.split(new_path)
1229
key = (dirname, basename, file_id)
1321
dirname_utf8, basename = osutils.split(new_path)
1323
parents.add((dirname_utf8, inv_entry.parent_id))
1324
key = (dirname_utf8, basename, file_id)
1230
1325
minikind = DirState._kind_to_minikind[inv_entry.kind]
1231
1326
if minikind == 't':
1232
fingerprint = inv_entry.reference_revision
1327
fingerprint = inv_entry.reference_revision or ''
1234
1329
fingerprint = ''
1235
1330
insertions[file_id] = (key, minikind, inv_entry.executable,
1244
1339
minikind = child[1][0][0]
1245
1340
fingerprint = child[1][0][4]
1246
1341
executable = child[1][0][3]
1247
old_child_path = osutils.pathjoin(child[0][0],
1342
old_child_path = osutils.pathjoin(child_dirname,
1249
1344
removals[child[0][2]] = old_child_path
1250
1345
child_suffix = child_dirname[len(old_path):]
1251
1346
new_child_dirname = (new_path + child_suffix)
1252
1347
key = (new_child_dirname, child_basename, child[0][2])
1253
new_child_path = os.path.join(new_child_dirname,
1348
new_child_path = osutils.pathjoin(new_child_dirname,
1255
1350
insertions[child[0][2]] = (key, minikind, executable,
1256
1351
fingerprint, new_child_path)
1257
self._apply_removals(removals.values())
1258
self._apply_insertions(insertions.values())
1352
self._check_delta_ids_absent(new_ids, delta, 0)
1354
self._apply_removals(removals.iteritems())
1355
self._apply_insertions(insertions.values())
1357
self._after_delta_check_parents(parents, 0)
1358
except errors.BzrError, e:
1359
self._changes_aborted = True
1360
if 'integrity error' not in str(e):
1362
# _get_entry raises BzrError when a request is inconsistent; we
1363
# want such errors to be shown as InconsistentDelta - and that
1364
# fits the behaviour we trigger.
1365
raise errors.InconsistentDeltaDelta(delta, "error from _get_entry.")
1260
1367
def _apply_removals(self, removals):
1261
for path in sorted(removals, reverse=True):
1368
for file_id, path in sorted(removals, reverse=True,
1369
key=operator.itemgetter(1)):
1262
1370
dirname, basename = osutils.split(path)
1263
1371
block_i, entry_i, d_present, f_present = \
1264
1372
self._get_block_entry_index(dirname, basename, 0)
1265
entry = self._dirblocks[block_i][1][entry_i]
1374
entry = self._dirblocks[block_i][1][entry_i]
1376
self._changes_aborted = True
1377
raise errors.InconsistentDelta(path, file_id,
1378
"Wrong path for old path.")
1379
if not f_present or entry[1][0][0] in 'ar':
1380
self._changes_aborted = True
1381
raise errors.InconsistentDelta(path, file_id,
1382
"Wrong path for old path.")
1383
if file_id != entry[0][2]:
1384
self._changes_aborted = True
1385
raise errors.InconsistentDelta(path, file_id,
1386
"Attempt to remove path has wrong id - found %r."
1266
1388
self._make_absent(entry)
1267
1389
# See if we have a malformed delta: deleting a directory must not
1268
1390
# leave crud behind. This increases the number of bisects needed
1276
1398
# be due to it being in a parent tree, or a corrupt delta.
1277
1399
for child_entry in self._dirblocks[block_i][1]:
1278
1400
if child_entry[1][0][0] not in ('r', 'a'):
1401
self._changes_aborted = True
1279
1402
raise errors.InconsistentDelta(path, entry[0][2],
1280
1403
"The file id was deleted but its children were "
1281
1404
"not deleted.")
1283
1406
def _apply_insertions(self, adds):
1284
for key, minikind, executable, fingerprint, path_utf8 in sorted(adds):
1285
self.update_minimal(key, minikind, executable, fingerprint,
1286
path_utf8=path_utf8)
1408
for key, minikind, executable, fingerprint, path_utf8 in sorted(adds):
1409
self.update_minimal(key, minikind, executable, fingerprint,
1410
path_utf8=path_utf8)
1411
except errors.NotVersionedError:
1412
self._changes_aborted = True
1413
raise errors.InconsistentDelta(path_utf8.decode('utf8'), key[2],
1288
1416
def update_basis_by_delta(self, delta, new_revid):
1289
1417
"""Update the parents of this tree after a commit.
1333
1461
# At the same time, to reduce interface friction we convert the input
1334
1462
# inventory entries to dirstate.
1335
1463
root_only = ('', '')
1464
# Accumulate parent references (path_utf8, id), to check for parentless
1465
# items or items placed under files/links/tree-references. We get
1466
# references from every item in the delta that is not a deletion and
1467
# is not itself the root.
1469
# Added ids must not be in the dirstate already. This set holds those
1336
1472
for old_path, new_path, file_id, inv_entry in delta:
1473
if inv_entry is not None and file_id != inv_entry.file_id:
1474
raise errors.InconsistentDelta(new_path, file_id,
1475
"mismatched entry file_id %r" % inv_entry)
1476
if new_path is not None:
1477
if inv_entry is None:
1478
raise errors.InconsistentDelta(new_path, file_id,
1479
"new_path with no entry")
1480
new_path_utf8 = encode(new_path)
1481
# note the parent for validation
1482
dirname_utf8, basename_utf8 = osutils.split(new_path_utf8)
1484
parents.add((dirname_utf8, inv_entry.parent_id))
1337
1485
if old_path is None:
1338
1486
adds.append((None, encode(new_path), file_id,
1339
1487
inv_to_entry(inv_entry), True))
1488
new_ids.add(file_id)
1340
1489
elif new_path is None:
1341
1490
deletes.append((encode(old_path), None, file_id, None, True))
1342
1491
elif (old_path, new_path) != root_only:
1386
1534
# of everything.
1387
1535
changes.append((encode(old_path), encode(new_path), file_id,
1388
1536
inv_to_entry(inv_entry)))
1390
# Finish expunging deletes/first half of renames.
1391
self._update_basis_apply_deletes(deletes)
1392
# Reinstate second half of renames and new paths.
1393
self._update_basis_apply_adds(adds)
1394
# Apply in-situ changes.
1395
self._update_basis_apply_changes(changes)
1537
self._check_delta_ids_absent(new_ids, delta, 1)
1539
# Finish expunging deletes/first half of renames.
1540
self._update_basis_apply_deletes(deletes)
1541
# Reinstate second half of renames and new paths.
1542
self._update_basis_apply_adds(adds)
1543
# Apply in-situ changes.
1544
self._update_basis_apply_changes(changes)
1546
self._after_delta_check_parents(parents, 1)
1547
except errors.BzrError, e:
1548
self._changes_aborted = True
1549
if 'integrity error' not in str(e):
1551
# _get_entry raises BzrError when a request is inconsistent; we
1552
# want such errors to be shown as InconsistentDelta - and that
1553
# fits the behaviour we trigger. Part of this is driven by dirstate
1554
# only supporting deltas that turn the basis into a closer fit to
1556
raise errors.InconsistentDeltaDelta(delta, "error from _get_entry.")
1397
1558
self._dirblock_state = DirState.IN_MEMORY_MODIFIED
1398
1559
self._header_state = DirState.IN_MEMORY_MODIFIED
1399
1560
self._id_index = None
1563
def _check_delta_ids_absent(self, new_ids, delta, tree_index):
1564
"""Check that none of the file_ids in new_ids are present in a tree."""
1567
id_index = self._get_id_index()
1568
for file_id in new_ids:
1569
for key in id_index.get(file_id, []):
1570
block_i, entry_i, d_present, f_present = \
1571
self._get_block_entry_index(key[0], key[1], tree_index)
1573
# In a different tree
1575
entry = self._dirblocks[block_i][1][entry_i]
1576
if entry[0][2] != file_id:
1577
# Different file_id, so not what we want.
1579
# NB: No changes made before this helper is called, so no need
1580
# to set the _changes_aborted flag.
1581
raise errors.InconsistentDelta(
1582
("%s/%s" % key[0:2]).decode('utf8'), file_id,
1583
"This file_id is new in the delta but already present in "
1402
1586
def _update_basis_apply_adds(self, adds):
1403
1587
"""Apply a sequence of adds to tree 1 during update_basis_by_delta.
1507
1692
# it is being resurrected here, so blank it out temporarily.
1508
1693
self._dirblocks[block_index][1][entry_index][1][1] = null
1695
def _after_delta_check_parents(self, parents, index):
    """Check that parents required by the delta are all intact.

    :param parents: An iterable of (path_utf8, file_id) tuples which are
        required to be present in tree 'index' at path_utf8 with id file_id
    :param index: The column in the dirstate to check for parents in.
    :raises errors.InconsistentDelta: if a required parent has no entry in
        tree 'index', or its minikind there is not 'd'. In both cases
        self._changes_aborted is set to True before raising.
    """
    for dirname_utf8, file_id in parents:
        # Get the entry - this ensures that file_id, dirname_utf8 exists and
        # has the right file id.
        entry = self._get_entry(index, file_id, dirname_utf8)
        if entry[1] is None:
            self._changes_aborted = True
            raise errors.InconsistentDelta(dirname_utf8.decode('utf8'),
                file_id, "This parent is not present.")
        # Parents of things must be directories
        if entry[1][index][0] != 'd':
            self._changes_aborted = True
            raise errors.InconsistentDelta(dirname_utf8.decode('utf8'),
                file_id, "This parent is not a directory.")
1510
1717
def _observed_sha1(self, entry, sha1, stat_value,
1511
1718
_stat_to_minikind=_stat_to_minikind, _pack_stat=pack_stat):
1512
1719
"""Note the sha1 of a file.
2120
2356
self.update_minimal(('', '', new_id), 'd',
2121
2357
path_utf8='', packed_stat=entry[1][0][4])
2122
2358
self._dirblock_state = DirState.IN_MEMORY_MODIFIED
2123
if self._id_index is not None:
2124
self._id_index.setdefault(new_id, set()).add(entry[0])
2126
2360
def set_parent_trees(self, trees, ghosts):
2127
2361
"""Set the parent trees for the dirstate.
2129
2363
:param trees: A list of revision_id, tree tuples. tree must be provided
2130
even if the revision_id refers to a ghost: supply an empty tree in
2364
even if the revision_id refers to a ghost: supply an empty tree in
2132
2366
:param ghosts: A list of the revision_ids that are ghosts at the time
2135
# TODO: generate a list of parent indexes to preserve to save
2369
# TODO: generate a list of parent indexes to preserve to save
2136
2370
# processing specific parent trees. In the common case one tree will
2137
2371
# be preserved - the left most parent.
2138
2372
# TODO: if the parent tree is a dirstate, we might want to walk them
2369
2620
and new_entry_key[1:] < current_old[0][1:])):
2370
2621
# new comes before:
2371
2622
# add an entry for this and advance new
2624
trace.mutter("Inserting from new '%s'.",
2625
new_path_utf8.decode('utf8'))
2372
2626
self.update_minimal(new_entry_key, current_new_minikind,
2373
2627
executable=current_new[1].executable,
2374
path_utf8=new_path_utf8, fingerprint=fingerprint)
2628
path_utf8=new_path_utf8, fingerprint=fingerprint,
2375
2630
current_new = advance(new_iterator)
2377
2632
# we've advanced past the place where the old key would be,
2378
2633
# without seeing it in the new list. so it must be gone.
2635
trace.mutter("Deleting from old '%s/%s'.",
2636
current_old[0][0].decode('utf8'),
2637
current_old[0][1].decode('utf8'))
2379
2638
self._make_absent(current_old)
2380
2639
current_old = advance(old_iterator)
2381
2640
self._dirblock_state = DirState.IN_MEMORY_MODIFIED
2382
2641
self._id_index = None
2383
2642
self._packed_stat_index = None
2644
trace.mutter("set_state_from_inventory complete.")
2385
2646
def _make_absent(self, current_old):
2386
2647
"""Mark current_old - an entry - as absent for tree 0.
2476
2757
# grab one of them and use it to generate parent
2477
2758
# relocation/absent entries.
2478
2759
new_entry = key, [new_details]
2479
for other_key in existing_keys:
2760
# existing_keys can be changed as we iterate.
2761
for other_key in tuple(existing_keys):
2480
2762
# change the record at other to be a pointer to this new
2481
2763
# record. The loop looks similar to the change to
2482
2764
# relocations when updating an existing record but it's not:
2483
2765
# the test for existing kinds is different: this can be
2484
2766
# factored out to a helper though.
2485
other_block_index, present = self._find_block_index_from_key(other_key)
2487
raise AssertionError('could not find block for %s' % (other_key,))
2488
other_entry_index, present = self._find_entry_index(other_key,
2489
self._dirblocks[other_block_index][1])
2491
raise AssertionError('could not find entry for %s' % (other_key,))
2767
other_block_index, present = self._find_block_index_from_key(
2770
raise AssertionError('could not find block for %s' % (
2772
other_block = self._dirblocks[other_block_index][1]
2773
other_entry_index, present = self._find_entry_index(
2774
other_key, other_block)
2776
raise AssertionError(
2777
'update_minimal: could not find other entry for %s'
2492
2779
if path_utf8 is None:
2493
2780
raise AssertionError('no path')
2494
self._dirblocks[other_block_index][1][other_entry_index][1][0] = \
2495
('r', path_utf8, 0, False, '')
2781
# Turn this other location into a reference to the new
2782
# location. This also updates the aliased iterator
2783
# (current_old in set_state_from_inventory) so that the old
2784
# entry, if not already examined, is skipped over by that
2786
other_entry = other_block[other_entry_index]
2787
other_entry[1][0] = ('r', path_utf8, 0, False, '')
2788
self._maybe_remove_row(other_block, other_entry_index,
2792
# adds a tuple to the new details for each column
2793
# - either by copying an existing relocation pointer inside that column
2794
# - or by creating a new pointer to the right row inside that column
2497
2795
num_present_parents = self._num_present_parents()
2796
if num_present_parents:
2797
other_key = list(existing_keys)[0]
2498
2798
for lookup_index in xrange(1, num_present_parents + 1):
2499
2799
# grab any one entry, use it to find the right path.
2500
# TODO: optimise this to reduce memory use in highly
2800
# TODO: optimise this to reduce memory use in highly
2501
2801
# fragmented situations by reusing the relocation
2503
2803
update_block_index, present = \
2840
3167
False, DirState.NULLSTAT)
2841
3168
state._dirblock_state = DirState.IN_MEMORY_MODIFIED
2842
3169
return link_or_sha1
2843
update_entry = py_update_entry
2846
3172
class ProcessEntryPython(object):
2848
__slots__ = ["old_dirname_to_file_id", "new_dirname_to_file_id", "uninteresting",
3174
__slots__ = ["old_dirname_to_file_id", "new_dirname_to_file_id",
2849
3175
"last_source_parent", "last_target_parent", "include_unchanged",
2850
"use_filesystem_for_exec", "utf8_decode", "searched_specific_files",
2851
"search_specific_files", "state", "source_index", "target_index",
2852
"want_unversioned", "tree"]
3176
"partial", "use_filesystem_for_exec", "utf8_decode",
3177
"searched_specific_files", "search_specific_files",
3178
"searched_exact_paths", "search_specific_file_parents", "seen_ids",
3179
"state", "source_index", "target_index", "want_unversioned", "tree"]
2854
3181
def __init__(self, include_unchanged, use_filesystem_for_exec,
2855
3182
search_specific_files, state, source_index, target_index,
2856
3183
want_unversioned, tree):
2857
3184
self.old_dirname_to_file_id = {}
2858
3185
self.new_dirname_to_file_id = {}
2859
# Just a sentry, so that _process_entry can say that this
2860
# record is handled, but isn't interesting to process (unchanged)
2861
self.uninteresting = object()
3186
# Are we doing a partial iter_changes?
3187
self.partial = search_specific_files != set([''])
2862
3188
# Using a list so that we can access the values and change them in
2863
3189
# nested scope. Each one is [path, file_id, entry]
2864
3190
self.last_source_parent = [None, None]
2867
3193
self.use_filesystem_for_exec = use_filesystem_for_exec
2868
3194
self.utf8_decode = cache_utf8._utf8_decode
2869
3195
# for all search_indexs in each path at or under each element of
2870
# search_specific_files, if the detail is relocated: add the id, and add the
2871
# relocated path as one to search if its not searched already. If the
2872
# detail is not relocated, add the id.
3196
# search_specific_files, if the detail is relocated: add the id, and
3197
# add the relocated path as one to search if it's not searched already.
3198
# If the detail is not relocated, add the id.
2873
3199
self.searched_specific_files = set()
3200
# When we search exact paths without expanding downwards, we record
3202
self.searched_exact_paths = set()
2874
3203
self.search_specific_files = search_specific_files
3204
# The parents up to the root of the paths we are searching.
3205
# After all normal paths are returned, these specific items are returned.
3206
self.search_specific_file_parents = set()
3207
# The ids we've sent out in the delta.
3208
self.seen_ids = set()
2875
3209
self.state = state
2876
3210
self.source_index = source_index
2877
3211
self.target_index = target_index
3212
if target_index != 0:
3213
# A lot of code in here depends on target_index == 0
3214
raise errors.BzrError('unsupported target index')
2878
3215
self.want_unversioned = want_unversioned
2879
3216
self.tree = tree
2882
3219
"""Compare an entry and real disk to generate delta information.
2884
3221
:param path_info: top_relpath, basename, kind, lstat, abspath for
2885
the path of entry. If None, then the path is considered absent.
2886
(Perhaps we should pass in a concrete entry for this ?)
3222
the path of entry. If None, then the path is considered absent in
3223
the target (Perhaps we should pass in a concrete entry for this ?)
2887
3224
Basename is returned as a utf8 string because we expect this
2888
3225
tuple will be ignored, and don't want to take the time to
2890
:return: None if these don't match
2891
A tuple of information about the change, or
2892
the object 'uninteresting' if these match, but are
2893
basically identical.
3227
:return: (iter_changes_result, changed). If the entry has not been
3228
handled then changed is None. Otherwise it is False if no content
3229
or metadata changes have occurred, and True if any content or
3230
metadata change has occurred. If self.include_unchanged is True then
3231
if changed is not None, iter_changes_result will always be a result
3232
tuple. Otherwise, iter_changes_result is None unless changed is
2895
3235
if self.source_index is None:
2896
3236
source_details = DirState.NULL_PARENT_DETAILS
2964
3304
if source_minikind != 'f':
2965
3305
content_change = True
2967
# If the size is the same, check the sha:
2968
if target_details[2] == source_details[2]:
2969
if link_or_sha1 is None:
2971
file_obj = file(path_info[4], 'rb')
2973
statvalue = os.fstat(file_obj.fileno())
2974
link_or_sha1 = osutils.sha_file(file_obj)
2977
self.state._observed_sha1(entry, link_or_sha1,
2979
content_change = (link_or_sha1 != source_details[1])
2981
# Size changed, so must be different
2982
content_change = True
3307
# Check the sha. We can't just rely on the size as
3308
# content filtering may mean different sizes actually
3309
# map to the same content
3310
if link_or_sha1 is None:
3312
statvalue, link_or_sha1 = \
3313
self.state._sha1_provider.stat_and_sha1(
3315
self.state._observed_sha1(entry, link_or_sha1,
3317
content_change = (link_or_sha1 != source_details[1])
2983
3318
# Target details is updated at update_entry time
2984
3319
if self.use_filesystem_for_exec:
2985
3320
# We don't need S_ISREG here, because we are sure
3144
3481
"source_minikind=%r, target_minikind=%r"
3145
3482
% (source_minikind, target_minikind))
3146
3483
## import pdb;pdb.set_trace()
3149
3486
def __iter__(self):
3489
def _gather_result_for_consistency(self, result):
3490
"""Check a result we will yield to make sure we are consistent later.
3492
This gathers result's parents into a set to output later.
3494
:param result: A result tuple.
3496
if not self.partial or not result[0]:
3498
self.seen_ids.add(result[0])
3499
new_path = result[1][1]
3501
# Not the root and not a delete: queue up the parents of the path.
3502
self.search_specific_file_parents.update(
3503
osutils.parent_directories(new_path.encode('utf8')))
3504
# Add the root directory which parent_directories does not
3506
self.search_specific_file_parents.add('')
3152
3508
def iter_changes(self):
3153
3509
"""Iterate over the changes."""
3154
3510
utf8_decode = cache_utf8._utf8_decode
3155
3511
_cmp_by_dirs = cmp_by_dirs
3156
3512
_process_entry = self._process_entry
3157
uninteresting = self.uninteresting
3158
3513
search_specific_files = self.search_specific_files
3159
3514
searched_specific_files = self.searched_specific_files
3160
3515
splitpath = osutils.splitpath
3162
3517
# compare source_index and target_index at or under each element of search_specific_files.
3163
3518
# follow the following comparison table. Note that we only want to do diff operations when
3164
# the target is fdl because thats when the walkdirs logic will have exposed the pathinfo
3519
# the target is fdl because thats when the walkdirs logic will have exposed the pathinfo
3165
3520
# for the target.
3168
3523
# Source | Target | disk | action
3169
3524
# r | fdlt | | add source to search, add id path move and perform
3170
3525
# | | | diff check on source-target
3171
# r | fdlt | a | dangling file that was present in the basis.
3526
# r | fdlt | a | dangling file that was present in the basis.
3173
3528
# r | a | | add source to search
3175
3530
# r | r | | this path is present in a non-examined tree, skip.
3176
3531
# r | r | a | this path is present in a non-examined tree, skip.
3177
3532
# a | fdlt | | add new id
3482
3847
current_dir_info = dir_iterator.next()
3483
3848
except StopIteration:
3484
3849
current_dir_info = None
3485
_process_entry = ProcessEntryPython
3850
for result in self._iter_specific_file_parents():
3853
def _iter_specific_file_parents(self):
3854
"""Iter over the specific file parents."""
3855
while self.search_specific_file_parents:
3856
# Process the parent directories for the paths we were iterating.
3857
# Even in extremely large trees this should be modest, so currently
3858
# no attempt is made to optimise.
3859
path_utf8 = self.search_specific_file_parents.pop()
3860
if osutils.is_inside_any(self.searched_specific_files, path_utf8):
3861
# We've examined this path.
3863
if path_utf8 in self.searched_exact_paths:
3864
# We've examined this path.
3866
path_entries = self.state._entries_for_path(path_utf8)
3867
# We need either one or two entries. If the path in
3868
# self.target_index has moved (so the entry in source_index is in
3869
# 'ar') then we need to also look for the entry for this path in
3870
# self.source_index, to output the appropriate delete-or-rename.
3871
selected_entries = []
3873
for candidate_entry in path_entries:
3874
# Find entries present in target at this path:
3875
if candidate_entry[1][self.target_index][0] not in 'ar':
3877
selected_entries.append(candidate_entry)
3878
# Find entries present in source at this path:
3879
elif (self.source_index is not None and
3880
candidate_entry[1][self.source_index][0] not in 'ar'):
3882
if candidate_entry[1][self.target_index][0] == 'a':
3883
# Deleted, emit it here.
3884
selected_entries.append(candidate_entry)
3886
# renamed, emit it when we process the directory it
3888
self.search_specific_file_parents.add(
3889
candidate_entry[1][self.target_index][1])
3891
raise AssertionError(
3892
"Missing entry for specific path parent %r, %r" % (
3893
path_utf8, path_entries))
3894
path_info = self._path_info(path_utf8, path_utf8.decode('utf8'))
3895
for entry in selected_entries:
3896
if entry[0][2] in self.seen_ids:
3898
result, changed = self._process_entry(entry, path_info)
3900
raise AssertionError(
3901
"Got entry<->path mismatch for specific path "
3902
"%r entry %r path_info %r " % (
3903
path_utf8, entry, path_info))
3904
# Only include changes - we're outside the users requested
3907
self._gather_result_for_consistency(result)
3908
if (result[6][0] == 'directory' and
3909
result[6][1] != 'directory'):
3910
# This stopped being a directory, the old children have
3912
if entry[1][self.source_index][0] == 'r':
3913
# renamed, take the source path
3914
entry_path_utf8 = entry[1][self.source_index][1]
3916
entry_path_utf8 = path_utf8
3917
initial_key = (entry_path_utf8, '', '')
3918
block_index, _ = self.state._find_block_index_from_key(
3920
if block_index == 0:
3921
# The children of the root are in block index 1.
3923
current_block = None
3924
if block_index < len(self.state._dirblocks):
3925
current_block = self.state._dirblocks[block_index]
3926
if not osutils.is_inside(
3927
entry_path_utf8, current_block[0]):
3928
# No entries for this directory at all.
3929
current_block = None
3930
if current_block is not None:
3931
for entry in current_block[1]:
3932
if entry[1][self.source_index][0] in 'ar':
3933
# Not in the source tree, so doesn't have to be
3936
# Path of the entry itself.
3938
self.search_specific_file_parents.add(
3939
osutils.pathjoin(*entry[0][:2]))
3940
if changed or self.include_unchanged:
3942
self.searched_exact_paths.add(path_utf8)
3944
def _path_info(self, utf8_path, unicode_path):
3945
"""Generate path_info for unicode_path.
3947
:return: None if unicode_path does not exist, or a path_info tuple.
3949
abspath = self.tree.abspath(unicode_path)
3951
stat = os.lstat(abspath)
3953
if e.errno == errno.ENOENT:
3954
# the path does not exist.
3958
utf8_basename = utf8_path.rsplit('/', 1)[-1]
3959
dir_info = (utf8_path, utf8_basename,
3960
osutils.file_kind_from_stat_mode(stat.st_mode), stat,
3962
if dir_info[2] == 'directory':
3963
if self.tree._directory_is_tree_reference(
3965
self.root_dir_info = self.root_dir_info[:2] + \
3966
('tree-reference',) + self.root_dir_info[3:]
3488
3970
# Try to load the compiled form if possible
3490
from bzrlib._dirstate_helpers_c import (
3491
_read_dirblocks_c as _read_dirblocks,
3492
bisect_dirblock_c as bisect_dirblock,
3493
_bisect_path_left_c as _bisect_path_left,
3494
_bisect_path_right_c as _bisect_path_right,
3495
cmp_by_dirs_c as cmp_by_dirs,
3972
from bzrlib._dirstate_helpers_pyx import (
3496
3978
ProcessEntryC as _process_entry,
3497
3979
update_entry as update_entry,
3981
except ImportError, e:
3982
osutils.failed_to_load_extension(e)
3500
3983
from bzrlib._dirstate_helpers_py import (
3501
_read_dirblocks_py as _read_dirblocks,
3502
bisect_dirblock_py as bisect_dirblock,
3503
_bisect_path_left_py as _bisect_path_left,
3504
_bisect_path_right_py as _bisect_path_right,
3505
cmp_by_dirs_py as cmp_by_dirs,
3990
# FIXME: It would be nice to be able to track moved lines so that the
3991
# corresponding python code can be moved to the _dirstate_helpers_py
3992
# module. I don't want to break the history for this important piece of
3993
# code so I left the code here -- vila 20090622
3994
update_entry = py_update_entry
3995
_process_entry = ProcessEntryPython