264
262
# return '%X.%X' % (int(st.st_mtime), st.st_mode)
267
class SHA1Provider(object):
268
"""An interface for getting sha1s of a file."""
270
def sha1(self, abspath):
271
"""Return the sha1 of a file given its absolute path.
273
:param abspath: May be a filesystem encoded absolute path
276
raise NotImplementedError(self.sha1)
278
def stat_and_sha1(self, abspath):
279
"""Return the stat and sha1 of a file given its absolute path.
281
:param abspath: May be a filesystem encoded absolute path
284
Note: the stat should be the stat of the physical file
285
while the sha may be the sha of its canonical content.
287
raise NotImplementedError(self.stat_and_sha1)
290
class DefaultSHA1Provider(SHA1Provider):
291
"""A SHA1Provider that reads directly from the filesystem."""
293
def sha1(self, abspath):
294
"""Return the sha1 of a file given its absolute path."""
295
return osutils.sha_file_by_name(abspath)
297
def stat_and_sha1(self, abspath):
298
"""Return the stat and sha1 of a file given its absolute path."""
299
file_obj = file(abspath, 'rb')
301
statvalue = os.fstat(file_obj.fileno())
302
sha1 = osutils.sha_file(file_obj)
305
return statvalue, sha1
308
265
class DirState(object):
309
266
"""Record directory and metadata state for fast access.
461
415
raise AssertionError(
462
416
"must be a utf8 file_id not %s" % (type(file_id), ))
463
417
# Make sure the file_id does not exist in this tree
465
file_id_entry = self._get_entry(0, fileid_utf8=file_id, include_deleted=True)
418
file_id_entry = self._get_entry(0, fileid_utf8=file_id)
466
419
if file_id_entry != (None, None):
467
if file_id_entry[1][0][0] == 'a':
468
if file_id_entry[0] != (dirname, basename, file_id):
469
# set the old name's current operation to rename
470
self.update_minimal(file_id_entry[0],
476
rename_from = file_id_entry[0][0:2]
478
path = osutils.pathjoin(file_id_entry[0][0], file_id_entry[0][1])
479
kind = DirState._minikind_to_kind[file_id_entry[1][0][0]]
480
info = '%s:%s' % (kind, path)
481
raise errors.DuplicateFileId(file_id, info)
420
path = osutils.pathjoin(file_id_entry[0][0], file_id_entry[0][1])
421
kind = DirState._minikind_to_kind[file_id_entry[1][0][0]]
422
info = '%s:%s' % (kind, path)
423
raise errors.DuplicateFileId(file_id, info)
482
424
first_key = (dirname, basename, '')
483
425
block_index, present = self._find_block_index_from_key(first_key)
485
427
# check the path is not in the tree
486
428
block = self._dirblocks[block_index][1]
487
429
entry_index, _ = self._find_entry_index(first_key, block)
488
while (entry_index < len(block) and
430
while (entry_index < len(block) and
489
431
block[entry_index][0][0:2] == first_key[0:2]):
490
432
if block[entry_index][1][0][0] not in 'ar':
491
433
# this path is in the dirstate in the current tree.
1278
1211
def update_by_delta(self, delta):
1279
1212
"""Apply an inventory delta to the dirstate for tree 0
1281
This is the workhorse for apply_inventory_delta in dirstate based
1284
1214
:param delta: An inventory delta. See Inventory.apply_delta for
1287
1217
self._read_dirblocks_if_needed()
1288
encode = cache_utf8.encode
1289
1218
insertions = {}
1291
# Accumulate parent references (path_utf8, id), to check for parentless
1292
# items or items placed under files/links/tree-references. We get
1293
# references from every item in the delta that is not a deletion and
1294
# is not itself the root.
1296
# Added ids must not be in the dirstate already. This set holds those
1299
# This loop transforms the delta to single atomic operations that can
1300
# be executed and validated.
1301
for old_path, new_path, file_id, inv_entry in sorted(
1302
inventory._check_delta_unique_old_paths(
1303
inventory._check_delta_unique_new_paths(
1304
inventory._check_delta_ids_match_entry(
1305
inventory._check_delta_ids_are_valid(
1306
inventory._check_delta_new_path_entry_both_or_None(delta))))),
1220
for old_path, new_path, file_id, inv_entry in sorted(delta, reverse=True):
1308
1221
if (file_id in insertions) or (file_id in removals):
1309
raise errors.InconsistentDelta(old_path or new_path, file_id,
1222
raise AssertionError("repeated file id in delta %r" % (file_id,))
1311
1223
if old_path is not None:
1312
1224
old_path = old_path.encode('utf-8')
1313
1225
removals[file_id] = old_path
1315
new_ids.add(file_id)
1316
1226
if new_path is not None:
1317
if inv_entry is None:
1318
raise errors.InconsistentDelta(new_path, file_id,
1319
"new_path with no entry")
1320
1227
new_path = new_path.encode('utf-8')
1321
dirname_utf8, basename = osutils.split(new_path)
1323
parents.add((dirname_utf8, inv_entry.parent_id))
1324
key = (dirname_utf8, basename, file_id)
1228
dirname, basename = osutils.split(new_path)
1229
key = (dirname, basename, file_id)
1325
1230
minikind = DirState._kind_to_minikind[inv_entry.kind]
1326
1231
if minikind == 't':
1327
fingerprint = inv_entry.reference_revision or ''
1232
fingerprint = inv_entry.reference_revision
1329
1234
fingerprint = ''
1330
1235
insertions[file_id] = (key, minikind, inv_entry.executable,
1339
1244
minikind = child[1][0][0]
1340
1245
fingerprint = child[1][0][4]
1341
1246
executable = child[1][0][3]
1342
old_child_path = osutils.pathjoin(child_dirname,
1247
old_child_path = osutils.pathjoin(child[0][0],
1344
1249
removals[child[0][2]] = old_child_path
1345
1250
child_suffix = child_dirname[len(old_path):]
1346
1251
new_child_dirname = (new_path + child_suffix)
1347
1252
key = (new_child_dirname, child_basename, child[0][2])
1348
new_child_path = osutils.pathjoin(new_child_dirname,
1253
new_child_path = os.path.join(new_child_dirname,
1350
1255
insertions[child[0][2]] = (key, minikind, executable,
1351
1256
fingerprint, new_child_path)
1352
self._check_delta_ids_absent(new_ids, delta, 0)
1354
self._apply_removals(removals.iteritems())
1355
self._apply_insertions(insertions.values())
1357
self._after_delta_check_parents(parents, 0)
1358
except errors.BzrError, e:
1359
self._changes_aborted = True
1360
if 'integrity error' not in str(e):
1362
# _get_entry raises BzrError when a request is inconsistent; we
1363
# want such errors to be shown as InconsistentDelta - and that
1364
# fits the behaviour we trigger.
1365
raise errors.InconsistentDeltaDelta(delta, "error from _get_entry.")
1257
self._apply_removals(removals.values())
1258
self._apply_insertions(insertions.values())
1367
1260
def _apply_removals(self, removals):
1368
for file_id, path in sorted(removals, reverse=True,
1369
key=operator.itemgetter(1)):
1261
for path in sorted(removals, reverse=True):
1370
1262
dirname, basename = osutils.split(path)
1371
1263
block_i, entry_i, d_present, f_present = \
1372
1264
self._get_block_entry_index(dirname, basename, 0)
1374
entry = self._dirblocks[block_i][1][entry_i]
1376
self._changes_aborted = True
1377
raise errors.InconsistentDelta(path, file_id,
1378
"Wrong path for old path.")
1379
if not f_present or entry[1][0][0] in 'ar':
1380
self._changes_aborted = True
1381
raise errors.InconsistentDelta(path, file_id,
1382
"Wrong path for old path.")
1383
if file_id != entry[0][2]:
1384
self._changes_aborted = True
1385
raise errors.InconsistentDelta(path, file_id,
1386
"Attempt to remove path has wrong id - found %r."
1265
entry = self._dirblocks[block_i][1][entry_i]
1388
1266
self._make_absent(entry)
1389
1267
# See if we have a malformed delta: deleting a directory must not
1390
1268
# leave crud behind. This increases the number of bisects needed
1398
1276
# be due to it being in a parent tree, or a corrupt delta.
1399
1277
for child_entry in self._dirblocks[block_i][1]:
1400
1278
if child_entry[1][0][0] not in ('r', 'a'):
1401
self._changes_aborted = True
1402
1279
raise errors.InconsistentDelta(path, entry[0][2],
1403
1280
"The file id was deleted but its children were "
1404
1281
"not deleted.")
1406
1283
def _apply_insertions(self, adds):
1408
for key, minikind, executable, fingerprint, path_utf8 in sorted(adds):
1409
self.update_minimal(key, minikind, executable, fingerprint,
1410
path_utf8=path_utf8)
1411
except errors.NotVersionedError:
1412
self._changes_aborted = True
1413
raise errors.InconsistentDelta(path_utf8.decode('utf8'), key[2],
1284
for key, minikind, executable, fingerprint, path_utf8 in sorted(adds):
1285
self.update_minimal(key, minikind, executable, fingerprint,
1286
path_utf8=path_utf8)
1416
1288
def update_basis_by_delta(self, delta, new_revid):
1417
1289
"""Update the parents of this tree after a commit.
1461
1333
# At the same time, to reduce interface friction we convert the input
1462
1334
# inventory entries to dirstate.
1463
1335
root_only = ('', '')
1464
# Accumulate parent references (path_utf8, id), to check for parentless
1465
# items or items placed under files/links/tree-references. We get
1466
# references from every item in the delta that is not a deletion and
1467
# is not itself the root.
1469
# Added ids must not be in the dirstate already. This set holds those
1472
1336
for old_path, new_path, file_id, inv_entry in delta:
1473
if inv_entry is not None and file_id != inv_entry.file_id:
1474
raise errors.InconsistentDelta(new_path, file_id,
1475
"mismatched entry file_id %r" % inv_entry)
1476
if new_path is not None:
1477
if inv_entry is None:
1478
raise errors.InconsistentDelta(new_path, file_id,
1479
"new_path with no entry")
1480
new_path_utf8 = encode(new_path)
1481
# note the parent for validation
1482
dirname_utf8, basename_utf8 = osutils.split(new_path_utf8)
1484
parents.add((dirname_utf8, inv_entry.parent_id))
1485
1337
if old_path is None:
1486
1338
adds.append((None, encode(new_path), file_id,
1487
1339
inv_to_entry(inv_entry), True))
1488
new_ids.add(file_id)
1489
1340
elif new_path is None:
1490
1341
deletes.append((encode(old_path), None, file_id, None, True))
1491
1342
elif (old_path, new_path) != root_only:
1534
1386
# of everything.
1535
1387
changes.append((encode(old_path), encode(new_path), file_id,
1536
1388
inv_to_entry(inv_entry)))
1537
self._check_delta_ids_absent(new_ids, delta, 1)
1539
# Finish expunging deletes/first half of renames.
1540
self._update_basis_apply_deletes(deletes)
1541
# Reinstate second half of renames and new paths.
1542
self._update_basis_apply_adds(adds)
1543
# Apply in-situ changes.
1544
self._update_basis_apply_changes(changes)
1546
self._after_delta_check_parents(parents, 1)
1547
except errors.BzrError, e:
1548
self._changes_aborted = True
1549
if 'integrity error' not in str(e):
1551
# _get_entry raises BzrError when a request is inconsistent; we
1552
# want such errors to be shown as InconsistentDelta - and that
1553
# fits the behaviour we trigger. Part of this is driven by dirstate
1554
# only supporting deltas that turn the basis into a closer fit to
1556
raise errors.InconsistentDeltaDelta(delta, "error from _get_entry.")
1390
# Finish expunging deletes/first half of renames.
1391
self._update_basis_apply_deletes(deletes)
1392
# Reinstate second half of renames and new paths.
1393
self._update_basis_apply_adds(adds)
1394
# Apply in-situ changes.
1395
self._update_basis_apply_changes(changes)
1558
1397
self._dirblock_state = DirState.IN_MEMORY_MODIFIED
1559
1398
self._header_state = DirState.IN_MEMORY_MODIFIED
1560
1399
self._id_index = None
1563
def _check_delta_ids_absent(self, new_ids, delta, tree_index):
1564
"""Check that none of the file_ids in new_ids are present in a tree."""
1567
id_index = self._get_id_index()
1568
for file_id in new_ids:
1569
for key in id_index.get(file_id, []):
1570
block_i, entry_i, d_present, f_present = \
1571
self._get_block_entry_index(key[0], key[1], tree_index)
1573
# In a different tree
1575
entry = self._dirblocks[block_i][1][entry_i]
1576
if entry[0][2] != file_id:
1577
# Different file_id, so not what we want.
1579
# NB: No changes made before this helper is called, so no need
1580
# to set the _changes_aborted flag.
1581
raise errors.InconsistentDelta(
1582
("%s/%s" % key[0:2]).decode('utf8'), file_id,
1583
"This file_id is new in the delta but already present in "
1586
1402
def _update_basis_apply_adds(self, adds):
1587
1403
"""Apply a sequence of adds to tree 1 during update_basis_by_delta.
1692
1507
# it is being resurrected here, so blank it out temporarily.
1693
1508
self._dirblocks[block_index][1][entry_index][1][1] = null
1695
def _after_delta_check_parents(self, parents, index):
1696
"""Check that parents required by the delta are all intact.
1698
:param parents: An iterable of (path_utf8, file_id) tuples which are
1699
required to be present in tree 'index' at path_utf8 with id file_id
1701
:param index: The column in the dirstate to check for parents in.
1703
for dirname_utf8, file_id in parents:
1704
# Get the entry - this ensures that file_id, dirname_utf8 exists and
1705
# has the right file id.
1706
entry = self._get_entry(index, file_id, dirname_utf8)
1707
if entry[1] is None:
1708
self._changes_aborted = True
1709
raise errors.InconsistentDelta(dirname_utf8.decode('utf8'),
1710
file_id, "This parent is not present.")
1711
# Parents of things must be directories
1712
if entry[1][index][0] != 'd':
1713
self._changes_aborted = True
1714
raise errors.InconsistentDelta(dirname_utf8.decode('utf8'),
1715
file_id, "This parent is not a directory.")
1717
1510
def _observed_sha1(self, entry, sha1, stat_value,
1718
1511
_stat_to_minikind=_stat_to_minikind, _pack_stat=pack_stat):
1719
1512
"""Note the sha1 of a file.
2356
2120
self.update_minimal(('', '', new_id), 'd',
2357
2121
path_utf8='', packed_stat=entry[1][0][4])
2358
2122
self._dirblock_state = DirState.IN_MEMORY_MODIFIED
2123
if self._id_index is not None:
2124
self._id_index.setdefault(new_id, set()).add(entry[0])
2360
2126
def set_parent_trees(self, trees, ghosts):
2361
2127
"""Set the parent trees for the dirstate.
2363
2129
:param trees: A list of revision_id, tree tuples. tree must be provided
2364
even if the revision_id refers to a ghost: supply an empty tree in
2130
even if the revision_id refers to a ghost: supply an empty tree in
2366
2132
:param ghosts: A list of the revision_ids that are ghosts at the time
2369
# TODO: generate a list of parent indexes to preserve to save
2135
# TODO: generate a list of parent indexes to preserve to save
2370
2136
# processing specific parent trees. In the common case one tree will
2371
2137
# be preserved - the left most parent.
2372
2138
# TODO: if the parent tree is a dirstate, we might want to walk them
2620
2369
and new_entry_key[1:] < current_old[0][1:])):
2621
2370
# new comes before:
2622
2371
# add an entry for this and advance new
2624
trace.mutter("Inserting from new '%s'.",
2625
new_path_utf8.decode('utf8'))
2626
2372
self.update_minimal(new_entry_key, current_new_minikind,
2627
2373
executable=current_new[1].executable,
2628
path_utf8=new_path_utf8, fingerprint=fingerprint,
2374
path_utf8=new_path_utf8, fingerprint=fingerprint)
2630
2375
current_new = advance(new_iterator)
2632
2377
# we've advanced past the place where the old key would be,
2633
2378
# without seeing it in the new list. so it must be gone.
2635
trace.mutter("Deleting from old '%s/%s'.",
2636
current_old[0][0].decode('utf8'),
2637
current_old[0][1].decode('utf8'))
2638
2379
self._make_absent(current_old)
2639
2380
current_old = advance(old_iterator)
2640
2381
self._dirblock_state = DirState.IN_MEMORY_MODIFIED
2641
2382
self._id_index = None
2642
2383
self._packed_stat_index = None
2644
trace.mutter("set_state_from_inventory complete.")
2646
2385
def _make_absent(self, current_old):
2647
2386
"""Mark current_old - an entry - as absent for tree 0.
2757
2476
# grab one of them and use it to generate parent
2758
2477
# relocation/absent entries.
2759
2478
new_entry = key, [new_details]
2760
# existing_keys can be changed as we iterate.
2761
for other_key in tuple(existing_keys):
2479
for other_key in existing_keys:
2762
2480
# change the record at other to be a pointer to this new
2763
2481
# record. The loop looks similar to the change to
2764
2482
# relocations when updating an existing record but it's not:
2765
2483
# the test for existing kinds is different: this can be
2766
2484
# factored out to a helper though.
2767
other_block_index, present = self._find_block_index_from_key(
2770
raise AssertionError('could not find block for %s' % (
2772
other_block = self._dirblocks[other_block_index][1]
2773
other_entry_index, present = self._find_entry_index(
2774
other_key, other_block)
2776
raise AssertionError(
2777
'update_minimal: could not find other entry for %s'
2485
other_block_index, present = self._find_block_index_from_key(other_key)
2487
raise AssertionError('could not find block for %s' % (other_key,))
2488
other_entry_index, present = self._find_entry_index(other_key,
2489
self._dirblocks[other_block_index][1])
2491
raise AssertionError('could not find entry for %s' % (other_key,))
2779
2492
if path_utf8 is None:
2780
2493
raise AssertionError('no path')
2781
# Turn this other location into a reference to the new
2782
# location. This also updates the aliased iterator
2783
# (current_old in set_state_from_inventory) so that the old
2784
# entry, if not already examined, is skipped over by that
2786
other_entry = other_block[other_entry_index]
2787
other_entry[1][0] = ('r', path_utf8, 0, False, '')
2788
self._maybe_remove_row(other_block, other_entry_index,
2494
self._dirblocks[other_block_index][1][other_entry_index][1][0] = \
2495
('r', path_utf8, 0, False, '')
2792
# adds a tuple to the new details for each column
2793
# - either by copying an existing relocation pointer inside that column
2794
# - or by creating a new pointer to the right row inside that column
2795
2497
num_present_parents = self._num_present_parents()
2796
if num_present_parents:
2797
other_key = list(existing_keys)[0]
2798
2498
for lookup_index in xrange(1, num_present_parents + 1):
2799
2499
# grab any one entry, use it to find the right path.
2800
# TODO: optimise this to reduce memory use in highly
2500
# TODO: optimise this to reduce memory use in highly
2801
2501
# fragmented situations by reusing the relocation
2803
2503
update_block_index, present = \
3167
2840
False, DirState.NULLSTAT)
3168
2841
state._dirblock_state = DirState.IN_MEMORY_MODIFIED
3169
2842
return link_or_sha1
2843
update_entry = py_update_entry
3172
2846
class ProcessEntryPython(object):
3174
__slots__ = ["old_dirname_to_file_id", "new_dirname_to_file_id",
2848
__slots__ = ["old_dirname_to_file_id", "new_dirname_to_file_id", "uninteresting",
3175
2849
"last_source_parent", "last_target_parent", "include_unchanged",
3176
"partial", "use_filesystem_for_exec", "utf8_decode",
3177
"searched_specific_files", "search_specific_files",
3178
"searched_exact_paths", "search_specific_file_parents", "seen_ids",
3179
"state", "source_index", "target_index", "want_unversioned", "tree"]
2850
"use_filesystem_for_exec", "utf8_decode", "searched_specific_files",
2851
"search_specific_files", "state", "source_index", "target_index",
2852
"want_unversioned", "tree"]
3181
2854
def __init__(self, include_unchanged, use_filesystem_for_exec,
3182
2855
search_specific_files, state, source_index, target_index,
3183
2856
want_unversioned, tree):
3184
2857
self.old_dirname_to_file_id = {}
3185
2858
self.new_dirname_to_file_id = {}
3186
# Are we doing a partial iter_changes?
3187
self.partial = search_specific_files != set([''])
2859
# Just a sentinel, so that _process_entry can say that this
2860
# record is handled, but isn't interesting to process (unchanged)
2861
self.uninteresting = object()
3188
2862
# Using a list so that we can access the values and change them in
3189
2863
# nested scope. Each one is [path, file_id, entry]
3190
2864
self.last_source_parent = [None, None]
3193
2867
self.use_filesystem_for_exec = use_filesystem_for_exec
3194
2868
self.utf8_decode = cache_utf8._utf8_decode
3195
2869
# for all search_indexs in each path at or under each element of
3196
# search_specific_files, if the detail is relocated: add the id, and
3197
# add the relocated path as one to search if it's not searched already.
3198
# If the detail is not relocated, add the id.
2870
# search_specific_files, if the detail is relocated: add the id, and add the
2871
# relocated path as one to search if it's not searched already. If the
2872
# detail is not relocated, add the id.
3199
2873
self.searched_specific_files = set()
3200
# When we search exact paths without expanding downwards, we record
3202
self.searched_exact_paths = set()
3203
2874
self.search_specific_files = search_specific_files
3204
# The parents up to the root of the paths we are searching.
3205
# After all normal paths are returned, these specific items are returned.
3206
self.search_specific_file_parents = set()
3207
# The ids we've sent out in the delta.
3208
self.seen_ids = set()
3209
2875
self.state = state
3210
2876
self.source_index = source_index
3211
2877
self.target_index = target_index
3212
if target_index != 0:
3213
# A lot of code in here depends on target_index == 0
3214
raise errors.BzrError('unsupported target index')
3215
2878
self.want_unversioned = want_unversioned
3216
2879
self.tree = tree
3219
2882
"""Compare an entry and real disk to generate delta information.
3221
2884
:param path_info: top_relpath, basename, kind, lstat, abspath for
3222
the path of entry. If None, then the path is considered absent in
3223
the target (Perhaps we should pass in a concrete entry for this ?)
2885
the path of entry. If None, then the path is considered absent.
2886
(Perhaps we should pass in a concrete entry for this ?)
3224
2887
Basename is returned as a utf8 string because we expect this
3225
2888
tuple will be ignored, and don't want to take the time to
3227
:return: (iter_changes_result, changed). If the entry has not been
3228
handled then changed is None. Otherwise it is False if no content
3229
or metadata changes have occurred, and True if any content or
3230
metadata change has occurred. If self.include_unchanged is True then
3231
if changed is not None, iter_changes_result will always be a result
3232
tuple. Otherwise, iter_changes_result is None unless changed is
2890
:return: None if these don't match
2891
A tuple of information about the change, or
2892
the object 'uninteresting' if these match, but are
2893
basically identical.
3235
2895
if self.source_index is None:
3236
2896
source_details = DirState.NULL_PARENT_DETAILS
3304
2964
if source_minikind != 'f':
3305
2965
content_change = True
3307
# Check the sha. We can't just rely on the size as
3308
# content filtering may mean different sizes actually
3309
# map to the same content
3310
if link_or_sha1 is None:
3312
statvalue, link_or_sha1 = \
3313
self.state._sha1_provider.stat_and_sha1(
3315
self.state._observed_sha1(entry, link_or_sha1,
3317
content_change = (link_or_sha1 != source_details[1])
2967
# If the size is the same, check the sha:
2968
if target_details[2] == source_details[2]:
2969
if link_or_sha1 is None:
2971
file_obj = file(path_info[4], 'rb')
2973
statvalue = os.fstat(file_obj.fileno())
2974
link_or_sha1 = osutils.sha_file(file_obj)
2977
self.state._observed_sha1(entry, link_or_sha1,
2979
content_change = (link_or_sha1 != source_details[1])
2981
# Size changed, so must be different
2982
content_change = True
3318
2983
# Target details is updated at update_entry time
3319
2984
if self.use_filesystem_for_exec:
3320
2985
# We don't need S_ISREG here, because we are sure
3481
3144
"source_minikind=%r, target_minikind=%r"
3482
3145
% (source_minikind, target_minikind))
3483
3146
## import pdb;pdb.set_trace()
3486
3149
def __iter__(self):
3489
def _gather_result_for_consistency(self, result):
3490
"""Check a result we will yield to make sure we are consistent later.
3492
This gathers result's parents into a set to output later.
3494
:param result: A result tuple.
3496
if not self.partial or not result[0]:
3498
self.seen_ids.add(result[0])
3499
new_path = result[1][1]
3501
# Not the root and not a delete: queue up the parents of the path.
3502
self.search_specific_file_parents.update(
3503
osutils.parent_directories(new_path.encode('utf8')))
3504
# Add the root directory which parent_directories does not
3506
self.search_specific_file_parents.add('')
3508
3152
def iter_changes(self):
3509
3153
"""Iterate over the changes."""
3510
3154
utf8_decode = cache_utf8._utf8_decode
3511
3155
_cmp_by_dirs = cmp_by_dirs
3512
3156
_process_entry = self._process_entry
3157
uninteresting = self.uninteresting
3513
3158
search_specific_files = self.search_specific_files
3514
3159
searched_specific_files = self.searched_specific_files
3515
3160
splitpath = osutils.splitpath
3517
3162
# compare source_index and target_index at or under each element of search_specific_files.
3518
3163
# follow the following comparison table. Note that we only want to do diff operations when
3519
# the target is fdl because that's when the walkdirs logic will have exposed the pathinfo
3164
# the target is fdl because that's when the walkdirs logic will have exposed the pathinfo
3520
3165
# for the target.
3523
3168
# Source | Target | disk | action
3524
3169
# r | fdlt | | add source to search, add id path move and perform
3525
3170
# | | | diff check on source-target
3526
# r | fdlt | a | dangling file that was present in the basis.
3171
# r | fdlt | a | dangling file that was present in the basis.
3528
3173
# r | a | | add source to search
3530
3175
# r | r | | this path is present in a non-examined tree, skip.
3531
3176
# r | r | a | this path is present in a non-examined tree, skip.
3532
3177
# a | fdlt | | add new id
3847
3482
current_dir_info = dir_iterator.next()
3848
3483
except StopIteration:
3849
3484
current_dir_info = None
3850
for result in self._iter_specific_file_parents():
3853
def _iter_specific_file_parents(self):
3854
"""Iter over the specific file parents."""
3855
while self.search_specific_file_parents:
3856
# Process the parent directories for the paths we were iterating.
3857
# Even in extremely large trees this should be modest, so currently
3858
# no attempt is made to optimise.
3859
path_utf8 = self.search_specific_file_parents.pop()
3860
if osutils.is_inside_any(self.searched_specific_files, path_utf8):
3861
# We've examined this path.
3863
if path_utf8 in self.searched_exact_paths:
3864
# We've examined this path.
3866
path_entries = self.state._entries_for_path(path_utf8)
3867
# We need either one or two entries. If the path in
3868
# self.target_index has moved (so the entry in source_index is in
3869
# 'ar') then we need to also look for the entry for this path in
3870
# self.source_index, to output the appropriate delete-or-rename.
3871
selected_entries = []
3873
for candidate_entry in path_entries:
3874
# Find entries present in target at this path:
3875
if candidate_entry[1][self.target_index][0] not in 'ar':
3877
selected_entries.append(candidate_entry)
3878
# Find entries present in source at this path:
3879
elif (self.source_index is not None and
3880
candidate_entry[1][self.source_index][0] not in 'ar'):
3882
if candidate_entry[1][self.target_index][0] == 'a':
3883
# Deleted, emit it here.
3884
selected_entries.append(candidate_entry)
3886
# renamed, emit it when we process the directory it
3888
self.search_specific_file_parents.add(
3889
candidate_entry[1][self.target_index][1])
3891
raise AssertionError(
3892
"Missing entry for specific path parent %r, %r" % (
3893
path_utf8, path_entries))
3894
path_info = self._path_info(path_utf8, path_utf8.decode('utf8'))
3895
for entry in selected_entries:
3896
if entry[0][2] in self.seen_ids:
3898
result, changed = self._process_entry(entry, path_info)
3900
raise AssertionError(
3901
"Got entry<->path mismatch for specific path "
3902
"%r entry %r path_info %r " % (
3903
path_utf8, entry, path_info))
3904
# Only include changes - we're outside the user's requested
3907
self._gather_result_for_consistency(result)
3908
if (result[6][0] == 'directory' and
3909
result[6][1] != 'directory'):
3910
# This stopped being a directory, the old children have
3912
if entry[1][self.source_index][0] == 'r':
3913
# renamed, take the source path
3914
entry_path_utf8 = entry[1][self.source_index][1]
3916
entry_path_utf8 = path_utf8
3917
initial_key = (entry_path_utf8, '', '')
3918
block_index, _ = self.state._find_block_index_from_key(
3920
if block_index == 0:
3921
# The children of the root are in block index 1.
3923
current_block = None
3924
if block_index < len(self.state._dirblocks):
3925
current_block = self.state._dirblocks[block_index]
3926
if not osutils.is_inside(
3927
entry_path_utf8, current_block[0]):
3928
# No entries for this directory at all.
3929
current_block = None
3930
if current_block is not None:
3931
for entry in current_block[1]:
3932
if entry[1][self.source_index][0] in 'ar':
3933
# Not in the source tree, so doesn't have to be
3936
# Path of the entry itself.
3938
self.search_specific_file_parents.add(
3939
osutils.pathjoin(*entry[0][:2]))
3940
if changed or self.include_unchanged:
3942
self.searched_exact_paths.add(path_utf8)
3944
def _path_info(self, utf8_path, unicode_path):
3945
"""Generate path_info for unicode_path.
3947
:return: None if unicode_path does not exist, or a path_info tuple.
3949
abspath = self.tree.abspath(unicode_path)
3951
stat = os.lstat(abspath)
3953
if e.errno == errno.ENOENT:
3954
# the path does not exist.
3958
utf8_basename = utf8_path.rsplit('/', 1)[-1]
3959
dir_info = (utf8_path, utf8_basename,
3960
osutils.file_kind_from_stat_mode(stat.st_mode), stat,
3962
if dir_info[2] == 'directory':
3963
if self.tree._directory_is_tree_reference(
3965
self.root_dir_info = self.root_dir_info[:2] + \
3966
('tree-reference',) + self.root_dir_info[3:]
3485
_process_entry = ProcessEntryPython
3970
3488
# Try to load the compiled form if possible
3972
from bzrlib._dirstate_helpers_pyx import (
3490
from bzrlib._dirstate_helpers_c import (
3491
_read_dirblocks_c as _read_dirblocks,
3492
bisect_dirblock_c as bisect_dirblock,
3493
_bisect_path_left_c as _bisect_path_left,
3494
_bisect_path_right_c as _bisect_path_right,
3495
cmp_by_dirs_c as cmp_by_dirs,
3978
3496
ProcessEntryC as _process_entry,
3979
3497
update_entry as update_entry,
3981
except ImportError, e:
3982
osutils.failed_to_load_extension(e)
3983
3500
from bzrlib._dirstate_helpers_py import (
3501
_read_dirblocks_py as _read_dirblocks,
3502
bisect_dirblock_py as bisect_dirblock,
3503
_bisect_path_left_py as _bisect_path_left,
3504
_bisect_path_right_py as _bisect_path_right,
3505
cmp_by_dirs_py as cmp_by_dirs,
3990
# FIXME: It would be nice to be able to track moved lines so that the
3991
# corresponding python code can be moved to the _dirstate_helpers_py
3992
# module. I don't want to break the history for this important piece of
3993
# code so I left the code here -- vila 20090622
3994
update_entry = py_update_entry
3995
_process_entry = ProcessEntryPython