1278
def update_by_delta(self, delta):
1279
"""Apply an inventory delta to the dirstate for tree 0
1281
This is the workhorse for apply_inventory_delta in dirstate based
1284
:param delta: An inventory delta. See Inventory.apply_delta for
1287
self._read_dirblocks_if_needed()
1288
encode = cache_utf8.encode
1291
# Accumulate parent references (path_utf8, id), to check for parentless
1292
# items or items placed under files/links/tree-references. We get
1293
# references from every item in the delta that is not a deletion and
1294
# is not itself the root.
1296
# Added ids must not be in the dirstate already. This set holds those
1299
# This loop transforms the delta to single atomic operations that can
1300
# be executed and validated.
1301
for old_path, new_path, file_id, inv_entry in sorted(
1302
inventory._check_delta_unique_old_paths(
1303
inventory._check_delta_unique_new_paths(
1304
inventory._check_delta_ids_match_entry(
1305
inventory._check_delta_ids_are_valid(
1306
inventory._check_delta_new_path_entry_both_or_None(delta))))),
1308
if (file_id in insertions) or (file_id in removals):
1309
raise errors.InconsistentDelta(old_path or new_path, file_id,
1311
if old_path is not None:
1312
old_path = old_path.encode('utf-8')
1313
removals[file_id] = old_path
1315
new_ids.add(file_id)
1316
if new_path is not None:
1317
if inv_entry is None:
1318
raise errors.InconsistentDelta(new_path, file_id,
1319
"new_path with no entry")
1320
new_path = new_path.encode('utf-8')
1321
dirname_utf8, basename = osutils.split(new_path)
1323
parents.add((dirname_utf8, inv_entry.parent_id))
1324
key = (dirname_utf8, basename, file_id)
1325
minikind = DirState._kind_to_minikind[inv_entry.kind]
1327
fingerprint = inv_entry.reference_revision
1330
insertions[file_id] = (key, minikind, inv_entry.executable,
1331
fingerprint, new_path)
1332
# Transform moves into delete+add pairs
1333
if None not in (old_path, new_path):
1334
for child in self._iter_child_entries(0, old_path):
1335
if child[0][2] in insertions or child[0][2] in removals:
1337
child_dirname = child[0][0]
1338
child_basename = child[0][1]
1339
minikind = child[1][0][0]
1340
fingerprint = child[1][0][4]
1341
executable = child[1][0][3]
1342
old_child_path = osutils.pathjoin(child[0][0],
1344
removals[child[0][2]] = old_child_path
1345
child_suffix = child_dirname[len(old_path):]
1346
new_child_dirname = (new_path + child_suffix)
1347
key = (new_child_dirname, child_basename, child[0][2])
1348
new_child_path = os.path.join(new_child_dirname,
1350
insertions[child[0][2]] = (key, minikind, executable,
1351
fingerprint, new_child_path)
1352
self._check_delta_ids_absent(new_ids, delta, 0)
1354
self._apply_removals(removals.iteritems())
1355
self._apply_insertions(insertions.values())
1357
self._after_delta_check_parents(parents, 0)
1358
except errors.BzrError, e:
1359
self._changes_aborted = True
1360
if 'integrity error' not in str(e):
1362
# _get_entry raises BzrError when a request is inconsistent; we
1363
# want such errors to be shown as InconsistentDelta - and that
1364
# fits the behaviour we trigger.
1365
raise errors.InconsistentDeltaDelta(delta, "error from _get_entry.")
1367
def _apply_removals(self, removals):
    """Mark every removed path as absent in tree 0.

    Paths are processed in reverse order of path, so children are handled
    before the directory that contains them.

    :param removals: An iterable of (file_id, path_utf8) pairs.
    :raises errors.InconsistentDelta: if the path is not present, holds a
        different file id, or is a directory whose block still contains
        entries that are neither absent nor relocated.
    """
    # NOTE(review): ``try:``/``except IndexError:``, ``if d_present:`` and
    # the two message tails were elided from the listing this block was
    # recovered from; confirm them against the pristine file.
    for file_id, path in sorted(removals, reverse=True,
                                key=operator.itemgetter(1)):
        dirname, basename = osutils.split(path)
        block_i, entry_i, d_present, f_present = \
            self._get_block_entry_index(dirname, basename, 0)
        try:
            entry = self._dirblocks[block_i][1][entry_i]
        except IndexError:
            self._changes_aborted = True
            raise errors.InconsistentDelta(path, file_id,
                "Wrong path for old path.")
        if not f_present or entry[1][0][0] in 'ar':
            self._changes_aborted = True
            raise errors.InconsistentDelta(path, file_id,
                "Wrong path for old path.")
        if file_id != entry[0][2]:
            self._changes_aborted = True
            raise errors.InconsistentDelta(path, file_id,
                "Attempt to remove path has wrong id - found %r."
                % entry[0][2])
        self._make_absent(entry)
        # See if we have a malformed delta: deleting a directory must not
        # leave crud behind. This increases the number of bisects needed
        # substantially, but deletion or renames of large numbers of paths
        # is rare enough it shouldn't be an issue (famous last words?) RBC
        # 20080730.
        block_i, entry_i, d_present, f_present = \
            self._get_block_entry_index(path, '', 0)
        if d_present:
            # The dir block is still present in the dirstate; this could
            # be due to it being in a parent tree, or a corrupt delta.
            for child_entry in self._dirblocks[block_i][1]:
                if child_entry[1][0][0] not in ('r', 'a'):
                    self._changes_aborted = True
                    raise errors.InconsistentDelta(path, entry[0][2],
                        "The file id was deleted but its children were "
                        "not deleted.")
1406
def _apply_insertions(self, adds):
    """Insert every add into the dirstate via update_minimal.

    :param adds: An iterable of
        (key, minikind, executable, fingerprint, path_utf8) tuples; they
        are applied in sorted order.
    :raises errors.InconsistentDelta: if update_minimal raises
        NotVersionedError for one of the adds.
    """
    # NOTE(review): ``try:`` and the tail of the error message were elided
    # from the listing this block was recovered from; confirm them against
    # the pristine file.
    try:
        for key, minikind, executable, fingerprint, path_utf8 in sorted(adds):
            self.update_minimal(key, minikind, executable, fingerprint,
                                path_utf8=path_utf8)
    except errors.NotVersionedError:
        # key and path_utf8 still refer to the add that failed.
        self._changes_aborted = True
        raise errors.InconsistentDelta(path_utf8.decode('utf8'), key[2],
            "Missing parent")
1416
def update_basis_by_delta(self, delta, new_revid):
1417
"""Update the parents of this tree after a commit.
1419
This gives the tree one parent, with revision id new_revid. The
1420
inventory delta is applied to the current basis tree to generate the
1421
inventory for the parent new_revid, and all other parent trees are
1424
Note that an exception during the operation of this method will leave
1425
the dirstate in a corrupt state where it should not be saved.
1427
Finally, we expect all changes to be synchronising the basis tree with
1430
:param new_revid: The new revision id for the tree's parent.
1431
:param delta: An inventory delta (see apply_inventory_delta) describing
1432
the changes from the current left most parent revision to new_revid.
1434
self._read_dirblocks_if_needed()
1435
self._discard_merge_parents()
1436
if self._ghosts != []:
1437
raise NotImplementedError(self.update_basis_by_delta)
1438
if len(self._parents) == 0:
1439
# setup a blank tree, the most simple way.
1440
empty_parent = DirState.NULL_PARENT_DETAILS
1441
for entry in self._iter_entries():
1442
entry[1].append(empty_parent)
1443
self._parents.append(new_revid)
1445
self._parents[0] = new_revid
1447
delta = sorted(delta, reverse=True)
1451
# The paths this function accepts are unicode and must be encoded as we
1453
encode = cache_utf8.encode
1454
inv_to_entry = self._inv_entry_to_details
1455
# delta is now (deletes, changes), (adds) in reverse lexicographical
1457
# deletes in reverse lexicographic order are safe to process in situ.
1458
# renames are not, as a rename from any path could go to a path
1459
# lexicographically lower, so we transform renames into delete, add pairs,
1460
# expanding them recursively as needed.
1461
# At the same time, to reduce interface friction we convert the input
1462
# inventory entries to dirstate.
1463
root_only = ('', '')
1464
# Accumulate parent references (path_utf8, id), to check for parentless
1465
# items or items placed under files/links/tree-references. We get
1466
# references from every item in the delta that is not a deletion and
1467
# is not itself the root.
1469
# Added ids must not be in the dirstate already. This set holds those
1472
for old_path, new_path, file_id, inv_entry in delta:
1473
if inv_entry is not None and file_id != inv_entry.file_id:
1474
raise errors.InconsistentDelta(new_path, file_id,
1475
"mismatched entry file_id %r" % inv_entry)
1476
if new_path is not None:
1477
if inv_entry is None:
1478
raise errors.InconsistentDelta(new_path, file_id,
1479
"new_path with no entry")
1480
new_path_utf8 = encode(new_path)
1481
# note the parent for validation
1482
dirname_utf8, basename_utf8 = osutils.split(new_path_utf8)
1484
parents.add((dirname_utf8, inv_entry.parent_id))
1485
if old_path is None:
1486
adds.append((None, encode(new_path), file_id,
1487
inv_to_entry(inv_entry), True))
1488
new_ids.add(file_id)
1489
elif new_path is None:
1490
deletes.append((encode(old_path), None, file_id, None, True))
1491
elif (old_path, new_path) != root_only:
1493
# Because renames must preserve their children we must have
1494
# processed all relocations and removes before hand. The sort
1495
# order ensures we've examined the child paths, but we also
1496
# have to execute the removals, or the split to an add/delete
1497
# pair will result in the deleted item being reinserted, or
1498
# renamed items being reinserted twice - and possibly at the
1499
# wrong place. Splitting into a delete/add pair also simplifies
1500
# the handling of entries with ('f', ...), ('r' ...) because
1501
# the target of the 'r' is old_path here, and we add that to
1502
# deletes, meaning that the add handler does not need to check
1503
# for 'r' items on every pass.
1504
self._update_basis_apply_deletes(deletes)
1506
# Split into an add/delete pair recursively.
1507
adds.append((None, new_path_utf8, file_id,
1508
inv_to_entry(inv_entry), False))
1509
# Expunge deletes that we've seen so that deleted/renamed
1510
# children of a rename directory are handled correctly.
1511
new_deletes = reversed(list(self._iter_child_entries(1,
1513
# Remove the current contents of the tree at orig_path, and
1514
# reinsert at the correct new path.
1515
for entry in new_deletes:
1517
source_path = entry[0][0] + '/' + entry[0][1]
1519
source_path = entry[0][1]
1521
target_path = new_path_utf8 + source_path[len(old_path):]
1524
raise AssertionError("cannot rename directory to"
1526
target_path = source_path[len(old_path) + 1:]
1527
adds.append((None, target_path, entry[0][2], entry[1][1], False))
1529
(source_path, target_path, entry[0][2], None, False))
1531
(encode(old_path), new_path, file_id, None, False))
1533
# changes to just the root should not require remove/insertion
1535
changes.append((encode(old_path), encode(new_path), file_id,
1536
inv_to_entry(inv_entry)))
1537
self._check_delta_ids_absent(new_ids, delta, 1)
1539
# Finish expunging deletes/first half of renames.
1540
self._update_basis_apply_deletes(deletes)
1541
# Reinstate second half of renames and new paths.
1542
self._update_basis_apply_adds(adds)
1543
# Apply in-situ changes.
1544
self._update_basis_apply_changes(changes)
1546
self._after_delta_check_parents(parents, 1)
1547
except errors.BzrError, e:
1548
self._changes_aborted = True
1549
if 'integrity error' not in str(e):
1551
# _get_entry raises BzrError when a request is inconsistent; we
1552
# want such errors to be shown as InconsistentDelta - and that
1553
# fits the behaviour we trigger. Part of this is driven by dirstate
1554
# only supporting deltas that turn the basis into a closer fit to
1556
raise errors.InconsistentDeltaDelta(delta, "error from _get_entry.")
1558
self._dirblock_state = DirState.IN_MEMORY_MODIFIED
1559
self._header_state = DirState.IN_MEMORY_MODIFIED
1560
self._id_index = None
1563
def _check_delta_ids_absent(self, new_ids, delta, tree_index):
    """Check that none of the file_ids in new_ids are present in a tree.

    :param new_ids: The file ids the delta claims to be adding.
    :param delta: The delta being applied; not used by this check.
    :param tree_index: Passed to _get_block_entry_index to select the tree
        in which the ids must be absent.
    :raises errors.InconsistentDelta: if one of the ids is found in that
        tree.
    """
    # NOTE(review): the early return, the two ``if``/``continue`` guards and
    # the tail of the error message were elided from the listing this block
    # was recovered from; confirm them against the pristine file.
    if not new_ids:
        return
    id_index = self._get_id_index()
    for file_id in new_ids:
        for key in id_index.get(file_id, []):
            block_i, entry_i, d_present, f_present = \
                self._get_block_entry_index(key[0], key[1], tree_index)
            if not f_present:
                # In a different tree
                continue
            entry = self._dirblocks[block_i][1][entry_i]
            if entry[0][2] != file_id:
                # Different file_id, so not what we want.
                continue
            # NB: No changes made before this helper is called, so no need
            # to set the _changes_aborted flag.
            raise errors.InconsistentDelta(
                ("%s/%s" % key[0:2]).decode('utf8'), file_id,
                "This file_id is new in the delta but already present in "
                "the target")
1586
def _update_basis_apply_adds(self, adds):
    """Apply a sequence of adds to tree 1 during update_basis_by_delta.

    They may be adds, or renames that have been split into add/delete
    pairs.

    :param adds: A sequence of adds. Each add is a tuple:
        (None, new_path_utf8, file_id, (entry_details), real_add). real_add
        is False when the add is the second half of a remove-and-reinsert
        pair created to handle renames and deletes.  The list is sorted in
        place.
    :raises errors.InconsistentDelta: if tree 0 has no entry for the id at
        the new path, or a real add finds tree 1 details that are neither
        absent nor relocated.
    """
    # NOTE(review): ``adds.sort()`` and ``absent = 'ar'`` were elided from
    # the listing this block was recovered from; confirm them against the
    # pristine file.
    # Adds are accumulated partly from renames, so can be in any input
    # order - sort it.
    adds.sort()
    # adds is now in lexicographic order, which places all parents before
    # their children, so we can process it linearly.
    absent = 'ar'
    for old_path, new_path, file_id, new_details, real_add in adds:
        # the entry for this file_id must be in tree 0.
        entry = self._get_entry(0, file_id, new_path)
        if entry[0] is None or entry[0][2] != file_id:
            self._changes_aborted = True
            raise errors.InconsistentDelta(new_path, file_id,
                'working tree does not contain new entry')
        if real_add and entry[1][1][0] not in absent:
            self._changes_aborted = True
            raise errors.InconsistentDelta(new_path, file_id,
                'The entry was considered to be a genuinely new record,'
                ' but there was already an old record for it.')
        # We don't need to update the target of an 'r' because the handling
        # of renames turns all 'r' situations into a delete at the original
        # location.
        entry[1][1] = new_details
1620
def _update_basis_apply_changes(self, changes):
    """Apply a sequence of changes to tree 1 during update_basis_by_delta.

    :param changes: A sequence of changes. Each change is a tuple:
        (path_utf8, path_utf8, file_id, (entry_details))
    :raises errors.InconsistentDelta: if tree 0 has no entry for the id at
        the new path, or the entry is absent or relocated in tree 0 or
        tree 1.
    """
    # NOTE(review): ``absent = 'ar'`` was elided from the listing this block
    # was recovered from; confirm it against the pristine file.
    absent = 'ar'
    for old_path, new_path, file_id, new_details in changes:
        # the entry for this file_id must be in tree 0.
        entry = self._get_entry(0, file_id, new_path)
        if entry[0] is None or entry[0][2] != file_id:
            self._changes_aborted = True
            raise errors.InconsistentDelta(new_path, file_id,
                'working tree does not contain new entry')
        if (entry[1][0][0] in absent or
            entry[1][1][0] in absent):
            self._changes_aborted = True
            raise errors.InconsistentDelta(new_path, file_id,
                'changed considered absent')
        entry[1][1] = new_details
1641
def _update_basis_apply_deletes(self, deletes):
    """Apply a sequence of deletes to tree 1 during update_basis_by_delta.

    They may be deletes, or renames that have been split into add/delete
    pairs.

    :param deletes: A sequence of deletes. Each delete is a tuple:
        (old_path_utf8, new_path_utf8, file_id, None, real_delete).
        real_delete is True when the desired outcome is an actual deletion
        rather than the rename handling logic temporarily deleting a path
        during the replacement of a parent.
    :raises AssertionError: if real_delete disagrees with new_path being
        None.
    :raises errors.InconsistentDelta: if tree 1 has no such entry, the
        entry has a different file id, or its tree 0 state contradicts the
        kind of delete requested.
    """
    # NOTE(review): ``if real_delete:`` and the two ``else:`` lines were
    # elided from the listing this block was recovered from; they are
    # restored from the numbering gaps and the error messages - confirm
    # against the pristine file.
    null = DirState.NULL_PARENT_DETAILS
    for old_path, new_path, file_id, _, real_delete in deletes:
        if real_delete != (new_path is None):
            self._changes_aborted = True
            raise AssertionError("bad delete delta")
        # the entry for this file_id must be in tree 1.
        dirname, basename = osutils.split(old_path)
        block_index, entry_index, dir_present, file_present = \
            self._get_block_entry_index(dirname, basename, 1)
        if not file_present:
            self._changes_aborted = True
            raise errors.InconsistentDelta(old_path, file_id,
                'basis tree does not contain removed entry')
        entry = self._dirblocks[block_index][1][entry_index]
        if entry[0][2] != file_id:
            self._changes_aborted = True
            raise errors.InconsistentDelta(old_path, file_id,
                'mismatched file_id in tree 1')
        if real_delete:
            if entry[1][0][0] != 'a':
                self._changes_aborted = True
                raise errors.InconsistentDelta(old_path, file_id,
                    'This was marked as a real delete, but the WT state'
                    ' claims that it still exists and is versioned.')
            del self._dirblocks[block_index][1][entry_index]
        else:
            if entry[1][0][0] == 'a':
                # For whatever reason, we were asked to rename an entry
                # that was originally marked as deleted. This could be
                # because we are renaming the parent directory, and the WT
                # current state has the file marked as deleted.
                self._changes_aborted = True
                raise errors.InconsistentDelta(old_path, file_id,
                    'The entry was considered a rename, but the source path'
                    ' is marked as absent.')
            elif entry[1][0][0] == 'r':
                # implement the rename
                del self._dirblocks[block_index][1][entry_index]
            else:
                # it is being resurrected here, so blank it out temporarily.
                self._dirblocks[block_index][1][entry_index][1][1] = null
1695
def _after_delta_check_parents(self, parents, index):
    """Check that parents required by the delta are all intact.

    :param parents: An iterable of (path_utf8, file_id) tuples which are
        required to be present in tree 'index' at path_utf8 with id file_id
        and be a directory.
    :param index: The column in the dirstate to check for parents in.
    :raises errors.InconsistentDelta: if a parent is not present or is not
        a directory; _changes_aborted is set before raising.
    """
    # NOTE(review): the last line of the :param parents: text and the
    # closing quotes were elided from the listing this block was recovered
    # from; the code lines below were all present.
    for dirname_utf8, file_id in parents:
        # Get the entry - this ensures that file_id, dirname_utf8 exists and
        # has the right file id.
        entry = self._get_entry(index, file_id, dirname_utf8)
        if entry[1] is None:
            self._changes_aborted = True
            raise errors.InconsistentDelta(dirname_utf8.decode('utf8'),
                file_id, "This parent is not present.")
        # Parents of things must be directories
        if entry[1][index][0] != 'd':
            self._changes_aborted = True
            raise errors.InconsistentDelta(dirname_utf8.decode('utf8'),
                file_id, "This parent is not a directory.")
1717
def _observed_sha1(self, entry, sha1, stat_value,
1718
_stat_to_minikind=_stat_to_minikind, _pack_stat=pack_stat):
1719
"""Note the sha1 of a file.
1721
:param entry: The entry the sha1 is for.
1722
:param sha1: The observed sha1.
1723
:param stat_value: The os.lstat for the file.
1091
def update_entry(self, entry, abspath, stat_value,
1092
_stat_to_minikind=_stat_to_minikind,
1093
_pack_stat=pack_stat):
1094
"""Update the entry based on what is actually on disk.
1096
:param entry: This is the dirblock entry for the file in question.
1097
:param abspath: The path on disk for this file.
1098
:param stat_value: (optional) if we already have done a stat on the
1100
:return: The sha1 hexdigest of the file (40 bytes) or link target of a
1726
1104
minikind = _stat_to_minikind[stat_value.st_mode & 0170000]
3069
2367
self._split_path_cache = {}
3071
2369
def _requires_lock(self):
3072
"""Check that a lock is currently held by someone on the dirstate."""
2370
"""Checks that a lock is currently held by someone on the dirstate"""
3073
2371
if not self._lock_token:
3074
2372
raise errors.ObjectNotLocked(self)
3077
def py_update_entry(state, entry, abspath, stat_value,
3078
_stat_to_minikind=DirState._stat_to_minikind,
3079
_pack_stat=pack_stat):
3080
"""Update the entry based on what is actually on disk.
3082
This function only calculates the sha if it needs to - if the entry is
3083
uncachable, or clearly different to the first parent's entry, no sha
3084
is calculated, and None is returned.
3086
:param state: The dirstate this entry is in.
3087
:param entry: This is the dirblock entry for the file in question.
3088
:param abspath: The path on disk for this file.
3089
:param stat_value: The stat value done on the path.
3090
:return: None, or The sha1 hexdigest of the file (40 bytes) or link
3091
target of a symlink.
2375
def bisect_dirblock(dirblocks, dirname, lo=0, hi=None, cache={}):
2376
"""Return the index where to insert dirname into the dirblocks.
2378
The return value idx is such that all directories blocks in dirblock[:idx]
2379
have names < dirname, and all blocks in dirblock[idx:] have names >=
2382
Optional args lo (default 0) and hi (default len(dirblocks)) bound the
2383
slice of a to be searched.
3094
minikind = _stat_to_minikind[stat_value.st_mode & 0170000]
2388
dirname_split = cache[dirname]
3095
2389
except KeyError:
3098
packed_stat = _pack_stat(stat_value)
3099
(saved_minikind, saved_link_or_sha1, saved_file_size,
3100
saved_executable, saved_packed_stat) = entry[1][0]
3102
if minikind == 'd' and saved_minikind == 't':
3104
if (minikind == saved_minikind
3105
and packed_stat == saved_packed_stat):
3106
# The stat hasn't changed since we saved, so we can re-use the
3111
# size should also be in packed_stat
3112
if saved_file_size == stat_value.st_size:
3113
return saved_link_or_sha1
3115
# If we have gotten this far, that means that we need to actually
3116
# process this entry.
3119
executable = state._is_executable(stat_value.st_mode,
3121
if state._cutoff_time is None:
3122
state._sha_cutoff_time()
3123
if (stat_value.st_mtime < state._cutoff_time
3124
and stat_value.st_ctime < state._cutoff_time
3125
and len(entry[1]) > 1
3126
and entry[1][1][0] != 'a'):
3127
# Could check for size changes for further optimised
3128
# avoidance of sha1's. However the most prominent case of
3129
# over-shaing is during initial add, which this catches.
3130
# Besides, if content filtering happens, size and sha
3131
# are calculated at the same time, so checking just the size
3132
# gains nothing w.r.t. performance.
3133
link_or_sha1 = state._sha1_file(abspath)
3134
entry[1][0] = ('f', link_or_sha1, stat_value.st_size,
3135
executable, packed_stat)
3137
entry[1][0] = ('f', '', stat_value.st_size,
3138
executable, DirState.NULLSTAT)
3139
elif minikind == 'd':
3141
entry[1][0] = ('d', '', 0, False, packed_stat)
3142
if saved_minikind != 'd':
3143
# This changed from something into a directory. Make sure we
3144
# have a directory block for it. This doesn't happen very
3145
# often, so this doesn't have to be super fast.
3146
block_index, entry_index, dir_present, file_present = \
3147
state._get_block_entry_index(entry[0][0], entry[0][1], 0)
3148
state._ensure_block(block_index, entry_index,
3149
osutils.pathjoin(entry[0][0], entry[0][1]))
3150
elif minikind == 'l':
3151
link_or_sha1 = state._read_link(abspath, saved_link_or_sha1)
3152
if state._cutoff_time is None:
3153
state._sha_cutoff_time()
3154
if (stat_value.st_mtime < state._cutoff_time
3155
and stat_value.st_ctime < state._cutoff_time):
3156
entry[1][0] = ('l', link_or_sha1, stat_value.st_size,
3159
entry[1][0] = ('l', '', stat_value.st_size,
3160
False, DirState.NULLSTAT)
3161
state._dirblock_state = DirState.IN_MEMORY_MODIFIED
3165
class ProcessEntryPython(object):
3167
__slots__ = ["old_dirname_to_file_id", "new_dirname_to_file_id",
3168
"last_source_parent", "last_target_parent", "include_unchanged",
3169
"use_filesystem_for_exec", "utf8_decode", "searched_specific_files",
3170
"search_specific_files", "state", "source_index", "target_index",
3171
"want_unversioned", "tree"]
3173
def __init__(self, include_unchanged, use_filesystem_for_exec,
             search_specific_files, state, source_index, target_index,
             want_unversioned, tree):
    """Store the comparison settings and reset the per-run caches.

    Every argument is stored on the attribute of the same name; the
    directory -> file id maps, the last-parent caches and the set of
    already searched paths start out empty.
    """
    # NOTE(review): ``self.state = state`` and ``self.tree = tree`` were
    # elided from the listing this block was recovered from.  Both names
    # are in __slots__ and are constructor parameters, and self.state is
    # read by _process_entry - confirm against the pristine file.
    self.old_dirname_to_file_id = {}
    self.new_dirname_to_file_id = {}
    # Using a list so that we can access the values and change them in
    # nested scope. Each one is [dirname, parent_file_id], which is how
    # _process_entry reads and writes slots 0 and 1.
    self.last_source_parent = [None, None]
    self.last_target_parent = [None, None]
    self.include_unchanged = include_unchanged
    self.use_filesystem_for_exec = use_filesystem_for_exec
    self.utf8_decode = cache_utf8._utf8_decode
    # for all search_indexes in each path at or under each element of
    # search_specific_files, if the detail is relocated: add the id, and add the
    # relocated path as one to search if it's not searched already. If the
    # detail is not relocated, add the id.
    self.searched_specific_files = set()
    self.search_specific_files = search_specific_files
    self.state = state
    self.source_index = source_index
    self.target_index = target_index
    self.want_unversioned = want_unversioned
    self.tree = tree
3197
def _process_entry(self, entry, path_info, pathjoin=osutils.pathjoin):
3198
"""Compare an entry and real disk to generate delta information.
3200
:param path_info: top_relpath, basename, kind, lstat, abspath for
3201
the path of entry. If None, then the path is considered absent.
3202
(Perhaps we should pass in a concrete entry for this ?)
3203
Basename is returned as a utf8 string because we expect this
3204
tuple will be ignored, and don't want to take the time to
3206
:return: (iter_changes_result, changed). If the entry has not been
3207
handled then changed is None. Otherwise it is False if no content
3208
or metadata changes have occurred, and True if any content or
3209
metadata change has occurred. If self.include_unchanged is True then
3210
if changed is not None, iter_changes_result will always be a result
3211
tuple. Otherwise, iter_changes_result is None unless changed is
3214
if self.source_index is None:
3215
source_details = DirState.NULL_PARENT_DETAILS
3217
source_details = entry[1][self.source_index]
3218
target_details = entry[1][self.target_index]
3219
target_minikind = target_details[0]
3220
if path_info is not None and target_minikind in 'fdlt':
3221
if not (self.target_index == 0):
3222
raise AssertionError()
3223
link_or_sha1 = update_entry(self.state, entry,
3224
abspath=path_info[4], stat_value=path_info[3])
3225
# The entry may have been modified by update_entry
3226
target_details = entry[1][self.target_index]
3227
target_minikind = target_details[0]
3230
file_id = entry[0][2]
3231
source_minikind = source_details[0]
3232
if source_minikind in 'fdltr' and target_minikind in 'fdlt':
3233
# claimed content in both: diff
3234
# r | fdlt | | add source to search, add id path move and perform
3235
# | | | diff check on source-target
3236
# r | fdlt | a | dangling file that was present in the basis.
3238
if source_minikind in 'r':
3239
# add the source to the search path to find any children it
3240
# has. TODO ? : only add if it is a container ?
3241
if not osutils.is_inside_any(self.searched_specific_files,
3243
self.search_specific_files.add(source_details[1])
3244
# generate the old path; this is needed for stating later
3246
old_path = source_details[1]
3247
old_dirname, old_basename = os.path.split(old_path)
3248
path = pathjoin(entry[0][0], entry[0][1])
3249
old_entry = self.state._get_entry(self.source_index,
3251
# update the source details variable to be the real
3253
if old_entry == (None, None):
3254
raise errors.CorruptDirstate(self.state._filename,
3255
"entry '%s/%s' is considered renamed from %r"
3256
" but source does not exist\n"
3257
"entry: %s" % (entry[0][0], entry[0][1], old_path, entry))
3258
source_details = old_entry[1][self.source_index]
3259
source_minikind = source_details[0]
3261
old_dirname = entry[0][0]
3262
old_basename = entry[0][1]
3263
old_path = path = None
3264
if path_info is None:
3265
# the file is missing on disk, show as removed.
3266
content_change = True
3270
# source and target are both versioned and disk file is present.
3271
target_kind = path_info[2]
3272
if target_kind == 'directory':
3274
old_path = path = pathjoin(old_dirname, old_basename)
3275
self.new_dirname_to_file_id[path] = file_id
3276
if source_minikind != 'd':
3277
content_change = True
3279
# directories have no fingerprint
3280
content_change = False
3282
elif target_kind == 'file':
3283
if source_minikind != 'f':
3284
content_change = True
3286
# Check the sha. We can't just rely on the size as
3287
# content filtering may mean different sizes actually
3288
# map to the same content
3289
if link_or_sha1 is None:
3291
statvalue, link_or_sha1 = \
3292
self.state._sha1_provider.stat_and_sha1(
3294
self.state._observed_sha1(entry, link_or_sha1,
3296
content_change = (link_or_sha1 != source_details[1])
3297
# Target details is updated at update_entry time
3298
if self.use_filesystem_for_exec:
3299
# We don't need S_ISREG here, because we are sure
3300
# we are dealing with a file.
3301
target_exec = bool(stat.S_IEXEC & path_info[3].st_mode)
3303
target_exec = target_details[3]
3304
elif target_kind == 'symlink':
3305
if source_minikind != 'l':
3306
content_change = True
3308
content_change = (link_or_sha1 != source_details[1])
3310
elif target_kind == 'tree-reference':
3311
if source_minikind != 't':
3312
content_change = True
3314
content_change = False
3317
raise Exception, "unknown kind %s" % path_info[2]
3318
if source_minikind == 'd':
3320
old_path = path = pathjoin(old_dirname, old_basename)
3321
self.old_dirname_to_file_id[old_path] = file_id
3322
# parent id is the entry for the path in the target tree
3323
if old_basename and old_dirname == self.last_source_parent[0]:
3324
source_parent_id = self.last_source_parent[1]
3327
source_parent_id = self.old_dirname_to_file_id[old_dirname]
3329
source_parent_entry = self.state._get_entry(self.source_index,
3330
path_utf8=old_dirname)
3331
source_parent_id = source_parent_entry[0][2]
3332
if source_parent_id == entry[0][2]:
3333
# This is the root, so the parent is None
3334
source_parent_id = None
3336
self.last_source_parent[0] = old_dirname
3337
self.last_source_parent[1] = source_parent_id
3338
new_dirname = entry[0][0]
3339
if entry[0][1] and new_dirname == self.last_target_parent[0]:
3340
target_parent_id = self.last_target_parent[1]
3343
target_parent_id = self.new_dirname_to_file_id[new_dirname]
3345
# TODO: We don't always need to do the lookup, because the
3346
# parent entry will be the same as the source entry.
3347
target_parent_entry = self.state._get_entry(self.target_index,
3348
path_utf8=new_dirname)
3349
if target_parent_entry == (None, None):
3350
raise AssertionError(
3351
"Could not find target parent in wt: %s\nparent of: %s"
3352
% (new_dirname, entry))
3353
target_parent_id = target_parent_entry[0][2]
3354
if target_parent_id == entry[0][2]:
3355
# This is the root, so the parent is None
3356
target_parent_id = None
3358
self.last_target_parent[0] = new_dirname
3359
self.last_target_parent[1] = target_parent_id
3361
source_exec = source_details[3]
3362
changed = (content_change
3363
or source_parent_id != target_parent_id
3364
or old_basename != entry[0][1]
3365
or source_exec != target_exec
3367
if not changed and not self.include_unchanged:
3370
if old_path is None:
3371
old_path = path = pathjoin(old_dirname, old_basename)
3372
old_path_u = self.utf8_decode(old_path)[0]
3375
old_path_u = self.utf8_decode(old_path)[0]
3376
if old_path == path:
3379
path_u = self.utf8_decode(path)[0]
3380
source_kind = DirState._minikind_to_kind[source_minikind]
3381
return (entry[0][2],
3382
(old_path_u, path_u),
3385
(source_parent_id, target_parent_id),
3386
(self.utf8_decode(old_basename)[0], self.utf8_decode(entry[0][1])[0]),
3387
(source_kind, target_kind),
3388
(source_exec, target_exec)), changed
3389
elif source_minikind in 'a' and target_minikind in 'fdlt':
3390
# looks like a new file
3391
path = pathjoin(entry[0][0], entry[0][1])
3392
# parent id is the entry for the path in the target tree
3393
# TODO: these are the same for an entire directory: cache em.
3394
parent_id = self.state._get_entry(self.target_index,
3395
path_utf8=entry[0][0])[0][2]
3396
if parent_id == entry[0][2]:
3398
if path_info is not None:
3400
if self.use_filesystem_for_exec:
3401
# We need S_ISREG here, because we aren't sure if this
3404
stat.S_ISREG(path_info[3].st_mode)
3405
and stat.S_IEXEC & path_info[3].st_mode)
3407
target_exec = target_details[3]
3408
return (entry[0][2],
3409
(None, self.utf8_decode(path)[0]),
3413
(None, self.utf8_decode(entry[0][1])[0]),
3414
(None, path_info[2]),
3415
(None, target_exec)), True
3417
# Its a missing file, report it as such.
3418
return (entry[0][2],
3419
(None, self.utf8_decode(path)[0]),
3423
(None, self.utf8_decode(entry[0][1])[0]),
3425
(None, False)), True
3426
elif source_minikind in 'fdlt' and target_minikind in 'a':
3427
# unversioned, possibly, or possibly not deleted: we don't care.
3428
# if it's still on disk, *and* there's no other entry at this
3429
# path [we dont know this in this routine at the moment -
3430
# perhaps we should change this - then it would be an unknown.
3431
old_path = pathjoin(entry[0][0], entry[0][1])
3432
# parent id is the entry for the path in the target tree
3433
parent_id = self.state._get_entry(self.source_index, path_utf8=entry[0][0])[0][2]
3434
if parent_id == entry[0][2]:
3436
return (entry[0][2],
3437
(self.utf8_decode(old_path)[0], None),
3441
(self.utf8_decode(entry[0][1])[0], None),
3442
(DirState._minikind_to_kind[source_minikind], None),
3443
(source_details[3], None)), True
3444
elif source_minikind in 'fdlt' and target_minikind in 'r':
3445
# a rename; could be a true rename, or a rename inherited from
3446
# a renamed parent. TODO: handle this efficiently. Its not
3447
# common case to rename dirs though, so a correct but slow
3448
# implementation will do.
3449
if not osutils.is_inside_any(self.searched_specific_files, target_details[1]):
3450
self.search_specific_files.add(target_details[1])
3451
elif source_minikind in 'ra' and target_minikind in 'ra':
3452
# neither of the selected trees contain this file,
3453
# so skip over it. This is not currently directly tested, but
3454
# is indirectly via test_too_much.TestCommands.test_conflicts.
3457
raise AssertionError("don't know how to compare "
3458
"source_minikind=%r, target_minikind=%r"
3459
% (source_minikind, target_minikind))
3460
## import pdb;pdb.set_trace()
3466
def iter_changes(self):
3467
"""Iterate over the changes between the source and target trees.

Each path popped from self.search_specific_files is treated as a root
and recorded in self.searched_specific_files.  The dirstate entries for
that root are handed to self._process_entry together with lstat-derived
information about the path on disk.  The directory listing produced by
osutils._walkdirs_utf8 is then walked in step with the matching
dirblocks in self.state._dirblocks, calling _process_entry for each
versioned entry.

An entry's result is only of interest when _process_entry reports it as
changed or when self.include_unchanged is set.  Paths found on disk
without a matching dirstate entry are only described when
self.want_unversioned is set.

NOTE(review): the statements that hand each result back to the caller
are not visible in this copy of the code; presumably this is a
generator that yields them -- confirm.

:raises errors.BadFilenameEncoding: if the path of an unversioned file
    found on disk cannot be decoded as UTF-8.
:raises AssertionError: if a listing whose directory path is '' does
    not contain a '.bzr' entry.
"""
3468
# Bind the helpers and attributes used inside the loops to local names.
utf8_decode = cache_utf8._utf8_decode
3469
_cmp_by_dirs = cmp_by_dirs
3470
_process_entry = self._process_entry
3471
search_specific_files = self.search_specific_files
3472
searched_specific_files = self.searched_specific_files
3473
splitpath = osutils.splitpath
3475
# compare source_index and target_index at or under each element of search_specific_files.
3476
# follow the following comparison table. Note that we only want to do diff operations when
3477
# the target is fdl because that's when the walkdirs logic will have exposed the pathinfo
3481
# Source | Target | disk | action
3482
# r | fdlt | | add source to search, add id path move and perform
3483
# | | | diff check on source-target
3484
# r | fdlt | a | dangling file that was present in the basis.
3486
# r | a | | add source to search
3488
# r | r | | this path is present in a non-examined tree, skip.
3489
# r | r | a | this path is present in a non-examined tree, skip.
3490
# a | fdlt | | add new id
3491
# a | fdlt | a | dangling locally added file, skip
3492
# a | a | | not present in either tree, skip
3493
# a | a | a | not present in any tree, skip
3494
# a | r | | not present in either tree at this path, skip as it
3495
# | | | may not be selected by the users list of paths.
3496
# a | r | a | not present in either tree at this path, skip as it
3497
# | | | may not be selected by the users list of paths.
3498
# fdlt | fdlt | | content in both: diff them
3499
# fdlt | fdlt | a | deleted locally, but not unversioned - show as deleted ?
3500
# fdlt | a | | unversioned: output deleted id for now
3501
# fdlt | a | a | unversioned and deleted: output deleted id
3502
# fdlt | r | | relocated in this tree, so add target to search.
3503
# | | | Don't diff, we will see an r,fd; pair when we reach
3504
# | | | this id at the other path.
3505
# fdlt | r | a | relocated in this tree, so add target to search.
3506
# | | | Don't diff, we will see an r,fd; pair when we reach
3507
# | | | this id at the other path.
3509
# TODO: jam 20070516 - Avoid the _get_entry lookup overhead by
3510
# keeping a cache of directories that we have seen.
3512
# Keep going until no roots are pending.
while search_specific_files:
3513
# TODO: the pending list should be lexically sorted? the
3514
# interface doesn't require it.
3515
current_root = search_specific_files.pop()
3516
current_root_unicode = current_root.decode('utf8')
3517
searched_specific_files.add(current_root)
3518
# process the entries for this containing directory: the rest will be
3519
# found by their parents recursively.
3520
root_entries = self.state._entries_for_path(current_root)
3521
root_abspath = self.tree.abspath(current_root_unicode)
3523
# lstat describes the path itself and does not follow a symlink.
root_stat = os.lstat(root_abspath)
3525
if e.errno == errno.ENOENT:
3526
# the path does not exist: let _process_entry know that.
3527
root_dir_info = None
3529
# some other random error: hand it up.
3532
# Path-info tuple for the root: index 1 is the path, index 2 the kind
# derived from the stat mode and index 3 the stat result itself.
root_dir_info = ('', current_root,
3533
osutils.file_kind_from_stat_mode(root_stat.st_mode), root_stat,
3535
if root_dir_info[2] == 'directory':
3536
# A directory that the tree identifies as a tree reference has its
# kind rewritten to 'tree-reference'.
# NOTE(review): current_root_unicode already holds this decoded value.
if self.tree._directory_is_tree_reference(
3537
current_root.decode('utf8')):
3538
root_dir_info = root_dir_info[:2] + \
3539
('tree-reference',) + root_dir_info[3:]
3541
if not root_entries and not root_dir_info:
3542
# this specified path is not present at all, skip it.
3544
path_handled = False
3545
# Run every dirstate entry recorded for the root path through
# _process_entry, pairing it with the on-disk information (or None).
for entry in root_entries:
3546
result, changed = _process_entry(entry, root_dir_info)
3547
if changed is not None:
3549
if changed or self.include_unchanged:
3551
# The root exists on disk but no entry handled it: describe it as an
# unversioned path when the caller asked for those.
if self.want_unversioned and not path_handled and root_dir_info:
3552
# Executable means a regular file with the S_IEXEC bit set.
new_executable = bool(
3553
stat.S_ISREG(root_dir_info[3].st_mode)
3554
and stat.S_IEXEC & root_dir_info[3].st_mode)
3556
(None, current_root_unicode),
3560
(None, splitpath(current_root_unicode)[-1]),
3561
(None, root_dir_info[2]),
3562
(None, new_executable)
3564
# Find the dirblock at which the contents of current_root start.
initial_key = (current_root, '', '')
3565
block_index, _ = self.state._find_block_index_from_key(initial_key)
3566
if block_index == 0:
3567
# we have processed the total root already, but because the
3568
# initial key matched it we should skip it here.
3570
# A tree reference is not listed on disk: leave the disk side empty.
if root_dir_info and root_dir_info[2] == 'tree-reference':
3571
current_dir_info = None
3573
dir_iterator = osutils._walkdirs_utf8(root_abspath, prefix=current_root)
3575
current_dir_info = dir_iterator.next()
3577
# on win32, python2.4 has e.errno == ERROR_DIRECTORY, but
3578
# python 2.5 has e.errno == EINVAL,
3579
# and e.winerror == ERROR_DIRECTORY
3580
e_winerror = getattr(e, 'winerror', None)
3581
win_errors = (ERROR_DIRECTORY, ERROR_PATH_NOT_FOUND)
3582
# there may be directories in the inventory even though
3583
# this path is not a file on disk: so mark it as end of
3585
if e.errno in (errno.ENOENT, errno.ENOTDIR, errno.EINVAL):
3586
current_dir_info = None
3587
elif (sys.platform == 'win32'
3588
and (e.errno in win_errors
3589
or e_winerror in win_errors)):
3590
current_dir_info = None
3594
# A listing whose directory path is '' must contain '.bzr'; it is
# dropped from the listing here and its absence is an internal error.
if current_dir_info[0][0] == '':
3595
# remove .bzr from iteration
3596
bzr_index = bisect.bisect_left(current_dir_info[1], ('.bzr',))
3597
if current_dir_info[1][bzr_index][0] != '.bzr':
3598
raise AssertionError()
3599
del current_dir_info[1][bzr_index]
3600
# walk until both the directory listing and the versioned metadata
3602
# Only use the dirblock at block_index if it lies inside current_root.
if (block_index < len(self.state._dirblocks) and
3603
osutils.is_inside(current_root, self.state._dirblocks[block_index][0])):
3604
current_block = self.state._dirblocks[block_index]
3606
current_block = None
3607
# Loop while either the disk listing or the dirblocks have data left.
while (current_dir_info is not None or
3608
current_block is not None):
3609
# The disk listing and the dirblock refer to different directories:
# work out which side is behind and deal with that side alone.
if (current_dir_info and current_block
3610
and current_dir_info[0][0] != current_block[0]):
3611
if _cmp_by_dirs(current_dir_info[0][0], current_block[0]) < 0:
3612
# filesystem data refers to paths not covered by the dirblock.
3613
# this has two possibilities:
3614
# A) it is versioned but empty, so there is no block for it
3615
# B) it is not versioned.
3617
# if (A) then we need to recurse into it to check for
3618
# new unknown files or directories.
3619
# if (B) then we should ignore it, because we don't
3620
# recurse into unknown directories.
3622
while path_index < len(current_dir_info[1]):
3623
current_path_info = current_dir_info[1][path_index]
3624
if self.want_unversioned:
3625
if current_path_info[2] == 'directory':
3626
if self.tree._directory_is_tree_reference(
3627
current_path_info[0].decode('utf8')):
3628
current_path_info = current_path_info[:2] + \
3629
('tree-reference',) + current_path_info[3:]
3630
new_executable = bool(
3631
stat.S_ISREG(current_path_info[3].st_mode)
3632
and stat.S_IEXEC & current_path_info[3].st_mode)
3634
(None, utf8_decode(current_path_info[0])[0]),
3638
(None, utf8_decode(current_path_info[1])[0]),
3639
(None, current_path_info[2]),
3640
(None, new_executable))
3641
# don't descend into this unversioned path if it is
3643
if current_path_info[2] in ('directory',
3645
# Deleting the item from the listing stops the walk descending into it.
del current_dir_info[1][path_index]
3649
# This dir info has been handled, go to the next
3651
current_dir_info = dir_iterator.next()
3652
except StopIteration:
3653
current_dir_info = None
3655
# We have a dirblock entry for this location, but there
3656
# is no filesystem path for this. This is most likely
3657
# because a directory was removed from the disk.
3658
# We don't have to report the missing directory,
3659
# because that should have already been handled, but we
3660
# need to handle all of the files that are contained
3662
for current_entry in current_block[1]:
3663
# entry referring to file not present on disk.
3664
# advance the entry only, after processing.
3665
result, changed = _process_entry(current_entry, None)
3666
if changed is not None:
3667
if changed or self.include_unchanged:
3670
if (block_index < len(self.state._dirblocks) and
3671
osutils.is_inside(current_root,
3672
self.state._dirblocks[block_index][0])):
3673
current_block = self.state._dirblocks[block_index]
3675
current_block = None
3678
# Both sides refer to the same directory: pick the first dirstate
# entry and the first path on disk, using None for an exhausted side.
if current_block and entry_index < len(current_block[1]):
3679
current_entry = current_block[1][entry_index]
3681
current_entry = None
3682
advance_entry = True
3684
if current_dir_info and path_index < len(current_dir_info[1]):
3685
current_path_info = current_dir_info[1][path_index]
3686
if current_path_info[2] == 'directory':
3687
if self.tree._directory_is_tree_reference(
3688
current_path_info[0].decode('utf8')):
3689
current_path_info = current_path_info[:2] + \
3690
('tree-reference',) + current_path_info[3:]
3692
current_path_info = None
3694
path_handled = False
3695
# Step through the entries and the paths of this directory together;
# advance_entry and advance_path decide which side moves on each pass.
while (current_entry is not None or
3696
current_path_info is not None):
3697
if current_entry is None:
3698
# the check for path_handled when the path is advanced
3699
# will yield this path if needed.
3701
elif current_path_info is None:
3702
# no path is fine: the per entry code will handle it.
3703
result, changed = _process_entry(current_entry, current_path_info)
3704
if changed is not None:
3705
if changed or self.include_unchanged:
3707
elif (current_entry[0][1] != current_path_info[1]
3708
or current_entry[1][self.target_index][0] in 'ar'):
3709
# The current path on disk doesn't match the dirblock
3710
# record. Either the dirblock is marked as absent, or
3711
# the file on disk is not present at all in the
3712
# dirblock. Either way, report about the dirblock
3713
# entry, and let other code handle the filesystem one.
3715
# Compare the basename for these files to determine
3717
if current_path_info[1] < current_entry[0][1]:
3718
# extra file on disk: pass for now, but only
3719
# increment the path, not the entry
3720
advance_entry = False
3722
# entry referring to file not present on disk.
3723
# advance the entry only, after processing.
3724
result, changed = _process_entry(current_entry, None)
3725
if changed is not None:
3726
if changed or self.include_unchanged:
3728
advance_path = False
3730
result, changed = _process_entry(current_entry, current_path_info)
3731
if changed is not None:
3733
if changed or self.include_unchanged:
3735
if advance_entry and current_entry is not None:
3737
if entry_index < len(current_block[1]):
3738
current_entry = current_block[1][entry_index]
3740
current_entry = None
3742
advance_entry = True # reset the advance flag
3743
if advance_path and current_path_info is not None:
3744
if not path_handled:
3745
# unversioned in all regards
3746
if self.want_unversioned:
3747
new_executable = bool(
3748
stat.S_ISREG(current_path_info[3].st_mode)
3749
and stat.S_IEXEC & current_path_info[3].st_mode)
3751
# A path that is not valid UTF-8 is reported as a bad filename
# encoding instead of leaking the raw UnicodeDecodeError.
relpath_unicode = utf8_decode(current_path_info[0])[0]
3752
except UnicodeDecodeError:
3753
raise errors.BadFilenameEncoding(
3754
current_path_info[0], osutils._fs_enc)
3756
(None, relpath_unicode),
3760
(None, utf8_decode(current_path_info[1])[0]),
3761
(None, current_path_info[2]),
3762
(None, new_executable))
3763
# don't descend into this unversioned path if it is
3765
# NOTE(review): ('directory') is a plain string, not a one-element
# tuple, so `in` performs a substring test here -- confirm intent.
if current_path_info[2] in ('directory'):
3766
del current_dir_info[1][path_index]
3768
# don't descend the disk iterator into any tree
3770
if current_path_info[2] == 'tree-reference':
3771
del current_dir_info[1][path_index]
3774
# Fetch the next path of this directory, again rewriting the kind of
# a directory that is a tree reference.
if path_index < len(current_dir_info[1]):
3775
current_path_info = current_dir_info[1][path_index]
3776
if current_path_info[2] == 'directory':
3777
if self.tree._directory_is_tree_reference(
3778
current_path_info[0].decode('utf8')):
3779
current_path_info = current_path_info[:2] + \
3780
('tree-reference',) + current_path_info[3:]
3782
current_path_info = None
3783
path_handled = False
3785
advance_path = True # reset the advance flag.
3786
# This directory is finished on both sides: move each side that still
# has data on to its next dirblock / directory listing.
if current_block is not None:
3788
if (block_index < len(self.state._dirblocks) and
3789
osutils.is_inside(current_root, self.state._dirblocks[block_index][0])):
3790
current_block = self.state._dirblocks[block_index]
3792
current_block = None
3793
if current_dir_info is not None:
3795
current_dir_info = dir_iterator.next()
3796
except StopIteration:
3797
current_dir_info = None
3800
# Try to load the compiled form if possible
# The compiled module supplies ProcessEntryC (bound as _process_entry) and
# update_entry.
3802
from bzrlib._dirstate_helpers_pyx import (
3808
ProcessEntryC as _process_entry,
3809
update_entry as update_entry,
3812
# NOTE(review): presumably the pure-Python module below is only imported when
# the compiled import above fails; the guarding try/except is not visible
# here -- confirm.
from bzrlib._dirstate_helpers_py import (
3819
# FIXME: It would be nice to be able to track moved lines so that the
3820
# corresponding python code can be moved to the _dirstate_helpers_py
3821
# module. I don't want to break the history for this important piece of
3822
# code so I left the code here -- vila 20090622
3823
# Bind the module-level names to the implementations defined in this file.
update_entry = py_update_entry
3824
_process_entry = ProcessEntryPython
2390
dirname_split = dirname.split('/')
2391
cache[dirname] = dirname_split
2394
# Grab the dirname for the current dirblock
2395
cur = dirblocks[mid][0]
2397
cur_split = cache[cur]
2399
cur_split = cur.split('/')
2400
cache[cur] = cur_split
2401
if cur_split < dirname_split: lo = mid+1