711
713
return compatible
714
class Inventory(object):
716
class CommonInventory(object):
717
"""Basic inventory logic, defined in terms of primitives like has_id."""
719
def __contains__(self, file_id):
720
"""True if this entry contains a file with given id.
722
>>> inv = Inventory()
723
>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))
724
InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None, revision=None)
730
Note that this method along with __iter__ are not encouraged for use as
731
they are less clear than specific query methods - they may be removed
734
return self.has_id(file_id)
736
def id2path(self, file_id):
737
"""Return as a string the path to file_id.
740
>>> e = i.add(InventoryDirectory('src-id', 'src', ROOT_ID))
741
>>> e = i.add(InventoryFile('foo-id', 'foo.c', parent_id='src-id'))
742
>>> print i.id2path('foo-id')
745
# get all names, skipping root
746
return '/'.join(reversed(
747
[parent.name for parent in
748
self._iter_file_id_parents(file_id)][:-1]))
750
def iter_entries(self, from_dir=None):
751
"""Return (path, entry) pairs, in order by name."""
753
if self.root is None:
757
elif isinstance(from_dir, basestring):
758
from_dir = self[from_dir]
760
# unrolling the recursive call changed the time from
761
# 440ms/663ms (inline/total) to 116ms/116ms
762
children = from_dir.children.items()
764
children = collections.deque(children)
765
stack = [(u'', children)]
767
from_dir_relpath, children = stack[-1]
770
name, ie = children.popleft()
772
# we know that from_dir_relpath never ends in a slash
773
# and 'f' doesn't begin with one, we can do a string op, rather
774
# than the checks of pathjoin(), though this means that all paths
776
path = from_dir_relpath + '/' + name
780
if ie.kind != 'directory':
783
# But do this child first
784
new_children = ie.children.items()
786
new_children = collections.deque(new_children)
787
stack.append((path, new_children))
788
# Break out of inner loop, so that we start outer loop with child
791
# if we finished all children, pop it off the stack
794
def iter_entries_by_dir(self, from_dir=None, specific_file_ids=None,
795
yield_parents=False):
796
"""Iterate over the entries in a directory first order.
798
This returns all entries for a directory before returning
799
the entries for children of a directory. This is not
800
lexicographically sorted order, and is a hybrid between
801
depth-first and breadth-first.
803
:param yield_parents: If True, yield the parents from the root leading
804
down to specific_file_ids that have been requested. This has no
805
impact if specific_file_ids is None.
806
:return: This yields (path, entry) pairs
808
if specific_file_ids and not isinstance(specific_file_ids, set):
809
specific_file_ids = set(specific_file_ids)
810
# TODO? Perhaps this should return the from_dir so that the root is
811
# yielded? or maybe an option?
813
if self.root is None:
815
# Optimize a common case
816
if (not yield_parents and specific_file_ids is not None and
817
len(specific_file_ids) == 1):
818
file_id = list(specific_file_ids)[0]
820
yield self.id2path(file_id), self[file_id]
823
if (specific_file_ids is None or yield_parents or
824
self.root.file_id in specific_file_ids):
826
elif isinstance(from_dir, basestring):
827
from_dir = self[from_dir]
829
if specific_file_ids is not None:
830
# TODO: jam 20070302 This could really be done as a loop rather
831
# than a bunch of recursive calls.
834
def add_ancestors(file_id):
835
if file_id not in byid:
837
parent_id = byid[file_id].parent_id
838
if parent_id is None:
840
if parent_id not in parents:
841
parents.add(parent_id)
842
add_ancestors(parent_id)
843
for file_id in specific_file_ids:
844
add_ancestors(file_id)
848
stack = [(u'', from_dir)]
850
cur_relpath, cur_dir = stack.pop()
853
for child_name, child_ie in sorted(cur_dir.children.iteritems()):
855
child_relpath = cur_relpath + child_name
857
if (specific_file_ids is None or
858
child_ie.file_id in specific_file_ids or
859
(yield_parents and child_ie.file_id in parents)):
860
yield child_relpath, child_ie
862
if child_ie.kind == 'directory':
863
if parents is None or child_ie.file_id in parents:
864
child_dirs.append((child_relpath+'/', child_ie))
865
stack.extend(reversed(child_dirs))
867
def _make_delta(self, old):
868
"""Make an inventory delta from two inventories."""
871
adds = new_ids - old_ids
872
deletes = old_ids - new_ids
873
common = old_ids.intersection(new_ids)
875
for file_id in deletes:
876
delta.append((old.id2path(file_id), None, file_id, None))
878
delta.append((None, self.id2path(file_id), file_id, self[file_id]))
879
for file_id in common:
880
if old[file_id] != self[file_id]:
881
delta.append((old.id2path(file_id), self.id2path(file_id),
882
file_id, self[file_id]))
885
def _get_mutable_inventory(self):
    """Return a mutable copy of the object.

    Some inventories are immutable, yet working trees, for example, need
    to mutate existing inventories instead of creating a new one.

    This base implementation is only a placeholder; the concrete
    inventory classes in this file provide their own versions.

    :raises NotImplementedError: always.
    """
    # The bound method is passed as the exception argument so the message
    # identifies which class failed to provide an implementation.
    raise NotImplementedError(self._get_mutable_inventory)
893
def make_entry(self, kind, name, parent_id, file_id=None):
    """Simple thunk to bzrlib.inventory.make_entry.

    All arguments are forwarded unchanged, in the same order; ``self`` is
    not used.

    :param kind: Forwarded as the first argument.
    :param name: Forwarded as the second argument.
    :param parent_id: Forwarded as the third argument.
    :param file_id: Forwarded as the fourth argument; defaults to None.
    :return: Whatever bzrlib.inventory.make_entry returns.
    """
    return make_entry(kind, name, parent_id, file_id)
898
"""Return list of (path, ie) for all entries except the root.
900
This may be faster than iter_entries.
903
def descend(dir_ie, dir_path):
904
kids = dir_ie.children.items()
906
for name, ie in kids:
907
child_path = osutils.pathjoin(dir_path, name)
908
accum.append((child_path, ie))
909
if ie.kind == 'directory':
910
descend(ie, child_path)
912
descend(self.root, u'')
915
def directories(self):
916
"""Return (path, entry) pairs for all directories, including the root.
919
def descend(parent_ie, parent_path):
920
accum.append((parent_path, parent_ie))
922
kids = [(ie.name, ie) for ie in parent_ie.children.itervalues() if ie.kind == 'directory']
925
for name, child_ie in kids:
926
child_path = osutils.pathjoin(parent_path, name)
927
descend(child_ie, child_path)
928
descend(self.root, u'')
931
def path2id(self, name):
932
"""Walk down through directories to return entry of last component.
934
names may be either a list of path components, or a single
935
string, in which case it is automatically split.
937
This returns the entry of the last component in the path,
938
which may be either a file or a directory.
940
Returns None IFF the path is not found.
942
if isinstance(name, basestring):
943
name = osutils.splitpath(name)
945
# mutter("lookup path %r" % name)
949
except errors.NoSuchId:
950
# root doesn't exist yet so nothing else can
956
children = getattr(parent, 'children', None)
965
return parent.file_id
967
def filter(self, specific_fileids):
968
"""Get an inventory view filtered against a set of file-ids.
970
Children of directories and parents are included.
972
The result may or may not reference the underlying inventory
973
so it should be treated as immutable.
975
interesting_parents = set()
976
for fileid in specific_fileids:
978
interesting_parents.update(self.get_idpath(fileid))
979
except errors.NoSuchId:
980
# This fileid is not in the inventory - that's ok
982
entries = self.iter_entries()
983
if self.root is None:
984
return Inventory(root_id=None)
985
other = Inventory(entries.next()[1].file_id)
986
other.root.revision = self.root.revision
987
other.revision_id = self.revision_id
988
directories_to_expand = set()
989
for path, entry in entries:
990
file_id = entry.file_id
991
if (file_id in specific_fileids
992
or entry.parent_id in directories_to_expand):
993
if entry.kind == 'directory':
994
directories_to_expand.add(file_id)
995
elif file_id not in interesting_parents:
997
other.add(entry.copy())
1000
def get_idpath(self, file_id):
1001
"""Return a list of file_ids for the path to an entry.
1003
The list contains one element for each directory followed by
1004
the id of the file itself. So the length of the returned list
1005
is equal to the depth of the file in the tree, counting the
1006
root directory as depth 1.
1009
for parent in self._iter_file_id_parents(file_id):
1010
p.insert(0, parent.file_id)
1014
class Inventory(CommonInventory):
715
1015
"""Inventory of versioned files in a tree.
717
1017
This describes which file_id is present at each point in the tree,
877
1181
other.add(entry.copy())
1184
def _get_mutable_inventory(self):
    """See CommonInventory._get_mutable_inventory.

    :return: The result of calling ``deepcopy`` on this inventory, so
        the caller may mutate it without touching ``self``.
    """
    return deepcopy(self)
880
1188
def __iter__(self):
    """Iterate over all file-ids.

    :return: An iterator over ``self._byid``.
    """
    return iter(self._byid)
1192
def iter_just_entries(self):
1193
"""Iterate over all entries.
1195
Unlike iter_entries(), just the entries are returned (not (path, ie))
1196
and the order of entries is undefined.
1198
XXX: We may not want to merge this into bzr.dev.
1200
if self.root is None:
1202
for _, ie in self._byid.iteritems():
883
1205
def __len__(self):
    """Return the number of entries.

    :return: ``len(self._byid)``.
    """
    return len(self._byid)
887
def iter_entries(self, from_dir=None):
888
"""Return (path, entry) pairs, in order by name."""
890
if self.root is None:
894
elif isinstance(from_dir, basestring):
895
from_dir = self._byid[from_dir]
897
# unrolling the recursive call changed the time from
898
# 440ms/663ms (inline/total) to 116ms/116ms
899
children = from_dir.children.items()
901
children = collections.deque(children)
902
stack = [(u'', children)]
904
from_dir_relpath, children = stack[-1]
907
name, ie = children.popleft()
909
# we know that from_dir_relpath never ends in a slash
910
# and 'f' doesn't begin with one, we can do a string op, rather
911
# than the checks of pathjoin(), though this means that all paths
913
path = from_dir_relpath + '/' + name
917
if ie.kind != 'directory':
920
# But do this child first
921
new_children = ie.children.items()
923
new_children = collections.deque(new_children)
924
stack.append((path, new_children))
925
# Break out of inner loop, so that we start outer loop with child
928
# if we finished all children, pop it off the stack
931
def iter_entries_by_dir(self, from_dir=None, specific_file_ids=None,
932
yield_parents=False):
933
"""Iterate over the entries in a directory first order.
935
This returns all entries for a directory before returning
936
the entries for children of a directory. This is not
937
lexicographically sorted order, and is a hybrid between
938
depth-first and breadth-first.
940
:param yield_parents: If True, yield the parents from the root leading
941
down to specific_file_ids that have been requested. This has no
942
impact if specific_file_ids is None.
943
:return: This yields (path, entry) pairs
945
if specific_file_ids and not isinstance(specific_file_ids, set):
946
specific_file_ids = set(specific_file_ids)
947
# TODO? Perhaps this should return the from_dir so that the root is
948
# yielded? or maybe an option?
950
if self.root is None:
952
# Optimize a common case
953
if (not yield_parents and specific_file_ids is not None and
954
len(specific_file_ids) == 1):
955
file_id = list(specific_file_ids)[0]
957
yield self.id2path(file_id), self[file_id]
960
if (specific_file_ids is None or yield_parents or
961
self.root.file_id in specific_file_ids):
963
elif isinstance(from_dir, basestring):
964
from_dir = self._byid[from_dir]
966
if specific_file_ids is not None:
967
# TODO: jam 20070302 This could really be done as a loop rather
968
# than a bunch of recursive calls.
971
def add_ancestors(file_id):
972
if file_id not in byid:
974
parent_id = byid[file_id].parent_id
975
if parent_id is None:
977
if parent_id not in parents:
978
parents.add(parent_id)
979
add_ancestors(parent_id)
980
for file_id in specific_file_ids:
981
add_ancestors(file_id)
985
stack = [(u'', from_dir)]
987
cur_relpath, cur_dir = stack.pop()
990
for child_name, child_ie in sorted(cur_dir.children.iteritems()):
992
child_relpath = cur_relpath + child_name
994
if (specific_file_ids is None or
995
child_ie.file_id in specific_file_ids or
996
(yield_parents and child_ie.file_id in parents)):
997
yield child_relpath, child_ie
999
if child_ie.kind == 'directory':
1000
if parents is None or child_ie.file_id in parents:
1001
child_dirs.append((child_relpath+'/', child_ie))
1002
stack.extend(reversed(child_dirs))
1004
def make_entry(self, kind, name, parent_id, file_id=None):
    """Simple thunk to bzrlib.inventory.make_entry.

    All arguments are forwarded unchanged, in the same order; ``self`` is
    not used.

    :param kind: Forwarded as the first argument.
    :param name: Forwarded as the second argument.
    :param parent_id: Forwarded as the third argument.
    :param file_id: Forwarded as the fourth argument; defaults to None.
    :return: Whatever bzrlib.inventory.make_entry returns.
    """
    return make_entry(kind, name, parent_id, file_id)
1009
"""Return list of (path, ie) for all entries except the root.
1011
This may be faster than iter_entries.
1014
def descend(dir_ie, dir_path):
1015
kids = dir_ie.children.items()
1017
for name, ie in kids:
1018
child_path = osutils.pathjoin(dir_path, name)
1019
accum.append((child_path, ie))
1020
if ie.kind == 'directory':
1021
descend(ie, child_path)
1023
descend(self.root, u'')
1026
def directories(self):
1027
"""Return (path, entry) pairs for all directories, including the root.
1030
def descend(parent_ie, parent_path):
1031
accum.append((parent_path, parent_ie))
1033
kids = [(ie.name, ie) for ie in parent_ie.children.itervalues() if ie.kind == 'directory']
1036
for name, child_ie in kids:
1037
child_path = osutils.pathjoin(parent_path, name)
1038
descend(child_ie, child_path)
1039
descend(self.root, u'')
1042
def __contains__(self, file_id):
1043
"""True if this entry contains a file with given id.
1045
>>> inv = Inventory()
1046
>>> inv.add(InventoryFile('123', 'foo.c', ROOT_ID))
1047
InventoryFile('123', 'foo.c', parent_id='TREE_ROOT', sha1=None, len=None)
1053
return (file_id in self._byid)
1055
1209
def __getitem__(self, file_id):
1056
1210
"""Return the entry for given file_id.
1058
1212
>>> inv = Inventory()
1059
1213
>>> inv.add(InventoryFile('123123', 'hello.c', ROOT_ID))
1060
InventoryFile('123123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None)
1214
InventoryFile('123123', 'hello.c', parent_id='TREE_ROOT', sha1=None, len=None, revision=None)
1061
1215
>>> inv['123123'].name
1338
1433
def is_root(self, file_id):
    """Tell whether file_id is the id of this inventory's root entry.

    :param file_id: The file id to compare against ``self.root.file_id``.
    :return: False when ``self.root`` is None; otherwise the result of
        comparing file_id with the root entry's file_id.
    """
    # Check for a missing root first so that .file_id is never read
    # from None.
    return self.root is not None and file_id == self.root.file_id
1341
def filter(self, specific_fileids):
1342
"""Get an inventory view filtered against a set of file-ids.
1344
Children of directories and parents are included.
1346
The result may or may not reference the underlying inventory
1347
so it should be treated as immutable.
1349
interesting_parents = set()
1350
for fileid in specific_fileids:
1437
class CHKInventory(CommonInventory):
1438
"""An inventory persisted in a CHK store.
1440
By design, a CHKInventory is immutable so many of the methods
1441
supported by Inventory - add, rename, apply_delta, etc - are *not*
1442
supported. To create a new CHKInventory, use create_by_apply_delta()
1443
or from_inventory(), say.
1445
Internally, a CHKInventory has one or two CHKMaps:
1447
* id_to_entry - a map from (file_id,) => InventoryEntry as bytes
1448
* parent_id_basename_to_file_id - a map from (parent_id, basename_utf8)
1451
The second map is optional and not present in early CHKRepositories.
1453
No caching is performed: every method call or item access will perform
1454
requests to the storage layer. As such, keep references to objects you
1458
def __init__(self, search_key_name):
    """Initialise empty caches and record the search key name.

    :param search_key_name: Stored as ``self._search_key_name``. Other
        code in this file passes it to
        ``chk_map.search_key_registry.get()``.
    """
    CommonInventory.__init__(self)
    # Both caches start empty.
    self._fileid_to_entry_cache = {}
    self._path_to_fileid_cache = {}
    self._search_key_name = search_key_name
1464
def _entry_to_bytes(self, entry):
1465
"""Serialise entry as a single bytestring.
1467
:param entry: An inventory entry.
1468
:return: A bytestring for the entry.
1471
ENTRY ::= FILE | DIR | SYMLINK | TREE
1472
FILE ::= "file: " COMMON SEP SHA SEP SIZE SEP EXECUTABLE
1473
DIR ::= "dir: " COMMON
1474
SYMLINK ::= "symlink: " COMMON SEP TARGET_UTF8
1475
TREE ::= "tree: " COMMON REFERENCE_REVISION
1476
COMMON ::= FILE_ID SEP PARENT_ID SEP NAME_UTF8 SEP REVISION
1479
if entry.parent_id is not None:
1480
parent_str = entry.parent_id
1483
name_str = entry.name.encode("utf8")
1484
if entry.kind == 'file':
1485
if entry.executable:
1489
return "file: %s\n%s\n%s\n%s\n%s\n%d\n%s" % (
1490
entry.file_id, parent_str, name_str, entry.revision,
1491
entry.text_sha1, entry.text_size, exec_str)
1492
elif entry.kind == 'directory':
1493
return "dir: %s\n%s\n%s\n%s" % (
1494
entry.file_id, parent_str, name_str, entry.revision)
1495
elif entry.kind == 'symlink':
1496
return "symlink: %s\n%s\n%s\n%s\n%s" % (
1497
entry.file_id, parent_str, name_str, entry.revision,
1498
entry.symlink_target.encode("utf8"))
1499
elif entry.kind == 'tree-reference':
1500
return "tree: %s\n%s\n%s\n%s\n%s" % (
1501
entry.file_id, parent_str, name_str, entry.revision,
1502
entry.reference_revision)
1504
raise ValueError("unknown kind %r" % entry.kind)
1507
def _bytes_to_utf8name_key(bytes):
    """Get the (name, file_id, revision_id) key out of bytes.

    The serialised form is newline separated: the first section is
    ``"<kind>: <file_id>"``, the third is the utf8 name and the fourth is
    the revision.

    :param bytes: A serialised inventory entry.
    :return: A tuple ``(sections[2], file_id, sections[3])``.
    :raises ValueError: if the first section contains no ``': '``
        separator.
    """
    # We don't normally care about name, except for times when we want
    # to filter out empty names because of non rich-root...
    sections = bytes.split('\n')
    # Split on the first ': ' only, so a file_id that itself contains
    # ': ' is kept whole instead of breaking the two-way unpack.
    kind, file_id = sections[0].split(': ', 1)
    return (sections[2], file_id, sections[3])
1515
def _bytes_to_entry(self, bytes):
1516
"""Deserialise a serialised entry."""
1517
sections = bytes.split('\n')
1518
if sections[0].startswith("file: "):
1519
result = InventoryFile(sections[0][6:],
1520
sections[2].decode('utf8'),
1522
result.text_sha1 = sections[4]
1523
result.text_size = int(sections[5])
1524
result.executable = sections[6] == "Y"
1525
elif sections[0].startswith("dir: "):
1526
result = CHKInventoryDirectory(sections[0][5:],
1527
sections[2].decode('utf8'),
1529
elif sections[0].startswith("symlink: "):
1530
result = InventoryLink(sections[0][9:],
1531
sections[2].decode('utf8'),
1533
result.symlink_target = sections[4].decode('utf8')
1534
elif sections[0].startswith("tree: "):
1535
result = TreeReference(sections[0][6:],
1536
sections[2].decode('utf8'),
1538
result.reference_revision = sections[4]
1540
raise ValueError("Not a serialised entry %r" % bytes)
1541
result.revision = sections[3]
1542
if result.parent_id == '':
1543
result.parent_id = None
1544
self._fileid_to_entry_cache[result.file_id] = result
1547
def _get_mutable_inventory(self):
1548
"""See CommonInventory._get_mutable_inventory."""
1549
entries = self.iter_entries()
1550
if self.root_id is not None:
1552
inv = Inventory(self.root_id, self.revision_id)
1553
for path, inv_entry in entries:
1557
def create_by_apply_delta(self, inventory_delta, new_revision_id,
1558
propagate_caches=False):
1559
"""Create a new CHKInventory by applying inventory_delta to this one.
1561
:param inventory_delta: The inventory delta to apply. See
1562
Inventory.apply_delta for details.
1563
:param new_revision_id: The revision id of the resulting CHKInventory.
1564
:param propagate_caches: If True, the caches for this inventory are
1565
copied to and updated for the result.
1566
:return: The new CHKInventory.
1568
result = CHKInventory(self._search_key_name)
1569
if propagate_caches:
1570
# Just propagate the path-to-fileid cache for now
1571
result._path_to_fileid_cache = dict(self._path_to_fileid_cache.iteritems())
1572
search_key_func = chk_map.search_key_registry.get(self._search_key_name)
1573
self.id_to_entry._ensure_root()
1574
maximum_size = self.id_to_entry._root_node.maximum_size
1575
result.revision_id = new_revision_id
1576
result.id_to_entry = chk_map.CHKMap(
1577
self.id_to_entry._store,
1578
self.id_to_entry.key(),
1579
search_key_func=search_key_func)
1580
result.id_to_entry._ensure_root()
1581
result.id_to_entry._root_node.set_maximum_size(maximum_size)
1582
parent_id_basename_delta = []
1583
if self.parent_id_basename_to_file_id is not None:
1584
result.parent_id_basename_to_file_id = chk_map.CHKMap(
1585
self.parent_id_basename_to_file_id._store,
1586
self.parent_id_basename_to_file_id.key(),
1587
search_key_func=search_key_func)
1588
result.parent_id_basename_to_file_id._ensure_root()
1589
self.parent_id_basename_to_file_id._ensure_root()
1590
result_p_id_root = result.parent_id_basename_to_file_id._root_node
1591
p_id_root = self.parent_id_basename_to_file_id._root_node
1592
result_p_id_root.set_maximum_size(p_id_root.maximum_size)
1593
result_p_id_root._key_width = p_id_root._key_width
1595
result.parent_id_basename_to_file_id = None
1596
result.root_id = self.root_id
1597
id_to_entry_delta = []
1598
for old_path, new_path, file_id, entry in inventory_delta:
1601
result.root_id = file_id
1602
if new_path is None:
1607
if propagate_caches:
1609
del result._path_to_fileid_cache[old_path]
1613
new_key = (file_id,)
1614
new_value = result._entry_to_bytes(entry)
1615
# Update caches. It's worth doing this whether
1616
# we're propagating the old caches or not.
1617
result._path_to_fileid_cache[new_path] = file_id
1618
if old_path is None:
1621
old_key = (file_id,)
1622
id_to_entry_delta.append((old_key, new_key, new_value))
1623
if result.parent_id_basename_to_file_id is not None:
1624
# parent_id, basename changes
1625
if old_path is None:
1628
old_entry = self[file_id]
1629
old_key = self._parent_id_basename_key(old_entry)
1630
if new_path is None:
1634
new_key = self._parent_id_basename_key(entry)
1636
if old_key != new_key:
1637
# If the two keys are the same, the value will be unchanged
1638
# as its always the file id.
1639
parent_id_basename_delta.append((old_key, new_key, new_value))
1640
result.id_to_entry.apply_delta(id_to_entry_delta)
1641
if parent_id_basename_delta:
1642
result.parent_id_basename_to_file_id.apply_delta(parent_id_basename_delta)
1646
def deserialise(klass, chk_store, bytes, expected_revision_id):
1647
"""Deserialise a CHKInventory.
1649
:param chk_store: A CHK capable VersionedFiles instance.
1650
:param bytes: The serialised bytes.
1651
:param expected_revision_id: The revision ID we think this inventory is
1653
:return: A CHKInventory
1655
lines = bytes.split('\n')
1656
assert lines[-1] == ''
1658
if lines[0] != 'chkinventory:':
1659
raise ValueError("not a serialised CHKInventory: %r" % bytes)
1661
allowed_keys = frozenset(['root_id', 'revision_id', 'search_key_name',
1662
'parent_id_basename_to_file_id',
1664
for line in lines[1:]:
1665
key, value = line.split(': ', 1)
1666
if key not in allowed_keys:
1667
raise errors.BzrError('Unknown key in inventory: %r\n%r'
1670
raise errors.BzrError('Duplicate key in inventory: %r\n%r'
1673
revision_id = info['revision_id']
1674
root_id = info['root_id']
1675
search_key_name = info.get('search_key_name', 'plain')
1676
parent_id_basename_to_file_id = info.get(
1677
'parent_id_basename_to_file_id', None)
1678
id_to_entry = info['id_to_entry']
1680
result = CHKInventory(search_key_name)
1681
result.revision_id = revision_id
1682
result.root_id = root_id
1683
search_key_func = chk_map.search_key_registry.get(
1684
result._search_key_name)
1685
if parent_id_basename_to_file_id is not None:
1686
result.parent_id_basename_to_file_id = chk_map.CHKMap(
1687
chk_store, (parent_id_basename_to_file_id,),
1688
search_key_func=search_key_func)
1690
result.parent_id_basename_to_file_id = None
1692
result.id_to_entry = chk_map.CHKMap(chk_store, (id_to_entry,),
1693
search_key_func=search_key_func)
1694
if (result.revision_id,) != expected_revision_id:
1695
raise ValueError("Mismatched revision id and expected: %r, %r" %
1696
(result.revision_id, expected_revision_id))
1700
def from_inventory(klass, chk_store, inventory, maximum_size=0, search_key_name='plain'):
1701
"""Create a CHKInventory from an existing inventory.
1703
The content of inventory is copied into the chk_store, and a
1704
CHKInventory referencing that is returned.
1706
:param chk_store: A CHK capable VersionedFiles instance.
1707
:param inventory: The inventory to copy.
1708
:param maximum_size: The CHKMap node size limit.
1709
:param search_key_name: The identifier for the search key function
1711
result = CHKInventory(search_key_name)
1712
result.revision_id = inventory.revision_id
1713
result.root_id = inventory.root.file_id
1714
search_key_func = chk_map.search_key_registry.get(search_key_name)
1715
result.id_to_entry = chk_map.CHKMap(chk_store, None, search_key_func)
1716
result.id_to_entry._root_node.set_maximum_size(maximum_size)
1718
result.parent_id_basename_to_file_id = chk_map.CHKMap(chk_store,
1719
None, search_key_func)
1720
result.parent_id_basename_to_file_id._root_node.set_maximum_size(
1722
result.parent_id_basename_to_file_id._root_node._key_width = 2
1723
parent_id_delta = []
1724
for path, entry in inventory.iter_entries():
1725
file_id_delta.append((None, (entry.file_id,),
1726
result._entry_to_bytes(entry)))
1727
parent_id_delta.append(
1728
(None, result._parent_id_basename_key(entry),
1730
result.id_to_entry.apply_delta(file_id_delta)
1731
result.parent_id_basename_to_file_id.apply_delta(parent_id_delta)
1734
def _parent_id_basename_key(self, entry):
1735
"""Create a key for a entry in a parent_id_basename_to_file_id index."""
1736
if entry.parent_id is not None:
1737
parent_id = entry.parent_id
1740
return parent_id, entry.name.encode('utf8')
1742
def __getitem__(self, file_id):
1743
"""map a single file_id -> InventoryEntry."""
1745
raise errors.NoSuchId(self, file_id)
1746
result = self._fileid_to_entry_cache.get(file_id, None)
1747
if result is not None:
1750
return self._bytes_to_entry(
1751
self.id_to_entry.iteritems([(file_id,)]).next()[1])
1752
except StopIteration:
1753
# really we're passing an inventory, not a tree...
1754
raise errors.NoSuchId(self, file_id)
1756
def has_id(self, file_id):
1757
# Perhaps have an explicit 'contains' method on CHKMap ?
1758
if self._fileid_to_entry_cache.get(file_id, None) is not None:
1760
return len(list(self.id_to_entry.iteritems([(file_id,)]))) == 1
1762
def is_root(self, file_id):
    """Tell whether file_id is this inventory's root id.

    :param file_id: The file id to compare against ``self.root_id``.
    :return: True when file_id equals ``self.root_id``, else False.
    """
    return file_id == self.root_id
1765
def _iter_file_id_parents(self, file_id):
1766
"""Yield the parents of file_id up to the root."""
1767
while file_id is not None:
1352
interesting_parents.update(self.get_idpath(fileid))
1353
except errors.NoSuchId:
1354
# This fileid is not in the inventory - that's ok
1356
entries = self.iter_entries()
1357
if self.root is None:
1358
return Inventory(root_id=None)
1359
other = Inventory(entries.next()[1].file_id)
1360
other.root.revision = self.root.revision
1361
other.revision_id = self.revision_id
1362
directories_to_expand = set()
1363
for path, entry in entries:
1364
file_id = entry.file_id
1365
if (file_id in specific_fileids
1366
or entry.parent_id in directories_to_expand):
1367
if entry.kind == 'directory':
1368
directories_to_expand.add(file_id)
1369
elif file_id not in interesting_parents:
1771
raise errors.NoSuchId(tree=self, file_id=file_id)
1773
file_id = ie.parent_id
1776
"""Iterate over all file-ids."""
1777
for key, _ in self.id_to_entry.iteritems():
1780
def iter_just_entries(self):
1781
"""Iterate over all entries.
1783
Unlike iter_entries(), just the entries are returned (not (path, ie))
1784
and the order of entries is undefined.
1786
XXX: We may not want to merge this into bzr.dev.
1788
for key, entry in self.id_to_entry.iteritems():
1790
ie = self._fileid_to_entry_cache.get(file_id, None)
1792
ie = self._bytes_to_entry(entry)
1793
self._fileid_to_entry_cache[file_id] = ie
1796
def iter_changes(self, basis):
1797
"""Generate a Tree.iter_changes change list between this and basis.
1799
:param basis: Another CHKInventory.
1800
:return: An iterator over the changes between self and basis, as per
1801
tree.iter_changes().
1803
# We want: (file_id, (path_in_source, path_in_target),
1804
# changed_content, versioned, parent, name, kind,
1806
for key, basis_value, self_value in \
1807
self.id_to_entry.iter_changes(basis.id_to_entry):
1809
if basis_value is not None:
1810
basis_entry = basis._bytes_to_entry(basis_value)
1811
path_in_source = basis.id2path(file_id)
1812
basis_parent = basis_entry.parent_id
1813
basis_name = basis_entry.name
1814
basis_executable = basis_entry.executable
1816
path_in_source = None
1819
basis_executable = None
1820
if self_value is not None:
1821
self_entry = self._bytes_to_entry(self_value)
1822
path_in_target = self.id2path(file_id)
1823
self_parent = self_entry.parent_id
1824
self_name = self_entry.name
1825
self_executable = self_entry.executable
1827
path_in_target = None
1830
self_executable = None
1831
if basis_value is None:
1833
kind = (None, self_entry.kind)
1834
versioned = (False, True)
1835
elif self_value is None:
1837
kind = (basis_entry.kind, None)
1838
versioned = (True, False)
1840
kind = (basis_entry.kind, self_entry.kind)
1841
versioned = (True, True)
1842
changed_content = False
1843
if kind[0] != kind[1]:
1844
changed_content = True
1845
elif kind[0] == 'file':
1846
if (self_entry.text_size != basis_entry.text_size or
1847
self_entry.text_sha1 != basis_entry.text_sha1):
1848
changed_content = True
1849
elif kind[0] == 'symlink':
1850
if self_entry.symlink_target != basis_entry.symlink_target:
1851
changed_content = True
1852
elif kind[0] == 'tree-reference':
1853
if (self_entry.reference_revision !=
1854
basis_entry.reference_revision):
1855
changed_content = True
1856
parent = (basis_parent, self_parent)
1857
name = (basis_name, self_name)
1858
executable = (basis_executable, self_executable)
1859
if (not changed_content
1860
and parent[0] == parent[1]
1861
and name[0] == name[1]
1862
and executable[0] == executable[1]):
1863
# Could happen when only the revision changed for a directory
1371
other.add(entry.copy())
1866
yield (file_id, (path_in_source, path_in_target), changed_content,
1867
versioned, parent, name, kind, executable)
1870
"""Return the number of entries in the inventory."""
1871
return len(self.id_to_entry)
1873
def _make_delta(self, old):
1874
"""Make an inventory delta from two inventories."""
1875
if type(old) != CHKInventory:
1876
return CommonInventory._make_delta(self, old)
1878
for key, old_value, self_value in \
1879
self.id_to_entry.iter_changes(old.id_to_entry):
1881
if old_value is not None:
1882
old_path = old.id2path(file_id)
1885
if self_value is not None:
1886
entry = self._bytes_to_entry(self_value)
1887
self._fileid_to_entry_cache[file_id] = entry
1888
new_path = self.id2path(file_id)
1892
delta.append((old_path, new_path, file_id, entry))
1895
def path2id(self, name):
1896
"""See CommonInventory.path2id()."""
1897
result = self._path_to_fileid_cache.get(name, None)
1899
result = CommonInventory.path2id(self, name)
1900
self._path_to_fileid_cache[name] = result
1904
"""Serialise the inventory to lines."""
1905
lines = ["chkinventory:\n"]
1906
if self._search_key_name != 'plain':
1907
# custom ordering grouping things that don't change together
1908
lines.append('search_key_name: %s\n' % (self._search_key_name,))
1909
lines.append("root_id: %s\n" % self.root_id)
1910
lines.append('parent_id_basename_to_file_id: %s\n' %
1911
self.parent_id_basename_to_file_id.key())
1912
lines.append("revision_id: %s\n" % self.revision_id)
1913
lines.append("id_to_entry: %s\n" % self.id_to_entry.key())
1915
lines.append("revision_id: %s\n" % self.revision_id)
1916
lines.append("root_id: %s\n" % self.root_id)
1917
if self.parent_id_basename_to_file_id is not None:
1918
lines.append('parent_id_basename_to_file_id: %s\n' %
1919
self.parent_id_basename_to_file_id.key())
1920
lines.append("id_to_entry: %s\n" % self.id_to_entry.key())
1925
"""Get the root entry."""
1926
return self[self.root_id]
1929
class CHKInventoryDirectory(InventoryDirectory):
1930
"""A directory in an inventory."""
1932
__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',
1933
'text_id', 'parent_id', '_children', 'executable',
1934
'revision', 'symlink_target', 'reference_revision',
1937
def __init__(self, file_id, name, parent_id, chk_inventory):
1938
# Don't call InventoryDirectory.__init__ - it isn't right for this
1940
InventoryEntry.__init__(self, file_id, name, parent_id)
1941
self._children = None
1942
self.kind = 'directory'
1943
self._chk_inventory = chk_inventory
1947
"""Access the list of children of this directory.
1949
With a parent_id_basename_to_file_id index, loads all the children,
1950
without loads the entire index. Without is bad. A more sophisticated
1951
proxy object might be nice, to allow partial loading of children as
1952
well when specific names are accessed. (So path traversal can be
1953
written in the obvious way but not examine siblings.).
1955
if self._children is not None:
1956
return self._children
1957
# No longer supported
1958
if self._chk_inventory.parent_id_basename_to_file_id is None:
1959
raise AssertionError("Inventories without"
1960
" parent_id_basename_to_file_id are no longer supported")
1962
# XXX: Todo - use proxy objects for the children rather than loading
1963
# all when the attribute is referenced.
1964
parent_id_index = self._chk_inventory.parent_id_basename_to_file_id
1966
for (parent_id, name_utf8), file_id in parent_id_index.iteritems(
1967
key_filter=[(self.file_id,)]):
1968
child_keys.add((file_id,))
1970
for file_id_key in child_keys:
1971
entry = self._chk_inventory._fileid_to_entry_cache.get(
1972
file_id_key[0], None)
1973
if entry is not None:
1974
result[entry.name] = entry
1975
cached.add(file_id_key)
1976
child_keys.difference_update(cached)
1977
# populate; todo: do by name
1978
id_to_entry = self._chk_inventory.id_to_entry
1979
for file_id_key, bytes in id_to_entry.iteritems(child_keys):
1980
entry = self._chk_inventory._bytes_to_entry(bytes)
1981
result[entry.name] = entry
1982
self._chk_inventory._fileid_to_entry_cache[file_id_key[0]] = entry
1983
self._children = result
1375
1987
entry_factory = {