34
45
An InventoryEntry has the following fields, which are also
35
46
present in the XML inventory-entry element:
38
* *name*: (only the basename within the directory, must not
40
* *kind*: "directory" or "file"
41
* *directory_id*: (if absent/null means the branch root directory)
42
* *text_sha1*: only for files
43
* *text_size*: in bytes, only for files
44
* *text_id*: identifier for the text version, only for files
46
InventoryEntries can also exist inside a WorkingTree
47
inventory, in which case they are not yet bound to a
48
particular revision of the file. In that case the text_sha1,
49
text_size and text_id are absent.
51
(within the parent directory)
54
file_id of the parent directory, or ROOT_ID
57
the revision_id in which this variation of this file was
61
Indicates that this file should be executable on systems
65
sha-1 of the text of the file
68
size in bytes of the text of the file
70
(reading a version 4 tree created a text_id field.)
52
72
>>> i = Inventory()
55
>>> i.add(InventoryEntry('123', 'src', 'directory', ROOT_ID))
56
>>> i.add(InventoryEntry('2323', 'hello.c', 'file', parent_id='123'))
75
>>> i.add(InventoryDirectory('123', 'src', ROOT_ID))
76
InventoryDirectory('123', 'src', parent_id='TREE_ROOT')
77
>>> i.add(InventoryFile('2323', 'hello.c', parent_id='123'))
78
InventoryFile('2323', 'hello.c', parent_id='123')
57
79
>>> for j in i.iter_entries():
60
('src', InventoryEntry('123', 'src', kind='directory', parent_id='TREE_ROOT'))
61
('src/hello.c', InventoryEntry('2323', 'hello.c', kind='file', parent_id='123'))
62
>>> i.add(InventoryEntry('2323', 'bye.c', 'file', '123'))
82
('src', InventoryDirectory('123', 'src', parent_id='TREE_ROOT'))
83
('src/hello.c', InventoryFile('2323', 'hello.c', parent_id='123'))
84
>>> i.add(InventoryFile('2323', 'bye.c', '123'))
63
85
Traceback (most recent call last):
65
87
BzrError: inventory already contains entry with id {2323}
66
>>> i.add(InventoryEntry('2324', 'bye.c', 'file', '123'))
67
>>> i.add(InventoryEntry('2325', 'wibble', 'directory', '123'))
88
>>> i.add(InventoryFile('2324', 'bye.c', '123'))
89
InventoryFile('2324', 'bye.c', parent_id='123')
90
>>> i.add(InventoryDirectory('2325', 'wibble', '123'))
91
InventoryDirectory('2325', 'wibble', parent_id='123')
68
92
>>> i.path2id('src/wibble')
72
>>> i.add(InventoryEntry('2326', 'wibble.c', 'file', '2325'))
96
>>> i.add(InventoryFile('2326', 'wibble.c', '2325'))
97
InventoryFile('2326', 'wibble.c', parent_id='2325')
74
InventoryEntry('2326', 'wibble.c', kind='file', parent_id='2325')
75
>>> for j in i.iter_entries():
77
... assert i.path2id(j[0])
99
InventoryFile('2326', 'wibble.c', parent_id='2325')
100
>>> for path, entry in i.iter_entries():
101
... print path.replace('\\\\', '/') # for win32 os.sep
102
... assert i.path2id(path)
83
108
src/wibble/wibble.c
109
>>> i.id2path('2326').replace('\\\\', '/')
85
110
'src/wibble/wibble.c'
87
TODO: Maybe also keep the full path of the entry, and the children?
88
But those depend on its position within a particular inventory, and
89
it would be nice not to need to hold the backpointer here.
92
# TODO: split InventoryEntry into subclasses for files,
93
# directories, etc etc.
95
113
__slots__ = ['text_sha1', 'text_size', 'file_id', 'name', 'kind',
96
'text_id', 'parent_id', 'children', ]
98
def __init__(self, file_id, name, kind, parent_id, text_id=None):
114
'text_id', 'parent_id', 'children', 'executable',
117
def _add_text_to_weave(self, new_lines, parents, weave_store, transaction):
118
weave_store.add_text(self.file_id, self.revision, new_lines, parents,
121
def detect_changes(self, old_entry):
122
"""Return a (text_modified, meta_modified) from this to old_entry.
124
_read_tree_state must have been called on self and old_entry prior to
125
calling detect_changes.
129
def diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,
130
output_to, reverse=False):
131
"""Perform a diff from this to to_entry.
133
text_diff will be used for textual difference calculation.
134
This is a template method, override _diff in child classes.
136
self._read_tree_state(tree)
138
# cannot diff from one kind to another - you must do a removal
139
# and an add if they do not match.
140
assert self.kind == to_entry.kind
141
to_entry._read_tree_state(to_tree)
142
self._diff(text_diff, from_label, tree, to_label, to_entry, to_tree,
145
def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,
146
output_to, reverse=False):
147
"""Perform a diff between two entries of the same kind."""
149
def find_previous_heads(self, previous_inventories, entry_weave):
150
"""Return the revisions and entries that directly precede this.
152
Returned as a map from revision to inventory entry.
154
This is a map containing the file revisions in all parents
155
for which the file exists, and its revision is not a parent of
156
any other. If the file is new, the set will be empty.
158
def get_ancestors(weave, entry):
159
return set(map(weave.idx_to_name,
160
weave.inclusions([weave.lookup(entry.revision)])))
163
for inv in previous_inventories:
164
if self.file_id in inv:
165
ie = inv[self.file_id]
166
assert ie.file_id == self.file_id
167
if ie.revision in heads:
168
# fixup logic, there was a bug in revision updates.
169
# with x bit support.
171
if heads[ie.revision].executable != ie.executable:
172
heads[ie.revision].executable = False
173
ie.executable = False
174
except AttributeError:
176
assert heads[ie.revision] == ie
178
# may want to add it.
179
# may already be covered:
180
already_present = 0 != len(
181
[head for head in heads
182
if ie.revision in head_ancestors[head]])
184
# an ancestor of a known head.
187
ancestors = get_ancestors(entry_weave, ie)
188
# may knock something else out:
189
check_heads = list(heads.keys())
190
for head in check_heads:
191
if head in ancestors:
192
# this head is not really a head
194
head_ancestors[ie.revision] = ancestors
195
heads[ie.revision] = ie
198
def get_tar_item(self, root, dp, now, tree):
199
"""Get a tarfile item and a file stream for its content."""
200
item = tarfile.TarInfo(os.path.join(root, dp))
201
# TODO: would be cool to actually set it to the timestamp of the
202
# revision it was last changed
204
fileobj = self._put_in_tar(item, tree)
208
"""Return true if the object this entry represents has textual data.
210
Note that textual data includes binary content.
212
Also note that all entries get weave files created for them.
213
This attribute is primarily used when upgrading from old trees that
214
did not have the weave index for all inventory entries.
218
def __init__(self, file_id, name, parent_id, text_id=None):
99
219
"""Create an InventoryEntry
101
221
The filename must be a single component, relative to the
102
222
parent directory; it cannot be a whole path or relative name.
104
>>> e = InventoryEntry('123', 'hello.c', 'file', ROOT_ID)
224
>>> e = InventoryFile('123', 'hello.c', ROOT_ID)
109
>>> e = InventoryEntry('123', 'src/hello.c', 'file', ROOT_ID)
229
>>> e = InventoryFile('123', 'src/hello.c', ROOT_ID)
110
230
Traceback (most recent call last):
111
231
BzrCheckError: InventoryEntry name 'src/hello.c' is invalid
233
assert isinstance(name, basestring), name
113
234
if '/' in name or '\\' in name:
114
235
raise BzrCheckError('InventoryEntry name %r is invalid' % name)
237
self.executable = False
116
239
self.text_sha1 = None
117
240
self.text_size = None
119
241
self.file_id = file_id
122
243
self.text_id = text_id
123
244
self.parent_id = parent_id
124
if kind == 'directory':
129
raise BzrError("unhandled entry kind %r" % kind)
245
self.symlink_target = None
247
def kind_character(self):
    """Return a short kind indicator useful for appending to names.

    The generic entry has no indicator of its own, so this always raises
    BzrError naming self.kind; kind-specific subclasses override it.
    """
    # Wrap the operand in a tuple so a tuple-valued kind cannot be
    # mistaken for multiple format arguments.
    raise BzrError('unknown kind %r' % (self.kind,))
251
known_kinds = ('file', 'directory', 'symlink', 'root_directory')
253
def _put_in_tar(self, item, tree):
254
"""populate item for stashing in a tar, and return the content stream.
256
If no content is available, return None.
258
raise BzrError("don't know how to export {%s} of kind %r" %
259
(self.file_id, self.kind))
261
def put_on_disk(self, dest, dp, tree):
262
"""Create a representation of self on disk in the prefix dest.
264
This is a template method - implement _put_on_disk in subclasses.
266
fullpath = appendpath(dest, dp)
267
self._put_on_disk(fullpath, tree)
268
mutter(" export {%s} kind %s to %s" % (self.file_id, self.kind, fullpath))
270
def _put_on_disk(self, fullpath, tree):
    """Put this entry onto disk at fullpath, from tree tree.

    This is the kind-specific hook called by put_on_disk().  The generic
    entry cannot be exported, so this always raises BzrError naming the
    file_id and kind; subclasses provide the real implementation.
    """
    raise BzrError("don't know how to export {%s} of kind %r"
                   % (self.file_id, self.kind))
133
274
def sorted_children(self):
134
275
l = self.children.items()
280
def versionable_kind(kind):
    """Return True if kind is 'file', 'directory' or 'symlink'.

    Any other value (including 'root_directory') yields False.
    """
    return kind in ('file', 'directory', 'symlink')
283
def check(self, checker, rev_id, inv, tree):
284
"""Check this inventory entry is intact.
286
This is a template method, override _check for kind specific
289
if self.parent_id != None:
290
if not inv.has_id(self.parent_id):
291
raise BzrCheckError('missing parent {%s} in inventory for revision {%s}'
292
% (self.parent_id, rev_id))
293
self._check(checker, rev_id, tree)
295
def _check(self, checker, rev_id, tree):
296
"""Check this inventory entry for kind specific errors."""
297
raise BzrCheckError('unknown entry kind %r in revision {%s}' %
140
other = InventoryEntry(self.file_id, self.name, self.kind,
141
self.parent_id, text_id=self.text_id)
142
other.text_sha1 = self.text_sha1
143
other.text_size = self.text_size
144
# note that children are *not* copied; they're pulled across when
302
"""Clone this inventory entry."""
303
raise NotImplementedError
305
def _get_snapshot_change(self, previous_entries):
306
if len(previous_entries) > 1:
308
elif len(previous_entries) == 0:
311
return 'modified/renamed/reparented'
149
313
def __repr__(self):
150
return ("%s(%r, %r, kind=%r, parent_id=%r)"
314
return ("%s(%r, %r, parent_id=%r)"
151
315
% (self.__class__.__name__,
158
def to_element(self):
159
"""Convert to XML element"""
160
from bzrlib.xml import Element
164
e.set('name', self.name)
165
e.set('file_id', self.file_id)
166
e.set('kind', self.kind)
168
if self.text_size != None:
169
e.set('text_size', '%d' % self.text_size)
171
for f in ['text_id', 'text_sha1']:
176
# to be conservative, we don't externalize the root pointers
177
# for now, leaving them as null in the xml form. in a future
178
# version it will be implied by nested elements.
179
if self.parent_id != ROOT_ID:
180
assert isinstance(self.parent_id, basestring)
181
e.set('parent_id', self.parent_id)
188
def from_element(cls, elt):
189
assert elt.tag == 'entry'
191
## original format inventories don't have a parent_id for
192
## nodes in the root directory, but it's cleaner to use one
194
parent_id = elt.get('parent_id')
195
if parent_id == None:
198
self = cls(elt.get('file_id'), elt.get('name'), elt.get('kind'), parent_id)
199
self.text_id = elt.get('text_id')
200
self.text_sha1 = elt.get('text_sha1')
202
## mutter("read inventoryentry: %r" % (elt.attrib))
204
v = elt.get('text_size')
205
self.text_size = v and int(v)
210
from_element = classmethod(from_element)
320
def snapshot(self, revision, path, previous_entries,
321
work_tree, weave_store, transaction):
322
"""Make a snapshot of this entry which may or may not have changed.
324
This means that all its fields are populated, that it has its
325
text stored in the text store or weave.
327
mutter('new parents of %s are %r', path, previous_entries)
328
self._read_tree_state(work_tree)
329
if len(previous_entries) == 1:
330
# cannot be unchanged unless there is only one parent file rev.
331
parent_ie = previous_entries.values()[0]
332
if self._unchanged(parent_ie):
333
mutter("found unchanged entry")
334
self.revision = parent_ie.revision
336
return self.snapshot_revision(revision, previous_entries,
337
work_tree, weave_store, transaction)
339
def snapshot_revision(self, revision, previous_entries, work_tree,
340
weave_store, transaction):
341
"""Record this revision unconditionally."""
342
mutter('new revision for {%s}', self.file_id)
343
self.revision = revision
344
change = self._get_snapshot_change(previous_entries)
345
self._snapshot_text(previous_entries, work_tree, weave_store,
349
def _snapshot_text(self, file_parents, work_tree, weave_store, transaction):
350
"""Record the 'text' of this entry, whatever form that takes.
352
This default implementation simply adds an empty text.
354
mutter('storing file {%s} in revision {%s}',
355
self.file_id, self.revision)
356
self._add_text_to_weave([], file_parents, weave_store, transaction)
212
358
def __eq__(self, other):
213
359
if not isinstance(other, InventoryEntry):
214
360
return NotImplemented
216
return (self.file_id == other.file_id) \
217
and (self.name == other.name) \
218
and (self.text_sha1 == other.text_sha1) \
219
and (self.text_size == other.text_size) \
220
and (self.text_id == other.text_id) \
221
and (self.parent_id == other.parent_id) \
222
and (self.kind == other.kind)
362
return ((self.file_id == other.file_id)
363
and (self.name == other.name)
364
and (other.symlink_target == self.symlink_target)
365
and (self.text_sha1 == other.text_sha1)
366
and (self.text_size == other.text_size)
367
and (self.text_id == other.text_id)
368
and (self.parent_id == other.parent_id)
369
and (self.kind == other.kind)
370
and (self.revision == other.revision)
371
and (self.executable == other.executable)
225
374
def __ne__(self, other):
226
375
return not (self == other)
246
423
and (self.children == other.children)
426
class InventoryDirectory(InventoryEntry):
427
"""A directory in an inventory."""
429
def _check(self, checker, rev_id, tree):
430
"""See InventoryEntry._check"""
431
if self.text_sha1 != None or self.text_size != None or self.text_id != None:
432
raise BzrCheckError('directory {%s} has text in revision {%s}'
433
% (self.file_id, rev_id))
436
other = InventoryDirectory(self.file_id, self.name, self.parent_id)
437
other.revision = self.revision
438
# note that children are *not* copied; they're pulled across when
442
def __init__(self, file_id, name, parent_id):
443
super(InventoryDirectory, self).__init__(file_id, name, parent_id)
445
self.kind = 'directory'
447
def kind_character(self):
448
"""See InventoryEntry.kind_character."""
451
def _put_in_tar(self, item, tree):
452
"""See InventoryEntry._put_in_tar."""
453
item.type = tarfile.DIRTYPE
460
def _put_on_disk(self, fullpath, tree):
461
"""See InventoryEntry._put_on_disk."""
465
class InventoryFile(InventoryEntry):
466
"""A file in an inventory."""
468
def _check(self, checker, rev_id, tree):
469
"""See InventoryEntry._check"""
470
revision = self.revision
471
t = (self.file_id, revision)
472
if t in checker.checked_texts:
473
prev_sha = checker.checked_texts[t]
474
if prev_sha != self.text_sha1:
475
raise BzrCheckError('mismatched sha1 on {%s} in {%s}' %
476
(self.file_id, rev_id))
478
checker.repeated_text_cnt += 1
480
mutter('check version {%s} of {%s}', rev_id, self.file_id)
481
file_lines = tree.get_file_lines(self.file_id)
482
checker.checked_text_cnt += 1
483
if self.text_size != sum(map(len, file_lines)):
484
raise BzrCheckError('text {%s} wrong size' % self.text_id)
485
if self.text_sha1 != sha_strings(file_lines):
486
raise BzrCheckError('text {%s} wrong sha1' % self.text_id)
487
checker.checked_texts[t] = self.text_sha1
490
other = InventoryFile(self.file_id, self.name, self.parent_id)
491
other.executable = self.executable
492
other.text_id = self.text_id
493
other.text_sha1 = self.text_sha1
494
other.text_size = self.text_size
495
other.revision = self.revision
498
def detect_changes(self, old_entry):
    """See InventoryEntry.detect_changes.

    Both self and old_entry must already have text_sha1 populated
    (_read_tree_state must have been called on them beforehand); this is
    asserted.

    Returns a (text_modified, meta_modified) tuple: text_modified is True
    when the sha1 of the text differs, meta_modified is True when the
    executable flag differs.
    """
    assert self.text_sha1 is not None
    assert old_entry.text_sha1 is not None
    text_modified = (self.text_sha1 != old_entry.text_sha1)
    meta_modified = (self.executable != old_entry.executable)
    return text_modified, meta_modified
506
def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,
507
output_to, reverse=False):
508
"""See InventoryEntry._diff."""
509
from_text = tree.get_file(self.file_id).readlines()
511
to_text = to_tree.get_file(to_entry.file_id).readlines()
515
text_diff(from_label, from_text,
516
to_label, to_text, output_to)
518
text_diff(to_label, to_text,
519
from_label, from_text, output_to)
522
"""See InventoryEntry.has_text."""
525
def __init__(self, file_id, name, parent_id):
526
super(InventoryFile, self).__init__(file_id, name, parent_id)
529
def kind_character(self):
530
"""See InventoryEntry.kind_character."""
533
def _put_in_tar(self, item, tree):
534
"""See InventoryEntry._put_in_tar."""
535
item.type = tarfile.REGTYPE
536
fileobj = tree.get_file(self.file_id)
537
item.size = self.text_size
538
if tree.is_executable(self.file_id):
544
def _put_on_disk(self, fullpath, tree):
    """See InventoryEntry._put_on_disk.

    Copies the content of this file from tree to fullpath, then marks the
    result executable (rwxr-xr-x) if tree reports the file as executable.
    """
    import stat

    # Fetch the source first so that a failing lookup does not leave an
    # empty destination file behind.
    source = tree.get_file(self.file_id)
    target = open(fullpath, 'wb')
    try:
        pumpfile(source, target)
    finally:
        # Always release the handle; data is flushed before any chmod.
        target.close()
    if tree.is_executable(self.file_id):
        # Equivalent to octal mode 755.
        os.chmod(fullpath,
                 stat.S_IRWXU
                 | stat.S_IRGRP | stat.S_IXGRP
                 | stat.S_IROTH | stat.S_IXOTH)
550
def _read_tree_state(self, work_tree):
551
"""See InventoryEntry._read_tree_state."""
552
self.text_sha1 = work_tree.get_file_sha1(self.file_id)
553
self.executable = work_tree.is_executable(self.file_id)
555
def _snapshot_text(self, file_parents, work_tree, weave_store, transaction):
556
"""See InventoryEntry._snapshot_text."""
557
mutter('storing file {%s} in revision {%s}',
558
self.file_id, self.revision)
559
# special case to avoid diffing on renames or
561
if (len(file_parents) == 1
562
and self.text_sha1 == file_parents.values()[0].text_sha1
563
and self.text_size == file_parents.values()[0].text_size):
564
previous_ie = file_parents.values()[0]
565
weave_store.add_identical_text(
566
self.file_id, previous_ie.revision,
567
self.revision, file_parents, transaction)
569
new_lines = work_tree.get_file(self.file_id).readlines()
570
self._add_text_to_weave(new_lines, file_parents, weave_store,
572
self.text_sha1 = sha_strings(new_lines)
573
self.text_size = sum(map(len, new_lines))
576
def _unchanged(self, previous_ie):
577
"""See InventoryEntry._unchanged."""
578
compatible = super(InventoryFile, self)._unchanged(previous_ie)
579
if self.text_sha1 != previous_ie.text_sha1:
582
# FIXME: 20050930 probe for the text size when getting sha1
583
# in _read_tree_state
584
self.text_size = previous_ie.text_size
585
if self.executable != previous_ie.executable:
590
class InventoryLink(InventoryEntry):
591
"""A symbolic link in an inventory."""
593
__slots__ = ['symlink_target']
595
def _check(self, checker, rev_id, tree):
596
"""See InventoryEntry._check"""
597
if self.text_sha1 != None or self.text_size != None or self.text_id != None:
598
raise BzrCheckError('symlink {%s} has text in revision {%s}'
599
% (self.file_id, rev_id))
600
if self.symlink_target == None:
601
raise BzrCheckError('symlink {%s} has no target in revision {%s}'
602
% (self.file_id, rev_id))
605
other = InventoryLink(self.file_id, self.name, self.parent_id)
606
other.symlink_target = self.symlink_target
607
other.revision = self.revision
610
def detect_changes(self, old_entry):
611
"""See InventoryEntry.detect_changes."""
612
# FIXME: which _modified field should we use ? RBC 20051003
613
text_modified = (self.symlink_target != old_entry.symlink_target)
615
mutter(" symlink target changed")
616
meta_modified = False
617
return text_modified, meta_modified
619
def _diff(self, text_diff, from_label, tree, to_label, to_entry, to_tree,
620
output_to, reverse=False):
621
"""See InventoryEntry._diff."""
622
from_text = self.symlink_target
623
if to_entry is not None:
624
to_text = to_entry.symlink_target
629
print >>output_to, '=== target changed %r => %r' % (from_text, to_text)
632
print >>output_to, '=== target was %r' % self.symlink_target
634
print >>output_to, '=== target is %r' % self.symlink_target
636
def __init__(self, file_id, name, parent_id):
    """Create a symlink entry; see InventoryEntry.__init__ for arguments.

    The base initialiser is run first, then kind is fixed to 'symlink'.
    """
    super(InventoryLink, self).__init__(file_id, name, parent_id)
    self.kind = 'symlink'
640
def kind_character(self):
641
"""See InventoryEntry.kind_character."""
644
def _put_in_tar(self, item, tree):
645
"""See InventoryEntry._put_in_tar."""
646
iterm.type = tarfile.SYMTYPE
650
item.linkname = self.symlink_target
653
def _put_on_disk(self, fullpath, tree):
654
"""See InventoryEntry._put_on_disk."""
656
os.symlink(self.symlink_target, fullpath)
658
raise BzrError("Failed to create symlink %r -> %r, error: %s" % (fullpath, self.symlink_target, e))
660
def _read_tree_state(self, work_tree):
661
"""See InventoryEntry._read_tree_state."""
662
self.symlink_target = work_tree.get_symlink_target(self.file_id)
664
def _unchanged(self, previous_ie):
665
"""See InventoryEntry._unchanged."""
666
compatible = super(InventoryLink, self)._unchanged(previous_ie)
667
if self.symlink_target != previous_ie.symlink_target:
250
672
class Inventory(object):
251
673
"""Inventory of versioned files in a tree.